diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml
new file mode 100644
index 00000000..ab8d24d6
--- /dev/null
+++ b/.github/workflows/release.yml
@@ -0,0 +1,204 @@
+name: Release
+
+on:
+  push:
+    tags:
+      - "v*"
+    branches:
+      - nightly
+  workflow_dispatch:
+
+jobs:
+  ci-gate:
+    name: Wait for CI to pass on this ref
+    runs-on: ubuntu-latest
+    env:
+      GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+
+      - name: Wait for CI workflow conclusion on ${{ github.sha }}
+        run: |
+          set -euo pipefail
+          # Poll up to 60 minutes for the matching CI run on this SHA.
+          for i in $(seq 1 120); do
+            json="$(gh run list --workflow CI --commit "${GITHUB_SHA}" --limit 1 --json status,conclusion 2>/dev/null || echo '[]')"
+            count="$(echo "${json}" | jq 'length')"
+            if [ "${count}" -eq 0 ]; then
+              echo "[${i}/120] No CI run yet for ${GITHUB_SHA}"
+              sleep 30
+              continue
+            fi
+            status="$(echo "${json}" | jq -r '.[0].status')"
+            conclusion="$(echo "${json}" | jq -r '.[0].conclusion')"
+            if [ "${status}" = "completed" ]; then
+              if [ "${conclusion}" = "success" ]; then
+                echo "CI succeeded for ${GITHUB_SHA}."
+                exit 0
+              fi
+              echo "CI for ${GITHUB_SHA} completed with conclusion: ${conclusion}"
+              exit 1
+            fi
+            echo "[${i}/120] CI status=${status}"
+            sleep 30
+          done
+          echo "Timed out waiting for CI on ${GITHUB_SHA}."
+          exit 1
+
+  build:
+    name: Build ${{ matrix.os }}-${{ matrix.arch }}
+    needs: ci-gate
+    runs-on: ubuntu-latest
+    strategy:
+      fail-fast: true
+      matrix:
+        include:
+          - target: bun-darwin-arm64
+            os: darwin
+            arch: arm64
+          - target: bun-darwin-x64
+            os: darwin
+            arch: x64
+          - target: bun-linux-x64
+            os: linux
+            arch: x64
+          - target: bun-linux-arm64
+            os: linux
+            arch: arm64
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+
+      - name: Setup Node
+        uses: actions/setup-node@v4
+        with:
+          node-version: "20"
+          cache: npm
+
+      - name: Setup Bun
+        uses: oven-sh/setup-bun@v2
+
+      - name: Install dependencies
+        run: npm ci
+
+      - name: Build TypeScript + embed assets
+        run: npm run build
+
+      - name: Cross-compile standalone binary for ${{ matrix.target }}
+        run: |
+          set -euo pipefail
+          bun build --compile --target=${{ matrix.target }} ./src/cli.ts --outfile "jaiph-${{ matrix.os }}-${{ matrix.arch }}"
+          ls -la "jaiph-${{ matrix.os }}-${{ matrix.arch }}"
+
+      - name: Upload binary artifact
+        uses: actions/upload-artifact@v4
+        with:
+          name: jaiph-${{ matrix.os }}-${{ matrix.arch }}
+          path: jaiph-${{ matrix.os }}-${{ matrix.arch }}
+          if-no-files-found: error
+          retention-days: 7
+
+  release:
+    name: Publish release assets
+    needs: build
+    runs-on: ubuntu-latest
+    permissions:
+      contents: write
+    env:
+      GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+
+      - name: Resolve tag and channel
+        id: meta
+        run: |
+          set -euo pipefail
+          case "${GITHUB_REF}" in
+            refs/tags/v*)
+              tag="${GITHUB_REF_NAME}"; channel="stable" ;;
+            refs/heads/nightly|refs/tags/nightly)
+              tag="nightly"; channel="nightly" ;;
+            *)
+              echo "Unsupported ref for release: ${GITHUB_REF}" >&2; exit 1 ;;
+          esac
+          echo "tag=${tag}" >> "${GITHUB_OUTPUT}"
+          echo "channel=${channel}" >> "${GITHUB_OUTPUT}"
+
+      - name: Download binary artifacts
+        uses: actions/download-artifact@v4
+        with:
+          path: release-assets
+          merge-multiple: true
+
+      - name: Generate SHA256SUMS
+        working-directory: release-assets
+        run: |
+          set -euo pipefail
+          ls -la
+          rm -f SHA256SUMS
+          sha256sum jaiph-darwin-arm64 jaiph-darwin-x64 jaiph-linux-x64 jaiph-linux-arm64 > SHA256SUMS
+          cat SHA256SUMS
+
+      - name: Sanity gate (linux-x64 --version)
+        working-directory: release-assets
+        run: |
+          set -euo pipefail
+          chmod +x jaiph-linux-x64
+          got="$(./jaiph-linux-x64 --version)"
+          echo "got: ${got}"
+          if [ "${{ steps.meta.outputs.channel }}" = "stable" ]; then
+            tag="${{ steps.meta.outputs.tag }}"
+            expected="jaiph ${tag#v}"
+            if [ "${got}" != "${expected}" ]; then
+              echo "Version sanity check failed: expected '${expected}', got '${got}'" >&2
+              exit 1
+            fi
+          else
+            if ! printf '%s\n' "${got}" | grep -Eq '^jaiph [0-9]+\.[0-9]+\.[0-9]+'; then
+              echo "Version sanity check failed: '${got}' does not look like a jaiph version" >&2
+              exit 1
+            fi
+          fi
+
+      - name: Publish stable release ${{ steps.meta.outputs.tag }}
+        if: steps.meta.outputs.channel == 'stable'
+        working-directory: release-assets
+        run: |
+          set -euo pipefail
+          tag="${{ steps.meta.outputs.tag }}"
+          if gh release view "${tag}" >/dev/null 2>&1; then
+            gh release upload "${tag}" --clobber \
+              jaiph-darwin-arm64 jaiph-darwin-x64 \
+              jaiph-linux-x64 jaiph-linux-arm64 \
+              SHA256SUMS
+          else
+            gh release create "${tag}" \
+              --title "${tag}" \
+              --notes "Jaiph ${tag} — standalone binaries (darwin/linux × arm64/x64) plus SHA256SUMS." \
+              jaiph-darwin-arm64 jaiph-darwin-x64 \
+              jaiph-linux-x64 jaiph-linux-arm64 \
+              SHA256SUMS
+          fi
+
+      - name: Publish nightly prerelease
+        if: steps.meta.outputs.channel == 'nightly'
+        working-directory: release-assets
+        run: |
+          set -euo pipefail
+          if gh release view nightly >/dev/null 2>&1; then
+            gh release upload nightly --clobber \
+              jaiph-darwin-arm64 jaiph-darwin-x64 \
+              jaiph-linux-x64 jaiph-linux-arm64 \
+              SHA256SUMS
+          else
+            gh release create nightly \
+              --title "Nightly" \
+              --notes "Rolling nightly prerelease — standalone binaries built from the latest \`nightly\` branch." \
+              --prerelease \
+              --target "${GITHUB_SHA}" \
+              jaiph-darwin-arm64 jaiph-darwin-x64 \
+              jaiph-linux-x64 jaiph-linux-arm64 \
+              SHA256SUMS
+          fi
diff --git a/.gitignore b/.gitignore
index b15d9eec..0b049cf9 100644
--- a/.gitignore
+++ b/.gitignore
@@ -9,6 +9,10 @@ docs/.bundle/
 dist/
 .tmp/
 
+# Generated by tools/embed-assets.js from package.json's `version` field, so
+# the CLI version lives in only one place in tree (package.json).
+src/version.ts
+
 # logs
 *.log
 npm-debug.log*
diff --git a/.jaiph/architect_review.jh b/.jaiph/architect_review.jh
index 22fa919b..552663cd 100755
--- a/.jaiph/architect_review.jh
+++ b/.jaiph/architect_review.jh
@@ -1,6 +1,7 @@
 #!/usr/bin/env jaiph
 
 import "jaiphlang/queue" as queue
+import "./lib_common.jh" as common
 
 config {
   agent.backend = "cursor"
@@ -10,29 +11,8 @@ config {
   # agent.claude_flags = "--permission-mode bypassPermissions"
 }
 
-script first_line_str = `printf '%s\n' "$1" | head -n 1`
-
-script rest_lines_str = `printf '%s\n' "$1" | tail -n +2`
-
-script arg_nonempty = `[ -n "$1" ]`
-
-script str_equals = `[ "$1" = "$2" ]`
-
-script mkdir_p_simple = `mkdir -p "$1"`
-
-script jaiph_tmp_dir = `printf '%s\n' "$JAIPH_WORKSPACE/.jaiph/tmp"`
-
 script jaiph_review_body_file = `printf '%s\n' "$JAIPH_WORKSPACE/.jaiph/tmp/architect_review_body.txt"`
 
-# Writes UTF-8 text to a path (path, then content).
-script save_string_to_file = ```python3
-import sys
-if len(sys.argv) < 3:
-    sys.exit(2)
-path, content = sys.argv[1], sys.argv[2]
-open(path, "w", encoding="utf-8").write(content)
-```
-
 # Packed as: first line = verdict, rest = updated_description (must stay top-level:
 # const … = prompt """…""" is not supported inside ensure … catch — see parseRecoverStatement).
 workflow architect_agent_review(task) {
@@ -93,31 +73,31 @@ workflow architect_agent_review(task) {
 }
 
 workflow review_one_header(header) {
-  run arg_nonempty(header) catch (err) {
+  run common.arg_nonempty(header) catch (err) {
     return ""
   }
   const task = run queue.get_task_by_header(header)
   ensure queue.task_is_dev_ready(task) catch (err) {
     const packed = run architect_agent_review(task)
-    const verdict = run first_line_str(packed)
-    const updated_description = run rest_lines_str(packed)
+    const verdict = run common.first_line_str(packed)
+    const updated_description = run common.rest_lines_str(packed)
     const body_file = run jaiph_review_body_file()
-    run mkdir_p_simple(run jaiph_tmp_dir())
-    run str_equals(verdict, "dev-ready") catch (err) {
-      run arg_nonempty(updated_description) catch (err) {
+    run common.mkdir_p_simple(run common.jaiph_tmp_dir())
+    run common.str_equals(verdict, "dev-ready") catch (err) {
+      run common.arg_nonempty(updated_description) catch (err) {
         fail "needs-work requires a non-empty updated_description (questions for the author)."
       }
-      run save_string_to_file(body_file, updated_description)
+      run common.save_string_to_file(body_file, updated_description)
       run queue.set_task_description_from_file(header, body_file)
       log "Needs work (description updated): ${header}"
       return ""
     }
-    run arg_nonempty(updated_description) catch (err) {
+    run common.arg_nonempty(updated_description) catch (err) {
       run queue.mark_task_dev_ready(header)
       log "Marked dev-ready: ${header}"
       return ""
     }
-    run save_string_to_file(body_file, updated_description)
+    run common.save_string_to_file(body_file, updated_description)
     run queue.set_task_description_from_file(header, body_file)
     run queue.mark_task_dev_ready(header)
     log "Marked dev-ready: ${header}"
@@ -128,16 +108,16 @@ workflow review_one_header(header) {
 
 workflow process_headers_recursive(header, remaining) {
   run review_one_header(header)
-  run arg_nonempty(remaining) catch (err) {
+  run common.arg_nonempty(remaining) catch (err) {
     return ""
   }
-  const next = run first_line_str(remaining)
-  const rest = run rest_lines_str(remaining)
+  const next = run common.first_line_str(remaining)
+  const rest = run common.rest_lines_str(remaining)
   run process_headers_recursive(next, rest)
 }
 
 workflow maybe_process_headers(first, rest) {
-  run arg_nonempty(first) catch (err) {
+  run common.arg_nonempty(first) catch (err) {
     return ""
   }
   run process_headers_recursive(first, rest)
@@ -145,8 +125,8 @@ workflow maybe_process_headers(first, rest) {
 
 workflow default() {
   const headers = run queue.get_all_task_headers()
-  const first = run first_line_str(headers)
-  const rest = run rest_lines_str(headers)
+  const first = run common.first_line_str(headers)
+  const rest = run common.rest_lines_str(headers)
   run maybe_process_headers(first, rest)
   ensure queue.all_dev_ready() catch (err) {
     fail "One or more tasks need work. Review the agent output above."
diff --git a/.jaiph/docs_parity.jh b/.jaiph/docs_parity.jh
index 30bf62cc..143911e6 100755
--- a/.jaiph/docs_parity.jh
+++ b/.jaiph/docs_parity.jh
@@ -1,22 +1,16 @@
 #!/usr/bin/env jaiph
 
 const role = """
-  You are an expert technical writer for this project.
-  1. You are fluent in Markdown and can read TypeScript code and Bash
-  2. You write for a developer audience, focusing on clarity and practical
-     examples.
-  3. You are concise, specific, and value dense
-  4. Write so that a new developer to this codebase can understand your
-     writing, but don't assume your audience are experts in the topic/area you
-     are writing about.
-  5. You are good in formulating generic context and describing the problem
-     starting from the generic part, leaving the specific details for the
-     last step, once the audience is aware of the generic context and the
-     problem.
-  6. You write problem explanation and goals in a human approachable way,
-     while keeping details dense in separate sections, so both human and AI
-  7. Source code and docs/architecture.md are the single source of truth. You don't
-     trust the existing documentation blindly.
+  Project-specific context for documenting Jaiph:
+  - You read TypeScript and Bash fluently so you can verify documentation
+    against the implementation.
+  - Source code and docs/architecture.md are the single source of truth.
+    Do not trust existing documentation blindly; verify claims against the
+    code before reproducing them.
+  - Navigation links between docs pages are provided by the Jekyll template
+    (docs/_layouts/docs.html). Do not add manual navigation blocks (e.g.
+    "More Documentation" sections) to individual markdown pages — inline
+    contextual links to other docs are fine.
 """
 
 script assert_newline_paths_are_files = ```
@@ -100,6 +94,11 @@ script build_allowed_paths_block = ```
 
 workflow update_from_task(taskDesc) {
   prompt """
+    Before doing anything else, read and follow the documentation skill at
+    .jaiph/skills/documentation-writer/SKILL.md. It defines the Diátaxis
+    framework, the four document types, the clarify -> outline -> write
+    workflow, and the four guiding principles (clarity, accuracy,
+    user-centricity, consistency) you must apply to this task.
     <role>
     ${role}
     </role>
@@ -123,6 +122,11 @@ workflow update_from_task(taskDesc) {
 
 workflow docs_page(path) {
   prompt """
+    Before doing anything else, read and follow the documentation skill at
+    .jaiph/skills/documentation-writer/SKILL.md. It defines the Diátaxis
+    framework, the four document types, the clarify -> outline -> write
+    workflow, and the four guiding principles (clarity, accuracy,
+    user-centricity, consistency) you must apply to this task.
     <role>
     ${role}
     </role>
@@ -149,11 +153,16 @@ workflow docs_page(path) {
        individual markdown pages. Inline contextual links to other docs are
        fine.
     </task>
-"""
+  """
 }
 
 workflow docs_overview(docPaths) {
   prompt """
+    Before doing anything else, read and follow the documentation skill at
+    .jaiph/skills/documentation-writer/SKILL.md. It defines the Diátaxis
+    framework, the four document types, the clarify -> outline -> write
+    workflow, and the four guiding principles (clarity, accuracy,
+    user-centricity, consistency) you must apply to this task.
     <role>
     ${role}
     </role>
@@ -197,7 +206,7 @@ workflow docs_overview(docPaths) {
     10.Ensure src/cli/shared/usage.ts is up to date with the latest CLI commands
        and options. It should be a single source of truth for the CLI usage.
     </task>
-"""
+  """
 }
 
 workflow default() {
diff --git a/.jaiph/docs_parity_redesign.jh b/.jaiph/docs_parity_redesign.jh
new file mode 100755
index 00000000..42df461a
--- /dev/null
+++ b/.jaiph/docs_parity_redesign.jh
@@ -0,0 +1,202 @@
+#!/usr/bin/env jaiph
+
+# Redesign-aware variant of docs_parity.jh, meant to be run BY HAND after the
+# Diátaxis docs redesign (QUEUE.md "Docs redesign" tasks 1-7) has landed.
+#
+# Differences from docs_parity.jh:
+#   - Lists docs recursively and EXCLUDES docs/_legacy/ (the build-excluded
+#     quarantine of the pre-redesign pages). The stock workflow globs only the
+#     flat docs/*.md and would both miss nested pages and risk touching legacy.
+#   - The overview pass VERIFIES and tightens the new Diátaxis structure against
+#     the source code; it does NOT merge / split / move / re-quadrant pages the
+#     way the stock docs_overview does (that would undo the redesign).
+#   - Docs-only: it never edits src/ or usage.ts.
+#
+# Run on a clean worktree:  jaiph run .jaiph/docs_parity_redesign.jh
+
+const role = """
+  Project-specific context for documenting Jaiph:
+  - You read TypeScript and Bash fluently so you can verify documentation
+    against the implementation.
+  - Source code and docs/architecture.md are the single source of truth.
+    Do not trust existing documentation blindly; verify claims against the
+    code before reproducing them.
+  - Navigation links between docs pages are provided by the Jekyll template
+    (docs/_layouts/docs.html). Do not add manual navigation blocks (e.g.
+    "More Documentation" sections) to individual markdown pages — inline
+    contextual links to other docs are fine.
+  - docs/_legacy/ is a build-excluded quarantine of the OLD documentation.
+    Never read it as a source, never edit it, never resurrect its pages.
+"""
+
+script assert_worktree_clean_for_docs = ```
+  local current_changed_files
+  current_changed_files="$(
+    {
+      git diff --name-only --cached
+      git diff --name-only
+      git ls-files --others --exclude-standard
+    } | sort -u
+  )"
+  if [ -n "$current_changed_files" ]; then
+    echo "Refusing to run docs parity workflow on a dirty worktree." >&2
+    echo "Please commit, stash, or discard these files first:" >&2
+    echo "$current_changed_files" >&2
+    return 1
+  fi
+```
+
+rule worktree_is_clean() {
+  run assert_worktree_clean_for_docs()
+}
+
+script assert_newline_paths_are_files = ```
+  while IFS= read -r f; do
+    f="${f#"${f%%[![:space:]]*}"}"
+    f="${f%"${f##*[![:space:]]}"}"
+    [ -z "$f" ] && continue
+    test -f "$f" || return 1
+  done <<< "$1"
+```
+
+rule docs_files_present(list) {
+  run assert_newline_paths_are_files(list)
+}
+
+# Pattern-based allowlist (not a frozen snapshot): permit the doc entry points
+# and ANY docs/**/*.md page — so pages the prompt legitimately CREATES still
+# pass — while rejecting source, tests, .jaiph/, scratch files, and the
+# quarantine / vendored / generated trees.
+script assert_only_allowed_changed = ```
+  local after_changed_files
+  after_changed_files="$(
+    {
+      git diff --name-only --cached
+      git diff --name-only
+      git ls-files --others --exclude-standard
+    } | sort -u
+  )"
+  while IFS= read -r changed_file; do
+    [ -z "$changed_file" ] && continue
+    case "$changed_file" in
+      README.md|CHANGELOG.md|docs/index.html|docs/_layouts/docs.html|docs/_config.yml)
+        continue ;;
+    esac
+    if printf '%s\n' "$changed_file" | grep -qE '^docs/.*\.md$' \
+       && ! printf '%s\n' "$changed_file" | grep -qE '(^|/)docs/(_legacy|vendor|_site)/'; then
+      continue
+    fi
+    echo "Unexpected file changed by docs prompt: $changed_file" >&2
+    return 1
+  done <<< "$after_changed_files"
+```
+
+rule only_expected_docs_changed_after_prompt() {
+  run assert_only_allowed_changed()
+}
+
+# Recursive list of published docs pages, excluding quarantine, Jekyll output,
+# and Bundler's docs/vendor/ tree. BSD/macOS find treats * in -path as not
+# crossing '/', so prune -path 'docs/vendor/*' misses nested gem READMEs; use
+# grep instead of case (POSIX case patterns do not let * match '/' either).
+script list_docs_md_paths = ```
+  find docs -type f -name '*.md' -print \
+    | grep -vE '(^|/)docs/(_legacy|vendor|_site)/' \
+    | sort
+```
+
+# Files the parity prompts are permitted to change (docs only — never src).
+script build_allowed_paths_block = ```
+  {
+    printf '%s\n' README.md CHANGELOG.md docs/index.html docs/_layouts/docs.html docs/_config.yml
+    find docs -type f -name '*.md' -print \
+      | grep -vE '(^|/)docs/(_legacy|vendor|_site)/'
+  } | sort -u
+```
+
+workflow docs_page(path) {
+  prompt """
+    Before doing anything else, read and follow the documentation skill at
+    .jaiph/skills/documentation-writer/SKILL.md. It defines the Diátaxis
+    framework, the four document types, the clarify -> outline -> write
+    workflow, and the four guiding principles (clarity, accuracy,
+    user-centricity, consistency) you must apply to this task.
+    <role>
+    ${role}
+    </role>
+    <task>
+    Verify ${path} against the Jaiph source code (the single source of truth)
+    and docs/architecture.md.
+    0. This page belongs to a fixed Diátaxis quadrant declared in its
+       `diataxis:` front matter (tutorial / how-to / reference / explanation /
+       contributor). KEEP that type. Do NOT move content to or from other pages,
+       do NOT change the permalink, do NOT merge or split the page.
+    1. Verify every factual claim, example, flag, config key, env var, and error
+       code against the source. Fix drift in the page to match the code.
+    2. Repair cross-type bleed WITHIN the page only (e.g. delete a tutorial-style
+       walkthrough that crept into a reference page) — relocating it is out of
+       scope for this pass.
+    3. Keep examples executable and aligned with current behavior. Keep prose
+       approachable, concise, and free of AI-like filler and excess emojis.
+    4. Inline contextual links to other docs are fine; do NOT add manual
+       navigation blocks. Never touch docs/_legacy/.
+    5. Edit ONLY this documentation page. Never edit source, tests
+       (*.test.ts), config, or anything under .jaiph/, and never create helper
+       or scratch scripts (e.g. *.mjs, *.sh) — make every change directly in
+       the documentation file.
+    </task>
+  """
+}
+
+workflow docs_redesign_overview(docPaths) {
+  prompt """
+    Before doing anything else, read and follow the documentation skill at
+    .jaiph/skills/documentation-writer/SKILL.md (Diátaxis: tutorials, how-to,
+    reference, explanation).
+    <role>
+    ${role}
+    </role>
+    <task>
+    The docs were DELIBERATELY restructured into Diátaxis quadrants. Your job is
+    to VERIFY and tighten that structure — NOT to reorganize it. Read all
+    ${docPaths} (these already exclude docs/_legacy/). Treat docs/architecture.md
+    as the architecture source of truth.
+
+    PRESERVE the structure. Do NOT merge, split, move, rename, or re-quadrant
+    pages; do NOT change permalinks; do NOT restructure the nav in
+    docs/_layouts/docs.html beyond fixing an outright error. Specifically:
+    1. Cross-page consistency: terminology, tone, and overlapping facts agree
+       across pages, and every page is consistent with docs/architecture.md
+       (runtime vs CLI responsibilities, __JAIPH_EVENT__ vs run artifacts,
+       channels/hooks, the jaiph test lane).
+    2. Each page stays within its `diataxis:` type; flag (do not relocate)
+       any remaining cross-type bleed.
+    3. Reference pages (cli, configuration, grammar, language, env-vars) match
+       the source exactly — every flag, key, env var, error code. Fix the docs.
+    4. README.md and docs/index.html lead with the tutorials / how-to entry
+       points and link to getting-started (or the first tutorial) and the agent
+       skill URL, hardcoded as
+       https://raw.githubusercontent.com/jaiphlang/jaiph/refs/heads/main/docs/jaiph-skill.md.
+       Markdown-to-markdown links end with .md; index.html links do not.
+    5. Edit documentation files ONLY (docs/**/*.md, README.md, CHANGELOG.md,
+       docs/index.html, docs/_layouts/docs.html, docs/_config.yml). Never edit
+       src/, tests (*.test.ts), or anything under .jaiph/, and never create
+       helper or scratch scripts (e.g. *.mjs, *.sh) — make every change
+       directly in the documentation files. Never touch docs/_legacy/.
+    </task>
+  """
+}
+
+workflow default() {
+  ensure worktree_is_clean()
+  const allowed_list = run build_allowed_paths_block()
+  ensure docs_files_present(allowed_list)
+  const docs_md_list = run list_docs_md_paths()
+  for path in docs_md_list {
+    if path != "" {
+      run docs_page(path)
+    }
+  }
+  run docs_redesign_overview(docs_md_list)
+  ensure only_expected_docs_changed_after_prompt()
+}
diff --git a/.jaiph/engineer.jh b/.jaiph/engineer.jh
index e2dc4c11..96280304 100755
--- a/.jaiph/engineer.jh
+++ b/.jaiph/engineer.jh
@@ -4,11 +4,12 @@
 # Picks the first pending task from QUEUE.md, implements it, verifies CI,
 # updates docs, removes from queue, and publishes a workspace patch artifact.
 #
-import "jaiphlang/queue" as queue
 import "jaiphlang/artifacts" as artifacts
+import "jaiphlang/git" as git
+import "jaiphlang/queue" as queue
 import "./docs_parity.jh" as docs
 import "./ensure_ci_passes.jh" as ci
-import "jaiphlang/git" as git
+import "./lib_common.jh" as common
 
 config {
   # agent.backend = "cursor"
@@ -18,6 +19,30 @@ config {
   agent.claude_flags = "--permission-mode bypassPermissions"
 }
 
+const no_nested_orchestration = "Never invoke orchestration workflows (.jaiph/*.jh) or launch nested agent sessions"
+
+const safety_constraints = """
+  Hard safety constraint (non-negotiable):
+  - NEVER invoke Jaiph workflows from the .jaiph directory.
+  - Forbidden examples: jaiph .jaiph/engineer.jh, jaiph run .jaiph/engineer.jh,
+    jaiph .jaiph/docs_parity.jh, or any jaiph command targeting .jaiph/*.jh.
+  - Treat .jaiph/*.jh as orchestration-only workflows that must not be called
+    from inside this implementation prompt.
+  - NEVER launch a nested Claude/Cursor agent session from inside this workflow.
+    Nested sessions share runtime resources and can crash active sessions.
+  - Do not attempt to bypass nested-session guards (for example by unsetting
+    environment variables such as CLAUDECODE).
+  - Any violation of these constraints is an immediate task failure; stop and report.
+"""
+
+const definition_of_done = """
+  Definition of done (QUEUE.md rule 7, verbatim):
+  "Acceptance criteria are non-negotiable. A task is not done until every
+  acceptance bullet is verified by a test that fails when the contract is
+  violated. 'It works on my machine' or 'the existing tests pass' is not
+  acceptance."
+"""
+
 const code_philosophy = """
   This codebase is maintained by both humans and AI agents. All code you write
   must follow these principles strictly:
@@ -71,7 +96,7 @@ const role_surgical = """
   * Default to touching as few files as possible
   * Do NOT redesign surrounding architecture
   * Do NOT add abstractions unless clearly required by acceptance criteria
-  * Never invoke orchestration workflows (.jaiph/*.jh) or launch nested agent sessions
+  * ${no_nested_orchestration}
 """
 
 const role_reductionist = """
@@ -91,7 +116,7 @@ const role_reductionist = """
   * Actively remove dead code, duplicate branches, and unnecessary indirection
   * Prefer net-negative or near-neutral code growth when feasible
   * If adding code is unavoidable, justify why deletion/simplification was insufficient
-  * Never invoke orchestration workflows (.jaiph/*.jh) or launch nested agent sessions
+  * ${no_nested_orchestration}
 """
 
 const role_optimizer = """
@@ -110,7 +135,7 @@ const role_optimizer = """
   * Every structural change must have a concrete before/after justification
   * Do NOT rework areas outside the task's scope, even if they look improvable
   * Avoid speculative complexity that does not produce measurable benefit
-  * Never invoke orchestration workflows (.jaiph/*.jh) or launch nested agent sessions
+  * ${no_nested_orchestration}
 """
 
 const role_stabilizer = """
@@ -130,7 +155,7 @@ const role_stabilizer = """
   * Add or improve tests for risky paths and boundary conditions
   * Keep implementation simple, defensive, and observable
   * Avoid structural rewrites unless strictly required to satisfy acceptance criteria
-  * Never invoke orchestration workflows (.jaiph/*.jh) or launch nested agent sessions
+  * ${no_nested_orchestration}
 """
 
 const classification_prompt = """
@@ -167,8 +192,6 @@ workflow select_role(role_name) {
   }
 }
 
-script arg_nonempty = `[ -n "${1:-}" ]`
-
 script task_text_has_header = `printf '%s\n' "$1" | grep -q '^## '`
 
 script first_line_task = ```
@@ -191,7 +214,17 @@ workflow classify_role(task) {
   """
   returns "{ role: string }"
 
-  return result.role
+  # Normalize the free-text classifier answer (case, extra words like
+  # "surgical engineer") to a canonical role name before select_role.
+  const role_raw = "${result.role}"
+  const role_lc = run common.to_lower(role_raw)
+  return match role_lc {
+    /surgical/ => "surgical"
+    /reduction/ => "reductionist"
+    /optimi/ => "optimizer"
+    /stabili/ => "stabilizer"
+    _ => fail "Classifier returned unrecognized role: ${role_lc}"
+  }
 }
 
 workflow implement(task, role_name) {
@@ -224,23 +257,14 @@ workflow implement(task, role_name) {
       before continuing.
     - Ensuring all acceptance criteria in the task are met.
 
+    ${definition_of_done}
+
     Tests and validation:
     - Unit/integration: npm test
     - End-to-end: npm run test:e2e
     - Build check: npm run build
 
-    Hard safety constraint (non-negotiable):
-    - NEVER invoke Jaiph workflows from the .jaiph directory.
-    - Forbidden examples: jaiph .jaiph/engineer.jh, jaiph run .jaiph/engineer.jh,
-      jaiph .jaiph/main.jh, jaiph .jaiph/docs_parity.jh, or any jaiph command
-      targeting .jaiph/*.jh.
-    - Treat .jaiph/*.jh as orchestration-only workflows that must not be called
-      from inside this implementation prompt.
-    - NEVER launch a nested Claude/Cursor agent session from inside this workflow.
-      Nested sessions share runtime resources and can crash active sessions.
-    - Do not attempt to bypass nested-session guards (for example by unsetting
-      environment variables such as CLAUDECODE).
-    - Any violation of these constraints is an immediate task failure; stop and report.
+    ${safety_constraints}
 
     Test stability policy:
     - e2e/tests/* and acceptance JS tests are behavior contracts and should be
diff --git a/.jaiph/ensure_ci_passes.jh b/.jaiph/ensure_ci_passes.jh
index 5165d227..21765b68 100755
--- a/.jaiph/ensure_ci_passes.jh
+++ b/.jaiph/ensure_ci_passes.jh
@@ -1,18 +1,14 @@
 #!/usr/bin/env jaiph
 
+import "./lib_common.jh" as common
+
 config {
   agent.backend = "cursor"
   agent.cursor_flags = "--force"
 }
 
-rule ci_passes() {
-  run npm_run_test_ci()
-}
-
 script npm_run_test_ci = `npm run test:ci`
 
-script save_string_to_file = `echo "$1" > "$2"`
-
 script assert_nonempty_file_or_fail = ```
 test -s "$1" || {
   echo "jaiph: ci failure log is empty at $1" >&2
@@ -23,42 +19,37 @@ test -s "$1" || {
 workflow ensure_ci_passes() {
   const ci_log_dir = ".jaiph/tmp"
   const ci_log_file = "${ci_log_dir}/ensure_ci_passes.last.log"
-  run mkdir_p_simple(ci_log_dir)
+  run common.mkdir_p_simple(ci_log_dir)
 
-  ensure ci_passes() catch (failure) {
-    run save_string_to_file(failure, ci_log_file)
+  # recover = repair-and-retry loop: run the CI script, on failure save the
+  # log and prompt for a fix, then retry — bounded by run.recover_limit
+  # (default 10) instead of unbounded workflow recursion.
+  run npm_run_test_ci() recover (failure) {
+    run common.save_string_to_file(ci_log_file, failure)
     run assert_nonempty_file_or_fail(ci_log_file)
-
     prompt """
       <role>
         You are a software engineer fixing a failing CI build.
       </role>
       <task>
-        Fix failing CI so npm run test:ci passes. Failure output was saved to: 
-        ${ci_log_file}. Start by inspecting the tail of the log (for example: 
-        tail -n 200 '${ci_log_file}') and then apply the smallest safe fix. 
-        Constraints: - e2e/tests/* and acceptance JS tests are behavior 
+        Fix failing CI so npm run test:ci passes. Failure output was saved to:
+        ${ci_log_file}. Start by inspecting the tail of the log (for example:
+        tail -n 200 '${ci_log_file}') and then apply the smallest safe fix.
+        Constraints: - e2e/tests/* and acceptance JS tests are behavior
         contracts.
-        - Default approach: change production code to satisfy existing tests, 
+        - Default approach: change production code to satisfy existing tests,
           not vice versa.
-        - Modify tests only for intentional behavior changes, incorrect 
+        - Modify tests only for intentional behavior changes, incorrect
           expectations, or removal of obsolete features.
         - Any test change must be minimal with a clear rationale.
         - Do NOT add speculative fixes. Fix only what the log shows is broken.
       </task>
     """
-
-    # recursively call this workflow to keep trying until the CI passes
-    run ensure_ci_passes()
   }
 
-  run rm_file_simple(ci_log_file)
+  run common.rm_file_simple(ci_log_file)
 }
 
-script mkdir_p_simple = `mkdir -p "$1"`
-
-script rm_file_simple = `rm -f "$1"`
-
 workflow default() {
   run ensure_ci_passes()
 }
diff --git a/.jaiph/language_redesign_spec.md b/.jaiph/language_redesign_spec.md
deleted file mode 100644
index d33cbb83..00000000
--- a/.jaiph/language_redesign_spec.md
+++ /dev/null
@@ -1,800 +0,0 @@
-# Execution-Boundary Rework Specification
-
-## Core Problem
-
-Jaiph blends declarative orchestration with raw shell in workflows and rules. That blurs side-effect boundaries, blocks runtime portability (Go/Rust), and weakens sandbox control.
-
-Target: one strict boundary. Orchestration constructs orchestrate. A dedicated script construct executes. No exceptions.
-
-## Design Decisions (Locked)
-
-These are not options. Implementation starts from this table.
-
-| # | Decision |
-|---|----------|
-| 1 | Orchestration constructs (`workflow`, `rule`) contain **zero raw shell**. |
-| 2 | Execution construct (`script`) is a **standalone executable** — bash by default, any language via custom shebang. |
-| 3 | Construct name is **`script`** (not `function` or `bash`). |
-| 4 | Variable declarations use **`const`** in orchestration, **`local`** in scripts. |
-| 5 | Rules get **structured keyword parsing** (same model as workflows, restricted subset). |
-| 6 | Every shell operation requires a **named `script`**. No anonymous bash blocks. |
-| 7 | Scripts: **standard exit semantics** (exit code via `return N`/`exit N`, values via stdout). |
-| 8 | Workflows/rules: **`return "value"`** for values, **`fail "reason"`** for explicit failures. |
-| 9 | **One-shot cutover.** No compatibility mode, no deprecation warnings. |
-| 10 | Scripts run in **full isolation** — only positional args, no inherited variables. |
-| 11 | **No script-to-script calls.** Scripts are atomic. Composition happens in orchestration. |
-| 12 | Shared utility code lives in **shared bash libraries** (sourced explicitly in bash scripts), not in Jaiph script cross-calls. |
-| 13 | `if` uses **brace syntax** (`if ... { } else { }`), **`not`** for negation, **`else if`** for chaining. No `then`/`fi`/`elif`. |
-| 14 | Scripts transpile to **separate executable files** with `+x` permission. |
-| 15 | Default shebang is `#!/usr/bin/env bash`. User can provide a custom shebang as the first line of the script body (e.g. `#!/usr/bin/env node`). |
-| 16 | Workflows, rules, and scripts support **named parameters** in declarations. Positional `$1`/`$2` boilerplate is eliminated. |
-
-## Legality Matrix
-
-### `workflow`
-
-| Construct | Allowed | Syntax |
-|-----------|---------|--------|
-| config | Yes | `config { key = "value" }` |
-| const | Yes | `const name = "value"` / `const name = run ref` / `const name = ensure ref` / `const name = prompt "text"` |
-| run | Yes | `run ref [args]` / `run ref [args] &` (async) |
-| ensure | Yes | `ensure ref [args]` / `ensure ref [args] recover { ... }` |
-| prompt | Yes | `prompt "text"` / `const name = prompt "text"` / `const name = prompt "text" returns '{ ... }'` |
-| log | Yes | `log "message"` |
-| logerr | Yes | `logerr "message"` |
-| return | Yes | `return "value"` / `return $var` |
-| fail | Yes | `fail "reason"` |
-| if | Yes | `if [not] ensure ref { ... } [else if ...] [else { ... }]` / `if [not] run ref { ... }` |
-| route | Yes | `channel -> ref1, ref2` |
-| send | Yes | `channel <- "value"` / `channel <- $var` / `channel <- run ref` |
-| wait | Yes | `wait` (waits for async `run` steps) |
-| Raw shell | **No** | Hard parser error with rewrite guidance |
-
-### `rule`
-
-| Construct | Allowed | Syntax |
-|-----------|---------|--------|
-| const | Yes | `const name = "value"` / `const name = run ref` / `const name = ensure ref` (no `prompt` capture) |
-| ensure | Yes | `ensure ref [args]` — other rules only, **no `recover`** |
-| run | Yes | `run ref [args]` — **scripts only**, not workflows |
-| log | Yes | `log "message"` |
-| logerr | Yes | `logerr "message"` |
-| return | Yes | `return "value"` / `return $var` |
-| fail | Yes | `fail "reason"` |
-| if | Yes | `if [not] ensure ref { ... }` / `if [not] run ref { ... }` (run targets scripts only) |
-| prompt | **No** | Rules don't interact with AI |
-| route / send | **No** | Rules don't use channels |
-| async (`&`, `wait`) | **No** | |
-| recover (in `ensure`) | **No** | Not in rule-to-rule calls |
-| Raw shell | **No** | Hard parser error |
-
-### `script`
-
-| Construct | Allowed | Syntax |
-|-----------|---------|--------|
-| Custom shebang | Yes | `#!/usr/bin/env node` (first line of body; omit for default `#!/usr/bin/env bash`) |
-| All body content | Yes | Full language content matching the shebang (bash by default) |
-| Nested bash functions | Yes (bash) | `helper() { ... }` (internal to the script body) |
-| Shared bash via workspace lib dir | **No** | Use `import script`, a sibling module, or inline bash in a `script` block — `JAIPH_LIB` is not provided |
-| `return N` / `exit N` | Yes (bash) | Exit code (integer only) |
-| stdout (`echo`, `printf`) | Yes | Value output mechanism |
-| `local` | Yes (bash) | Bash variable declarations |
-| Other Jaiph script calls | **No** | Scripts are atomic; compose in orchestration |
-| `run`, `ensure`, `prompt` | **No** | Hard parser error (bash scripts only; skipped for custom shebangs) |
-| `return "value"` | **No** | Use `echo` for values, `return 0` for success (bash scripts only) |
-| `fail`, `const`, `log`, `logerr` | **No** | Jaiph keywords, not available in scripts (bash scripts only; skipped for custom shebangs) |
-| Parent scope variables | **No** | Full isolation — only positional args |
-
-**Jaiph keyword guard**: for bash scripts (no shebang or `#!/usr/bin/env bash`), the parser rejects Jaiph-level keywords (`run`, `ensure`, `fail`, `const`, `log`, `logerr`, `prompt`) in the body. For custom shebangs (e.g. `#!/usr/bin/env node`), the guard is skipped — the user owns the body entirely.
-
-## Named Parameters
-
-All constructs support named parameters in their declarations:
-
-```
-workflow implement(task, role_name) { ... }
-rule ensure_is_number(value) { ... }
-script check_hash(file_path, expected_hash) { ... }
-```
-
-**Semantics:**
-
-- Parameters are available as named local variables inside the construct body.
-- For workflows/rules: the transpiler emits `local task="$1"; local role_name="$2"` at the top of the function body.
-- For bash scripts: the transpiler prepends `local file_path="$1"; local expected_hash="$2"` to the script file. For non-bash shebangs, named params are documentary only (the language uses its own argv mechanism).
-- **Optional/default parameters**: `workflow deploy(env, version, dry_run = "false")` transpiles to `local dry_run="${3:-false}"`.
-- Both positional and named calling conventions are valid at call sites:
-  - `run implement "$task" "$role_name"` — positional, mapped by declaration order.
-  - `run implement task="$task" role_name="$role_name"` — named (already partially supported via `parseParamKeysFromArgs`).
-- **Arity validation**: the validator can check call sites against the declaration. `run implement` with zero args when `implement` declares two required params is a validation error.
-- **Parentheses are optional**: `workflow default() { ... }` (no params) remains valid. Constructs with params use `name(params) { ... }`.
-
-## Script Isolation and Transpilation Model
-
-Scripts execute in **full isolation**. They receive only their positional arguments. No inherited variables from the orchestration scope, module-level constants, or other scripts' state.
-
-### Transpilation to separate files
-
-Each `script` block transpiles to a **standalone executable file** in the build output:
-
-```
-build/
-  scripts/
-    check_is_number        # #!/usr/bin/env bash, +x
-    check_json_schema      # #!/usr/bin/env node, +x
-    select_role            # #!/usr/bin/env bash, +x
-  module_name.sh           # orchestration (workflows + rules)
-```
-
-The transpiler:
-1. Extracts each `script` body verbatim
-2. Prepends the shebang (user-provided or default `#!/usr/bin/env bash`)
-3. Writes to `build/scripts/<name>` with `chmod +x`
-4. In the module `.sh`, script calls become: `"$JAIPH_SCRIPTS/<name>" "$@"`
-
-The runtime sets `$JAIPH_SCRIPTS` to the build output scripts directory.
-
-### Shebang syntax
-
-The first non-empty line of the script body is checked for `#!`. If present, it becomes the file's shebang. If absent, `#!/usr/bin/env bash` is used.
-
-```
-script check_json() {
-  #!/usr/bin/env node
-  const data = JSON.parse(process.argv[2]);
-  process.exit(data.valid ? 0 : 1);
-}
-
-script check_is_number() {
-  [[ "$1" =~ ^[0-9]+$ ]]
-}
-```
-
-### Data flow
-
-**Data flow is always explicit**:
-- **Input**: named parameters (declared in signature) or positional arguments (`$1`, `$2`, ...). Named params are syntactic sugar — they transpile to positional arg assignments.
-- **Output**: stdout (value), stderr (diagnostics), exit code (success/failure)
-- **No side channel**: scripts cannot read `const` variables from workflows/rules
-
-### Shared utility code (bash scripts only)
-
-Scripts cannot call other Jaiph scripts. Factor repeated bash into **`import script "./helper.sh" as helper`** (path relative to the `.jh` file), another `.jh` module, or a small extra `script` in the same module. Do not use a workspace-wide bash drop directory outside the compiler model.
-
-Non-bash scripts use their language's own module system for shared code.
-
-## Semantics: Values, Returns, Failures
-
-### Scripts (isolated, standalone executables)
-
-Values are passed via **stdout**. Caller captures with `const result = run script_name`.
-
-Exit code determines success/failure: `return 0` / `exit 0` = success, `return 1` / `exit 1` = failure.
-
-The existing `jaiph::set_return_value` mechanism is **removed** from script transpilation. `return "$string"` in a bash script body is a **parser error** (bash `return` only accepts integers).
-
-### Workflows
-
-`return "value"` passes a value to the caller via the Jaiph runtime (not stdout).
-
-`fail "reason"` terminates the workflow with a non-zero exit and logs the reason to stderr. An unrecovered `ensure` failure also terminates the workflow.
-
-Exit code: 0 on natural completion or `return`. Non-zero on `fail` or unrecovered failure.
-
-### Rules
-
-`return "value"` passes a value to the caller. Captured by `const result = ensure rule_name`.
-
-`fail "reason"` causes the rule to fail. In the caller, this triggers a `recover` block (if present) or aborts.
-
-A rule that completes without hitting `fail` passes.
-
-### `fail` vs script failure
-
-| Context | How to fail | How to return a value |
-|---------|-------------|----------------------|
-| `script` | `return 1` / `exit 1` | `echo "value"` (stdout) |
-| `workflow` | `fail "reason"` | `return "value"` |
-| `rule` | `fail "reason"` | `return "value"` |
-
-## Migration Examples
-
-### Rule: raw shell → structured
-
-Before:
-
-```
-rule ensure_is_number() {
-  if ! [[ "$1" =~ ^[0-9]+$ ]]; then
-    echo "Expected a non-negative integer, got: $1" >&2
-    exit 1
-  fi
-}
-```
-
-After:
-
-```
-script check_is_number(value) {
-  [[ "$value" =~ ^[0-9]+$ ]]
-}
-
-rule ensure_is_number(value) {
-  if not run check_is_number "$value" {
-    fail "Expected a non-negative integer, got: $value"
-  }
-}
-```
-
-### Workflow: inline shell → named script
-
-Before:
-
-```
-workflow default() {
-  n="${1:-10}"
-  ensure ensure_is_number "$n"
-  result = run fib "$n"
-  log "$result"
-}
-```
-
-After:
-
-```
-workflow default(n = "10") {
-  ensure ensure_is_number "$n"
-  const result = run fib "$n"
-  log "$result"
-}
-```
-
-### Script: return value via stdout (not `jaiph::set_return_value`)
-
-Before:
-
-```
-function fib() {
-  local result
-  result="$(fib_impl "$n")"
-  return "$result"
-}
-```
-
-After:
-
-```
-script fib() {
-  fib_impl() {
-    local x="$1"
-    if [ "$x" -le 1 ]; then
-      echo "$x"
-      return 0
-    fi
-    local a b
-    a="$(fib_impl "$((x - 1))")"
-    b="$(fib_impl "$((x - 2))")"
-    echo "$((a + b))"
-  }
-  fib_impl "$1"
-}
-```
-
-All data is internal. Caller captures via `const result = run fib "$n"`.
-
-### Polyglot script: Node.js validation
-
-```
-script validate_json_schema(schema_path, data_path) {
-  #!/usr/bin/env node
-  const Ajv = require('ajv');
-  const fs = require('fs');
-  const ajv = new Ajv();
-  const schema = JSON.parse(fs.readFileSync(process.argv[2], 'utf8'));
-  const data = JSON.parse(fs.readFileSync(process.argv[3], 'utf8'));
-  const valid = ajv.validate(schema, data);
-  if (!valid) {
-    console.error(JSON.stringify(ajv.errors));
-    process.exit(1);
-  }
-}
-
-workflow validate_config() {
-  ensure config_file_exists
-  const result = run validate_json_schema "schema.json" "config.json"
-  log "Config validated successfully"
-}
-```
-
-### Prompt with `returns` + value dispatch (engineer.jh pattern)
-
-Before:
-
-```
-local role_surgical = "<role>...</role>"
-local role_reductionist = "<role>...</role>"
-
-workflow implement() {
-  local role_name="$2"
-  local role
-  if [ "$role_name" = "surgical" ]; then
-    role="$role_surgical"
-  elif [ "$role_name" = "reductionist" ]; then
-    role="$role_reductionist"
-  fi
-  prompt "$role ..."
-}
-```
-
-After:
-
-```
-script select_role(role_name) {
-  local role_surgical='<role>
-    You are a surgical engineer. ...
-  </role>'
-  local role_reductionist='<role>
-    You are a reductionist engineer. ...
-  </role>'
-
-  case "$role_name" in
-    surgical) echo "$role_surgical" ;;
-    reductionist) echo "$role_reductionist" ;;
-    *) echo "Unknown role: $role_name" >&2; return 1 ;;
-  esac
-}
-
-workflow implement(task, role_name) {
-  const role = run select_role "$role_name"
-
-  prompt "
-    $role
-    ...
-    $task
-  "
-}
-```
-
-Role data is internal to the script. Orchestration only passes the role name and receives the resolved text. Full isolation — script has zero knowledge of caller scope.
-
-### Send operator
-
-Before:
-
-```
-workflow scanner() {
-  findings <- echo "Found 3 issues in auth module"
-}
-```
-
-After:
-
-```
-workflow scanner() {
-  findings <- "Found 3 issues in auth module"
-}
-```
-
-### Rule with value return
-
-Before:
-
-```
-rule echo_line() {
-  echo "this goes to logs only"
-  return "captured-value"
-}
-```
-
-After:
-
-```
-script echo_impl() {
-  echo "this goes to logs only" >&2
-}
-
-rule echo_line() {
-  run echo_impl
-  return "captured-value"
-}
-```
-
-## Pattern Catalog: .jaiph/ and e2e/ audit
-
-Every `.jh` file was scanned. Below are all patterns found that require migration, grouped by category.
-
-### P1: Raw shell in workflows (every .jaiph/ file)
-
-**Files**: queue.jh, docs_parity.jh, simplifier.jh, architect_review.jh, ensure_ci_passes.jh, qa.jh, git.jh, log_keyword.jh, nested_run.jh, workflow_greeting.jh, prompt_unmatched.jh, rule_pass.jh, assign_capture.jh
-
-**Examples**: `echo "..."`, `printf`, `mkdir -p`, `rm -f`, `exit 0`, `exit 1`, `test -n`, bare assignment (`dataset="testdata"`)
-
-**Migration**: each becomes a named `script` or a `const` declaration. `exit 0` → `return` (early success). `exit 1` → `fail "reason"`.
-
-### P2: Raw shell in rules (every rule)
-
-**Files**: git.jh (`git rev-parse`, `test -z "$(git status)"`), queue.jh (`echo | grep -q`), ensure_ci_passes.jh (`npm run test:ci`), docs_parity.jh (`test -f`, `while IFS= read`), simplifier.jh, say_hello.jh, say_hello_json.jh, current_branch.jh
-
-**Migration**: shell logic moves to scripts. Rules become structured: `run` the script, `if`/`fail` on the result.
-
-### P3: Iteration in workflows
-
-**Files**: architect_review.jh (`while IFS= read -r header; do ... done <<< "$headers"`), docs_parity.jh (`for f in docs/*.md`, `for f in "${docs_md_files[@]}"`).
-
-**Problem**: the loop body contains orchestration keywords (`run`, `ensure`, `prompt`, `log`). Cannot be pushed to a script.
-
-**Resolution**: use **workflow recursion**. Extract per-item logic into a workflow, then recurse over the list. Split newline-delimited lists with tiny `script` steps (e.g. `printf '%s\n' "$1" | head -n 1` / `tail -n +2`) or `import script`.
-
-```
-script list_docs_files() {
-  for f in docs/*.md; do
-    echo "$f"
-  done
-}
-
-workflow process_docs_recursive(file, remaining) {
-  run docs_page "$file"
-
-  if run has_value "$remaining" {
-    const next = run first_line "$remaining"
-    const rest = run rest_lines "$remaining"
-    run process_docs_recursive "$next" "$rest"
-  }
-}
-
-workflow default() {
-  const docs_files = run list_docs_files
-  const first = run first_line "$docs_files"
-  const rest = run rest_lines "$docs_files"
-  run process_docs_recursive "$first" "$rest"
-}
-```
-
-**Future feature: `each` modifier.** Planned syntax sugar that replaces the recursion boilerplate:
-
-```
-run docs_page each $docs_files
-```
-
-`each` is a modifier on `run`/`ensure` that calls the target once per newline-delimited item. No loop body, no mutable state, no break/continue. Backward-compatible addition — does not block v1.
-
-### P4: Bash arrays in workflows
-
-**File**: docs_parity.jh — builds arrays dynamically (`local files=()`, `files+=("$f")`), passes them as args (`"${files[@]}"`).
-
-**Resolution**: avoid arrays in orchestration. Represent lists as newline-delimited strings. Scripts that need to process multiple items receive them as a single string argument. Glob expansion (`docs/*.md`) stays in scripts.
-
-### P5: Mutable variables in workflows
-
-**File**: architect_review.jh — `local failed=0` then `failed=1` inside a loop to track whether any task failed.
-
-**Resolution**: restructure to avoid mutable state. The per-item workflow performs side effects (marking tasks). After recursion completes, re-check the final state:
-
-```
-workflow review_single_task(header) {
-  const task = run queue.get_task_by_header "$header"
-
-  if run is_dev_ready "$task" {
-    log "Already dev-ready: $header"
-    return
-  }
-
-  const verdict = run review_task "$task"
-  if run matches "$verdict" "dev-ready" {
-    run queue.mark_task_dev_ready "$header"
-    log "Marked dev-ready: $header"
-  } else {
-    log "Needs work: $header"
-  }
-}
-
-workflow default() {
-  const headers = run queue.get_all_task_headers
-  # recurse over headers (or use `each` when available)
-  ...
-
-  const remaining = run queue.count_not_ready
-  if not run is_zero "$remaining" {
-    fail "One or more tasks need work"
-  }
-}
-```
-
-No mutable counter. The source of truth is the queue state, not a variable.
-
-### P6: String comparison in workflows (SPEC GAP)
-
-**Files**: architect_review.jh (`[[ "$verdict" == "dev-ready" ]]`), engineer.jh (role name dispatch), git.jh (`[ -z "$role_name" ]`).
-
-**Resolution**: push to scripts.
-
-```
-script matches(a, b) {
-  [ "$a" = "$b" ]
-}
-
-script has_value(val) {
-  [ -n "$val" ]
-}
-
-if run matches "$verdict" "dev-ready" {
-  ...
-}
-```
-
-These are small, reusable utility scripts in the same module (or behind `import script`).
-
-### P7: `return "$(command)"` in scripts (Jaiph value return)
-
-**Files**: queue.jh (`return "$(awk ...)"`), docs_parity.jh (`return "$(git diff ...)"`), simplifier.jh (same pattern).
-
-**Migration**: replace `return "$(command)"` with direct stdout passthrough:
-
-Before: `return "$(awk '/^## /{print}' "$queue_file")"`
-
-After: `awk '/^## /{print}' "$queue_file"` (just let stdout flow)
-
-### P8: `logerr` in rules
-
-**Files**: say_hello.jh, say_hello_json.jh — `logerr "message"` inside raw shell rule body.
-
-**Migration**: under structured rules, `logerr` becomes a Jaiph keyword (already in legality matrix):
-
-```
-rule name_was_provided(name) {
-  if not run has_value "$name" {
-    logerr "You didn't provide your name :("
-    fail "name argument required"
-  }
-}
-```
-
-### P9: `ensure` with `recover` containing shell
-
-**File**: ensure_ci_passes.jh — `recover` block contains `echo "$1" > "$ci_log_file"`, shell conditionals, and a `prompt`.
-
-**Migration**: shell in recover body moves to scripts. `prompt` stays (recover body follows workflow rules):
-
-```
-script save_ci_log(content, path) {
-  echo "$content" > "$path"
-}
-
-script ci_log_exists(path) {
-  [ -s "$path" ]
-}
-
-workflow ensure_ci_passes() {
-  const ci_log_file = ".jaiph/tmp/ensure_ci_passes.last.log"
-  run mkdir_p ".jaiph/tmp"
-
-  ensure ci_passes recover {
-    run save_ci_log "$1" "$ci_log_file"
-    if not run ci_log_exists "$ci_log_file" {
-      fail "ci failure log is empty at $ci_log_file"
-    }
-    prompt "Fix failing CI... log at: $ci_log_file"
-  }
-
-  run rm_file "$ci_log_file"
-}
-```
-
-### P10: Shell variable expansion in `const` RHS
-
-**Files**: multiple — `"${1:-10}"`, `"${1:-}"`, `"${task%%$'\n'*}"`.
-
-**Ruling**: simple interpolation (`$var`, `"${var:-default}"`) is allowed in `const` RHS — these are value lookups, not computation. Bash string operations (`${var%%pattern}`, `${var//old/new}`) are computation — push to a script.
-
-| Allowed in `const` RHS | Not allowed (use script) |
-|------------------------|---------------------------|
-| `"$var"` | `"${var%%pattern}"` |
-| `"${var:-default}"` | `"${var//old/new}"` |
-| `"${var:+alt}"` | `"${#var}"` |
-| `"literal"` | `$(command)` |
-
-### P11: Script-to-script calls
-
-**File**: docs_parity.jh — rule `only_expected_docs_changed_after_prompt` calls script `is_allowed_file` directly.
-
-**Migration**: under full isolation + no script-to-script calls, inline the logic or add a dedicated `import script` helper:
-
-```
-script check_only_expected_changed(allowed, changed) {
-  while IFS= read -r f; do
-    [ -z "$f" ] && continue
-    if [[ $'\n'"$allowed"$'\n' != *$'\n'"$f"$'\n'* ]]; then
-      echo "Unexpected file changed: $f" >&2
-      return 1
-    fi
-  done <<< "$changed"
-}
-```
-
-## Implementation Plan
-
-### Phase 0: Architectural prep (before breaking changes)
-
-**0a. Refactor `validate.ts` — collapse duplicate ref resolution**
-- Merge `validateRuleRef`, `validateWorkflowRef`, `validateRunInRuleRef`, `validateRunTargetRef`, `validateBareSendSymbol` into one generic `validateRef(ref, allowedKinds, context)` function
-- Target: 788 → ~400 lines
-- Zero behavior change
-
-**0b. Split `emit-workflow.ts` — separate emitters**
-- Extract script emission into `emit-script.ts`
-- Extract rule emission into `emit-rule.ts`
-- `emit-workflow.ts` becomes orchestration-only assembly
-- Creates natural seam for Phase 3 (separate script files)
-
-### Phase 1: Language additions (no breaking changes)
-
-**1a. Add `fail` keyword**
-- AST: new `WorkflowStepDef` variant `{ type: "fail"; message: string; loc: SourceLoc }`
-- Parser: recognize `fail "reason"` in `workflows.ts`
-- Transpiler: emit `echo "reason" >&2; exit 1`
-
-**1b. Add `const` declaration**
-- AST: new step type `{ type: "const"; name: string; value: ConstValue; loc: SourceLoc }` where `ConstValue` is string-expr | run-capture | ensure-capture | prompt-capture
-- Parser: `const name = ...` with RHS dispatch
-- Transpiler: emit `local name; name="value"` or appropriate capture form
-
-**1c. Formalize `wait` as keyword**
-- AST: new variant `{ type: "wait"; loc: SourceLoc }`
-- Parser: recognize `wait` in workflows (currently falls through to shell)
-- Transpiler: emit `wait`
-
-**1d. Switch `if` to brace syntax**
-- Parser: recognize `if [not] ensure/run ref { ... } [else if ...] [else { ... }]`
-- Keep old `if ... then ... fi` working during Phase 1 (dual parsing)
-- Transpiler: both forms emit the same bash
-
-### Phase 2: Rule parser rewrite
-
-**2a. Restructure `RuleDef`**
-- Change `RuleDef.commands: string[]` → `RuleDef.steps: RuleStepDef[]` (or reuse `WorkflowStepDef` subset)
-- Rewrite `rules.ts` with keyword-aware parsing (mirror `workflows.ts` structure)
-- Port existing rule tests first, then validate structured output
-
-**2b. Update rule emission**
-- `emit-workflow.ts`: handle structured rule steps instead of opaque command strings
-
-### Phase 3: `function` → `script` rename and separate file transpilation
-
-**3a. Rename keyword**
-- Parser: accept `script` keyword instead of `function`
-- AST: rename `FunctionDef` → `ScriptDef`, add `shebang?: string` field
-- `jaiphModule`: rename `functions` → `scripts`
-- Update all validator references
-
-**3b. Add shebang extraction**
-- Parser: check first non-empty line of script body for `#!`
-- If present, store in `ScriptDef.shebang` and exclude from body commands
-- If absent, `shebang` remains `undefined` (default `#!/usr/bin/env bash`)
-
-**3c. Conditional keyword guard**
-- For bash scripts (no shebang or bash shebang): keep existing Jaiph keyword rejection
-- For custom shebangs: skip keyword guard entirely
-
-**3d. Emit scripts as separate files**
-- Change `emitWorkflow` return type: `{ module: string; scripts: ScriptFile[] }` where `ScriptFile = { name: string; content: string; shebang: string }`
-- Module `.sh` calls scripts via `"$JAIPH_SCRIPTS/<name>" "$@"`
-- `build.ts`: write script files with `chmod +x`, set `$JAIPH_SCRIPTS`
-
-**3e. Update all first-party `.jh` files**
-- Rename `function` → `script` in all `.jaiph/*.jh` files
-- Rename in all `e2e/*.jh` fixtures
-- Update test fixtures and golden outputs
-
-**3f. Named parameters**
-- Parser: recognize `name(param1, param2)` and `name(param1, param2 = "default")` in workflow, rule, and script declarations
-- AST: add `params?: Array<{ name: string; default?: string }>` to `WorkflowDef`, `RuleDef`, `ScriptDef`
-- Transpiler: for workflows/rules, emit `local param1="$1"; local param2="$2"` (or `"${2:-default}"` for defaults) at the top of the function body. For bash scripts, prepend the same to the script file. For non-bash scripts, params are documentary only.
-- Validator: check call-site arity against declared params. Missing required args = validation error. Extra args beyond declared params = validation warning.
-- Update all first-party `.jh` files to use named params where applicable
-- Parentheses optional when no params: `workflow default() { ... }` remains valid
-
-### Phase 4: Script isolation
-
-**4a. Implement full isolation for script execution**
-- Scripts run as separate processes (inherent from separate files + exec)
-- Only positional args available (inherent from separate executable)
-- Set `$JAIPH_SCRIPTS` and `$JAIPH_WORKSPACE` for script steps (no workspace bash lib dir)
-
-**4b. Reject script-to-script calls**
-- Parser/validator: detect when a script body references another Jaiph script name
-- Error: `"scripts cannot call other Jaiph scripts; use import script, inline bash, or compose in a workflow"`
-
-### Phase 5: Remove shell (breaking changes)
-
-**5a. Remove shell fallback from workflow parser**
-- `workflows.ts`: delete the catch-all `type: "shell"` codepath
-- Remove `shellAccumulator` / `braceDepthDelta` shell accumulation
-- Emit parser error: `"raw shell is not allowed in workflow; extract to a script"`
-
-**5b. Remove shell fallback from rule parser**
-- Same treatment after Phase 2
-
-**5c. Remove old `if` syntax**
-- Drop `if ... then ... fi` / `elif` parsing
-- Only accept brace syntax with `not` / `else if`
-
-**5d. Enforce pure output in scripts**
-- `scripts.ts`: reject `return "value"` (non-integer return)
-- Remove `jaiph::set_return_value` from script transpilation
-
-**5e. Update send operator**
-- Accept `"value"` / `$var` / `run ref` as RHS
-- Reject raw shell command as RHS
-
-### Phase 6: Migrate all first-party code
-
-- Rewrite all `e2e/*.jh` fixtures
-- Rewrite all `.jaiph/*.jh` workflows
-- Factor repeated bash into `import script` or extra `script` blocks in the same module (P6, P11)
-- Update test fixtures and golden transpilation outputs
-- Update docs and README examples
-
-### Phase 7: Ship
-
-- Hard parser errors on all legacy syntax
-- Error messages include rewrite examples
-- Full e2e + golden snapshot CI gate
-- Zero P0 parser/runtime failures before merge
-
-## Code Changes Required
-
-| File | Change |
-|------|--------|
-| `src/types.ts` | Rename `FunctionDef` → `ScriptDef`, add `shebang?: string`, add `params?: ParamDef[]`. Rename `jaiphModule.functions` → `jaiphModule.scripts`. Add `params?: ParamDef[]` to `WorkflowDef`, `RuleDef`. Add `fail`, `wait`, `const` step types. Change `RuleDef.commands` → `RuleDef.steps`. Remove `shell` condition kind from `if`. Add `not` / brace-style `if` AST. |
-| `src/parser.ts` | Replace `function` keyword detection with `script`. Rename `parseFunctionBlock` → `parseScriptBlock`. |
-| `src/parse/functions.ts` → `src/parse/scripts.ts` | Rename file. Update regex to match `script` keyword. Add shebang extraction. Conditional keyword guard (skip for custom shebangs). Parse named params in signature. |
-| `src/parse/workflows.ts` | Remove shell fallback, shell accumulator. Add `fail`, `const`, `wait` parsing. Replace `if ... then ... fi` with brace syntax. |
-| `src/parse/rules.ts` | Full rewrite: keyword-aware structured parser mirroring workflow parser. |
-| `src/transpile/emit-workflow.ts` | Split: extract script emission to `emit-script.ts`, rule emission to `emit-rule.ts`. Change return type to include script files. Remove `jaiph::set_return_value` from script paths. |
-| `src/transpile/emit-script.ts` | **New file.** Emit standalone script files with shebang + body. |
-| `src/transpile/emit-rule.ts` | **New file.** Rule emission extracted from `emit-workflow.ts`. |
-| `src/transpile/emit-steps.ts` | Remove `emitShellStep` for workflows. Add `emitFailStep`, `emitConstStep`, `emitWaitStep`. |
-| `src/transpile/build.ts` | Handle new `emitWorkflow` return shape. Write script files with `chmod +x`. Set `$JAIPH_SCRIPTS` path. |
-| `src/transpile/validate.ts` | Collapse duplicate ref resolution. Rename `function` → `script` in errors/lookups. Allow `run` in rules (scripts only). Remove shell-condition validation. Add script isolation validation. |
-| `src/transpile/shell-jaiph-guard.ts` | Scope down — only applies to bash scripts now. |
-| `e2e/*.jh` | Rewrite all fixtures to new syntax. |
-| `.jaiph/*.jh` | Rewrite all workflows to new syntax. |
-| `test/fixtures/**` | Update golden transpilation outputs. |
-| `docs/*` | Update grammar, getting-started, CLI docs for `script` keyword and shebang. |
-
-## Risks
-
-| Risk | Impact | Mitigation |
-|------|--------|------------|
-| Wide breakage: all raw-shell workflows/rules fail at parse time | High | Single branch, full e2e gate, no merge without 100% pass |
-| Rule parser rewrite introduces regressions | High | Port existing rule tests before rewriting parser |
-| Ergonomic cost of named scripts for trivial shell | Medium | Accepted tradeoff — boundary clarity > brevity |
-| `fail` interacts badly with `recover` | Medium | Explicit test: `ensure rule_with_fail recover { ... }` must trigger recover |
-| `const` scoping conflicts with bash `local` | Low | `const` is parser-level immutability; transpiles to `local` |
-| Return semantics confusion during migration | Medium | Parser errors guide users: `"return 'value' not allowed in script; use echo"` |
-| Script isolation perf overhead (fork+exec per call) | Medium | Measure fork cost; scripts are already logically isolated. Optimize hot paths if needed |
-| Users want a global bash grab-bag | Medium | `import script` + small modules; no `JAIPH_LIB` |
-| `.jaiph/` workflow migration is large (9 files) | High | Migrate in parallel with parser changes; each file is independently testable |
-| Separate file management complexity | Medium | Deterministic naming (`scripts/<name>`), cleanup on rebuild |
-| Custom shebang scripts may have missing dependencies | Low | Not Jaiph's problem — user owns their runtime. Document clearly |
-
-## Success Criteria
-
-- 100% first-party `.jh` files parse under new grammar
-- 100% e2e pass under new runtime
-- Zero `type: "shell"` steps in workflow/rule AST output
-- `fail` triggers `recover` correctly in `ensure` blocks
-- Script bodies reject `return "value"`, `fail`, `const`, other Jaiph keywords (bash scripts only)
-- Script bodies reject calls to other Jaiph scripts
-- Scripts execute as separate files with correct shebang and `+x`
-- Custom shebang scripts (e.g. `#!/usr/bin/env node`) work end-to-end
-- Scripts execute in full isolation (no inherited variables)
-- `const` declarations work in workflows and rules with all RHS forms
-- `if` brace syntax works with `not` and `else if`
-- Parser errors for raw shell include actionable rewrite examples
-- `jaiph::set_return_value` removed from script transpilation paths
-- `validate.ts` under 500 lines after dedup
-- `emit-workflow.ts` handles only orchestration; script/rule emission in separate files
-- Named parameters work in workflow, rule, and script declarations
-- Default parameter values work: `workflow deploy(env, dry_run = "false")`
-- Arity validation catches missing required args at call sites
diff --git a/.jaiph/lib_common.jh b/.jaiph/lib_common.jh
new file mode 100644
index 00000000..20888a7b
--- /dev/null
+++ b/.jaiph/lib_common.jh
@@ -0,0 +1,33 @@
+#!/usr/bin/env jaiph
+
+#
+# Shared string/file helpers for the .jaiph orchestration workflows.
+# Import as: import "./lib_common.jh" as common
+#
+# Writes UTF-8 text to a path: $1 = path, $2 = content.
+# python3 instead of `echo`, so backslashes and dash-leading content
+# are written verbatim. Content still travels through argv, so it is
+# subject to the OS ARG_MAX limit (~1 MB on macOS).
+export script save_string_to_file = ```python3
+import sys
+if len(sys.argv) < 3:
+    sys.exit(2)
+path, content = sys.argv[1], sys.argv[2]
+open(path, "w", encoding="utf-8").write(content)
+```
+
+export script first_line_str = `printf '%s\n' "$1" | head -n 1`
+
+export script rest_lines_str = `printf '%s\n' "$1" | tail -n +2`
+
+export script arg_nonempty = `[ -n "$1" ]`
+
+export script str_equals = `[ "$1" = "$2" ]`
+
+export script to_lower = `printf '%s' "$1" | tr '[:upper:]' '[:lower:]'`
+
+export script mkdir_p_simple = `mkdir -p "$1"`
+
+export script rm_file_simple = `rm -f "$1"`
+
+export script jaiph_tmp_dir = `printf '%s\n' "$JAIPH_WORKSPACE/.jaiph/tmp"`
diff --git a/.jaiph/libs/jaiphlang/git.jh b/.jaiph/libs/jaiphlang/git.jh
index 8cf01eea..ba94635a 100755
--- a/.jaiph/libs/jaiphlang/git.jh
+++ b/.jaiph/libs/jaiphlang/git.jh
@@ -37,9 +37,11 @@ rule is_clean() {
 
 workflow commit(task) {
   config {
-    agent.backend = "cursor"
-    agent.cursor_flags = "--force"
-    agent.default_model = "auto"
+    # agent.backend = "cursor"
+    # agent.default_model = "composer-2"
+    # agent.cursor_flags = "--force"
+    agent.backend = "claude"
+    agent.claude_flags = "--permission-mode bypassPermissions"
   }
 
   ensure in_git_repo()
diff --git a/.jaiph/main.jh b/.jaiph/main.jh
deleted file mode 100755
index aaf143f7..00000000
--- a/.jaiph/main.jh
+++ /dev/null
@@ -1,17 +0,0 @@
-#!/usr/bin/env jaiph
-
-#
-# Full pipeline: architect review → implement first queue task.
-# For periodic docs audit, run docs_parity.jh separately.
-#
-
-import "./engineer.jh" as implement
-import "./architect_review.jh" as architect
-import "jaiphlang/git" as git
-
-workflow default() {
-  ensure git.is_clean()
-
-  run architect.default()
-  run implement.default("queue")
-}
\ No newline at end of file
diff --git a/.jaiph/prepare_release.jh b/.jaiph/prepare_release.jh
new file mode 100755
index 00000000..a110429c
--- /dev/null
+++ b/.jaiph/prepare_release.jh
@@ -0,0 +1,139 @@
+#!/usr/bin/env jaiph
+
+#
+# Release-prep workflow. Single-sources the CLI version: bumps package.json,
+# refreshes the installer's hardcoded ref, rebuilds the CLI, verifies that
+# `jaiph --version` matches package.json, and regenerates docs/registry.
+#
+# Run as:
+#   jaiph run .jaiph/prepare_release.jh -- 0.9.5     # explicit version
+#   jaiph run .jaiph/prepare_release.jh              # next patch version
+#
+# The workflow never creates a commit or git tag — it stages edits for the
+# operator to review, commit, tag, and push manually.
+#
+
+script read_pkg_version = `node -p "require('./package.json').version"`
+
+script assert_version_format = ```
+  v="$1"
+  case "${v}" in
+    *[!0-9.]*) printf 'version must match X.Y.Z (digits only); got: %s\n' "${v}" >&2; exit 1 ;;
+  esac
+  printf '%s' "${v}" | grep -Eq '^[0-9]+\.[0-9]+\.[0-9]+$' || {
+    printf 'version must match X.Y.Z (digits only); got: %s\n' "${v}" >&2
+    exit 1
+  }
+```
+
+script compute_next_patch = ```python3
+import sys
+v = sys.argv[1]
+parts = v.split('.')
+if len(parts) != 3 or not all(p.isdigit() for p in parts):
+    sys.stderr.write(f"invalid current version in package.json: {v}\n")
+    sys.exit(1)
+parts[-1] = str(int(parts[-1]) + 1)
+print('.'.join(parts))
+```
+
+script assert_git_tree_clean = ```
+  if [ -n "$(git status --porcelain)" ]; then
+    echo "git tree is dirty; commit or stash before running prepare_release" >&2
+    git status --short >&2
+    exit 1
+  fi
+```
+
+script assert_tag_does_not_exist = ```
+  v="$1"
+  if git rev-parse -q --verify "refs/tags/v${v}" >/dev/null 2>&1; then
+    printf 'tag v%s already exists\n' "${v}" >&2
+    exit 1
+  fi
+```
+
+script npm_version_no_tag = `npm version "$1" --no-git-tag-version --allow-same-version >/dev/null`
+
+script update_install_release_ref = ```python3
+import sys
+old, new = sys.argv[1], sys.argv[2]
+path = "docs/install"
+with open(path, "r", encoding="utf-8") as f:
+    src = f.read()
+needle = f"v{old}"
+count = src.count(needle)
+if count == 0:
+    sys.stderr.write(f"docs/install: hardcoded ref v{old} not found\n")
+    sys.exit(1)
+new_src = src.replace(needle, f"v{new}")
+with open(path, "w", encoding="utf-8") as f:
+    f.write(new_src)
+print(count)
+```
+
+script run_npm_build = `npm run build >&2`
+
+script assert_built_cli_version_equals = ```
+  v="$1"
+  expected="jaiph ${v}"
+  actual="$(node dist/src/cli.js --version)"
+  if [ "${expected}" != "${actual}" ]; then
+    printf 'displayed --version mismatch\nexpected: %s\nactual:   %s\n' "${expected}" "${actual}" >&2
+    exit 1
+  fi
+```
+
+script run_registry_build = `npm run registry:build >&2`
+
+workflow resolve_version(arg) {
+  const pkg_version = run read_pkg_version()
+  const resolved = match arg {
+    "" => run compute_next_patch(pkg_version)
+    _ => arg
+  }
+  run assert_version_format(resolved)
+  return resolved
+}
+
+workflow preflight(version) {
+  run assert_git_tree_clean()
+  run assert_tag_does_not_exist(version)
+}
+
+workflow apply_version_change(old_version, new_version) {
+  run npm_version_no_tag(new_version)
+  run update_install_release_ref(old_version, new_version)
+}
+
+workflow check_displayed_version(version) {
+  run run_npm_build()
+  run assert_built_cli_version_equals(version)
+}
+
+workflow default(arg) {
+  const version = run resolve_version(arg)
+  const old_version = run read_pkg_version()
+  log "Preparing release v${version} (current: v${old_version})"
+
+  run preflight(version)
+  run apply_version_change(old_version, version)
+  run check_displayed_version(version)
+  run run_registry_build()
+
+  log """
+    prepare_release: staged release v${version}
+      - package.json + package-lock.json (npm version ${version})
+      - docs/install (release ref v${old_version} -> v${version})
+      - docs/registry (regenerated)
+      - dist/ (rebuilt; jaiph --version == jaiph ${version})
+
+    Remaining manual steps:
+      1. Review the diff (git diff)
+      2. Commit the staged changes
+      3. Tag: git tag v${version}
+      4. Push branch + tag (tag push triggers docker-publish and release.yml)
+      5. Smoke check: jaiph use ${version}
+  """
+  return version
+}
diff --git a/.jaiph/prepare_release.test.jh b/.jaiph/prepare_release.test.jh
new file mode 100644
index 00000000..55d729ae
--- /dev/null
+++ b/.jaiph/prepare_release.test.jh
@@ -0,0 +1,86 @@
+#!/usr/bin/env jaiph
+
+import "./prepare_release.jh" as pr
+
+# resolve_version handles the empty-arg / explicit-arg branches and the
+# X.Y.Z format check; tests use mock script to pin the package.json version.
+
+test "resolve_version: empty arg returns next patch from package.json" {
+  mock script pr.read_pkg_version() {
+    echo "1.2.3"
+  }
+  const out = run pr.resolve_version("")
+  expect_equal out "1.2.4"
+}
+
+test "resolve_version: explicit X.Y.Z arg is accepted verbatim" {
+  mock script pr.read_pkg_version() {
+    echo "0.0.0"
+  }
+  const out = run pr.resolve_version("9.8.7")
+  expect_equal out "9.8.7"
+}
+
+test "resolve_version: non-X.Y.Z arg fails with offending value" {
+  mock script pr.read_pkg_version() {
+    echo "0.0.0"
+  }
+  const out = run pr.resolve_version("not-a-version") allow_failure
+  expect_contain out "version must match X.Y.Z"
+  expect_contain out "not-a-version"
+}
+
+test "resolve_version: extra-segment arg fails with offending value" {
+  mock script pr.read_pkg_version() {
+    echo "0.0.0"
+  }
+  const out = run pr.resolve_version("1.2.3.4") allow_failure
+  expect_contain out "version must match X.Y.Z"
+  expect_contain out "1.2.3.4"
+}
+
+# check_displayed_version: builds the CLI and compares its --version output
+# against the expected literal. On mismatch the script must print both the
+# expected and actual strings before the workflow fails.
+
+test "check_displayed_version: mismatch fails with both values in output" {
+  mock script pr.run_npm_build() {
+    :
+  }
+  mock script pr.assert_built_cli_version_equals() {
+    expected="jaiph $1"
+    actual="jaiph 0.0.0"
+    printf 'displayed --version mismatch\nexpected: %s\nactual:   %s\n' "${expected}" "${actual}" >&2
+    exit 1
+  }
+  const out = run pr.check_displayed_version("9.9.9") allow_failure
+  expect_contain out "expected: jaiph 9.9.9"
+  expect_contain out "actual:   jaiph 0.0.0"
+}
+
+# preflight: refuses to start if the working tree is dirty so the workflow's
+# own edits are the only diff a reviewer sees.
+
+test "preflight: dirty git tree fails before any side effects" {
+  mock script pr.assert_git_tree_clean() {
+    echo "git tree is dirty; commit or stash before running prepare_release" >&2
+    exit 1
+  }
+  mock script pr.assert_tag_does_not_exist() {
+    :
+  }
+  const out = run pr.preflight("9.9.9") allow_failure
+  expect_contain out "git tree is dirty"
+}
+
+test "preflight: existing tag v<version> fails" {
+  mock script pr.assert_git_tree_clean() {
+    :
+  }
+  mock script pr.assert_tag_does_not_exist() {
+    printf 'tag v%s already exists\n' "$1" >&2
+    exit 1
+  }
+  const out = run pr.preflight("9.9.9") allow_failure
+  expect_contain out "tag v9.9.9 already exists"
+}
diff --git a/.jaiph/security_review.jh b/.jaiph/security_review.jh
new file mode 100644
index 00000000..1d403389
--- /dev/null
+++ b/.jaiph/security_review.jh
@@ -0,0 +1,138 @@
+#!/usr/bin/env jaiph
+
+#
+# Security review of code changes. Reviews uncommitted changes by default,
+# or a git diff range passed as the first argument:
+#   jaiph run .jaiph/security_review.jh              # staged + unstaged + untracked
+#   jaiph run .jaiph/security_review.jh "main..HEAD" # a ref range
+# Writes a markdown report to .jaiph/tmp and publishes it as a run artifact.
+# Fails when any HIGH severity finding is confirmed.
+#
+# Review methodology adapted from anthropics/claude-code-security-review
+# (claudecode/prompts.py): high-confidence findings only, explicit
+# false-positive exclusions, severity + confidence scoring.
+#
+import "./lib_common.jh" as common
+import "jaiphlang/artifacts" as artifacts
+
+config {
+  agent.backend = "claude"
+  agent.claude_flags = "--permission-mode bypassPermissions"
+}
+
+const report_file = .jaiph/tmp/security_review_report.md
+
+const reviewer_role = """
+  You are a senior security engineer conducting a focused security review.
+  Identify HIGH-CONFIDENCE security vulnerabilities with real exploitation
+  potential. Minimize false positives: flag only issues where you are more
+  than 80% confident of actual exploitability in this codebase.
+
+  Vulnerability classes to examine:
+  1. Input validation: SQL/command/template/NoSQL injection, XXE,
+     path traversal.
+  2. Authentication & authorization: bypass logic, privilege escalation,
+     session flaws, JWT issues, insecure direct object references.
+  3. Crypto & secrets: hardcoded credentials, weak algorithms, improper key
+     storage, certificate validation bypasses, insecure randomness.
+  4. Code execution: unsafe deserialization, eval/exec on untrusted input,
+     unsafe YAML/pickle loading, XSS (reflected, stored, DOM-based).
+  5. Data exposure: secrets or PII in logs, debug info leaks, overly
+     revealing error messages, sensitive data written to artifacts.
+
+  Severity scale:
+  - HIGH: directly exploitable; leads to RCE, data breach, or auth bypass.
+  - MEDIUM: exploitable under specific conditions, significant impact.
+  - LOW: defense-in-depth gaps or low-impact weaknesses.
+
+  Do NOT report (out of scope, treated as noise):
+  - Denial of service, rate limiting, memory/CPU exhaustion.
+  - Missing input validation on non-security-critical fields without a
+    demonstrated security impact.
+  - Any finding you cannot back with a concrete exploit scenario.
+  - Style, performance, or general code-quality issues.
+"""
+
+script git_diff_uncommitted = ```
+{
+  git diff --cached
+  git diff
+  git ls-files --others --exclude-standard | while IFS= read -r f; do
+    [ -z "$f" ] && continue
+    git diff --no-index -- /dev/null "$f" || true
+  done
+}
+```
+
+script git_diff_range = `git diff "$1"`
+
+script worktree_fingerprint = `git status --porcelain | sort | cksum`
+
+workflow review_diff(diff_text) {
+  const result = prompt """
+    <role>
+    ${reviewer_role}
+    </role>
+    <task>
+    Review the following code changes for security vulnerabilities. You have
+    read access to the full repository — read surrounding source files
+    whenever needed to confirm whether a finding is actually exploitable;
+    do not judge from the diff alone.
+
+    Write a full markdown report to ${report_file} (overwrite if present)
+    with one section per finding: title, severity (HIGH/MEDIUM/LOW),
+    confidence (0.7-1.0; discard anything below 0.7), file and line,
+    a concrete exploit scenario, and a specific remediation. If there are
+    no findings, write a short report stating what was reviewed and that
+    nothing was found.
+
+    Do not modify any file in the repository other than ${report_file}.
+
+    Respond with JSON fields:
+    - verdict: the string "fail" if there is at least one HIGH finding,
+      otherwise the string "pass".
+    - highs, mediums, lows: finding counts by severity.
+    - summary: 1-3 sentences describing the overall result.
+
+    Code changes under review:
+    ${diff_text}
+    </task>
+  """
+  returns "{ verdict: string, highs: number, mediums: number, lows: number, summary: string }"
+
+  log "Security review: ${result.summary}"
+  log "Findings: high=${result.highs} medium=${result.mediums} low=${result.lows} (report: ${report_file})"
+  return result.verdict
+}
+
+workflow default(scope) {
+  run common.mkdir_p_simple(".jaiph/tmp")
+  const fingerprint_before = run worktree_fingerprint()
+
+  const diff_text = match scope {
+    "" => run git_diff_uncommitted()
+    _ => run git_diff_range(scope)
+  }
+  if diff_text == "" {
+    log "Security review: no changes to review."
+    return ""
+  }
+
+  const verdict = run review_diff(diff_text)
+
+  # The reviewer must be read-only apart from the (gitignored) report file.
+  const fingerprint_after = run worktree_fingerprint()
+  run common.str_equals(fingerprint_before, fingerprint_after) catch (err) {
+    fail "Security review must not modify the worktree, but git status changed during review. Inspect git status before trusting this run."
+  }
+
+  run artifacts.save(report_file)
+
+  run common.str_equals(verdict, "pass") catch (err) {
+    fail """
+      Security review found HIGH severity issues.
+      See ${report_file} (also published to the run artifacts directory).
+    """
+  }
+  log "Security review passed."
+}
diff --git a/.jaiph/skills.lock b/.jaiph/skills.lock
new file mode 100644
index 00000000..403fd4d3
--- /dev/null
+++ b/.jaiph/skills.lock
@@ -0,0 +1,11 @@
+{
+  "version": 1,
+  "skills": {
+    "documentation-writer": {
+      "source": "github/awesome-copilot",
+      "sourceType": "github",
+      "skillPath": "skills/documentation-writer/SKILL.md",
+      "computedHash": "ee53d65b163cd7eb953a930c95841cfe398cc2c0bd24c06508bbaa07c432be35"
+    }
+  }
+}
diff --git a/.jaiph/skills/documentation-writer/SKILL.md b/.jaiph/skills/documentation-writer/SKILL.md
new file mode 100644
index 00000000..1921e864
--- /dev/null
+++ b/.jaiph/skills/documentation-writer/SKILL.md
@@ -0,0 +1,53 @@
+<!--
+  Vendored from: https://github.com/github/awesome-copilot
+  Upstream path: skills/documentation-writer/SKILL.md
+  Source URL:    https://raw.githubusercontent.com/github/awesome-copilot/main/skills/documentation-writer/SKILL.md
+  Blob SHA:      93e3fbf57fe64179570de382347db8258c661b56
+  Copied at:     2026-06-10
+  Re-sync by fetching the source URL above and replacing the content below this header.
+-->
+---
+name: documentation-writer
+description: 'Diátaxis Documentation Expert. An expert technical writer specializing in creating high-quality software documentation, guided by the principles and structure of the Diátaxis technical documentation authoring framework.'
+---
+
+# Diátaxis Documentation Expert
+
+You are an expert technical writer specializing in creating high-quality software documentation.
+Your work is strictly guided by the principles and structure of the Diátaxis Framework (https://diataxis.fr/).
+
+## GUIDING PRINCIPLES
+
+1. **Clarity:** Write in simple, clear, and unambiguous language.
+2. **Accuracy:** Ensure all information, especially code snippets and technical details, is correct and up-to-date.
+3. **User-Centricity:** Always prioritize the user's goal. Every document must help a specific user achieve a specific task.
+4. **Consistency:** Maintain a consistent tone, terminology, and style across all documentation.
+
+## YOUR TASK: The Four Document Types
+
+You will create documentation across the four Diátaxis quadrants. You must understand the distinct purpose of each:
+
+- **Tutorials:** Learning-oriented, practical steps to guide a newcomer to a successful outcome. A lesson.
+- **How-to Guides:** Problem-oriented, steps to solve a specific problem. A recipe.
+- **Reference:** Information-oriented, technical descriptions of machinery. A dictionary.
+- **Explanation:** Understanding-oriented, clarifying a particular topic. A discussion.
+
+## WORKFLOW
+
+You will follow this process for every documentation request:
+
+1. **Acknowledge & Clarify:** Acknowledge my request and ask clarifying questions to fill any gaps in the information I provide. You MUST determine the following before proceeding:
+    - **Document Type:** (Tutorial, How-to, Reference, or Explanation)
+    - **Target Audience:** (e.g., novice developers, experienced sysadmins, non-technical users)
+    - **User's Goal:** What does the user want to achieve by reading this document?
+    - **Scope:** What specific topics should be included and, importantly, excluded?
+
+2. **Propose a Structure:** Based on the clarified information, propose a detailed outline (e.g., a table of contents with brief descriptions) for the document. Await my approval before writing the full content.
+
+3. **Generate Content:** Once I approve the outline, write the full documentation in well-formatted Markdown. Adhere to all guiding principles.
+
+## CONTEXTUAL AWARENESS
+
+- When I provide other markdown files, use them as context to understand the project's existing tone, style, and terminology.
+- DO NOT copy content from them unless I explicitly ask you to.
+- You may not consult external websites or other sources unless I provide a link and instruct you to do so.
diff --git a/.jaiph/testing.jh b/.jaiph/testing.jh
deleted file mode 100755
index 50c15386..00000000
--- a/.jaiph/testing.jh
+++ /dev/null
@@ -1,10 +0,0 @@
-#! /usr/bin/env jaiph
-
-script test_runner = ```
-cd "${JAIPH_WORKSPACE:?}"
-bash e2e/tests/72_docker_run_artifacts.sh
-```
-
-workflow default() {
-  run test_runner()
-}
\ No newline at end of file
diff --git a/CHANGELOG.md b/CHANGELOG.md
index be0622c6..f26e9ad0 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,23 +1,80 @@
 # Unreleased
 
-- **Language:** `for <id> in <id> { … }` in workflows and rules iterates newline-delimited lines of a string binding. Newlines normalize `\r\n` to `\n`; a single trailing empty segment from a final newline is omitted. Lines are not trimmed and empty interior lines are still iterated unless the body skips them (e.g. `if line != "" { … }`). Documented in `docs/language.md`.
-- **Tests / QA:** Unit tests for string line splitting (`src/runtime/string-lines.test.ts`); E2E `e2e/tests/135_for_string_lines.sh`.
+- **Fix — Prompt watchdog: never hang on a backend that finishes but does not exit:** `runBackend` (`src/runtime/kernel/prompt.ts`) previously gated the entire prompt result on the child process closing — `parseStream` resolves only on its readline `close`, the merged stream ends only on the child's `close` event, so a `claude -p` that streamed its final answer but never exited (commonly because a descendant it spawned is still holding the stdout pipe open) blocked the runtime forever: no `PROMPT_END`, no commit, no queue progress, no retry. Three independent watchdog layers now wrap every subprocess backend (claude / cursor / custom command) via a new exported `installPromptWatchdog`: **(1) completion grace** — `parseStream` now takes an `onComplete` callback that fires when the backend's terminal `result` event is parsed (tracked by a new `sawResult` flag on `StreamState` in `src/runtime/kernel/stream-parser.ts`); once seen, the process is given `JAIPH_PROMPT_COMPLETION_GRACE_SECONDS` (default 30s) to exit before it is terminated and the prompt returns **success** with the captured answer; **(2) idle timeout** — no stdout/stderr for `JAIPH_PROMPT_IDLE_TIMEOUT_SECONDS` (default 900s / 15m, reset on every output chunk) terminates the process and returns **failure**, feeding the existing prompt-retry backoff; **(3) absolute cap** — total wall-clock over `JAIPH_PROMPT_MAX_SECONDS` (default 7200s / 2h) terminates and fails likewise. Each layer is disabled with `0`. On expiry the watchdog sends `SIGTERM`, escalating to `SIGKILL` after 5s. A single-settle guard in `runBackend` ensures the normal-exit path and the watchdogs cannot double-resolve, and on settle the runtime now destroys its handles on the child's `stdin`/`stdout`/`stderr` (and the claude `merged` PassThrough) so a lingering descendant holding a pipe can no longer keep the event loop — and thus the whole run — alive after the prompt has resolved. The three knobs are read in `resolveConfig` via literal `env.JAIPH_PROMPT_*` access so the env-var source-parity harness (`integration/docs-reference-task5.test.ts`) pins them, and are documented in `docs/env-vars.md` (parity table) and a new "Prompt watchdog timeouts" section in `docs/configuration.md`. New tests in `src/runtime/kernel/prompt.test.ts` cover the watchdog unit (idle fires, `bump()` resets idle, absolute cap ignores `bump()`, completion grace settles success with the captured final, `clear()` cancels, fires-at-most-once) plus two end-to-end `executePrompt` cases through a fake cursor-agent that hangs (recovers with success after a `result` event; recovers with failure on a silent hang). Under Docker, `runtime.docker_timeout_seconds` remains the outer backstop.
+- **Docs — Post-parity cleanup: retire the `docs/_legacy/` quarantine (docs redesign 8/8):** Final task in the [Diátaxis](https://diataxis.fr/) docs rewrite — the agent-doable cleanup that runs after the maintainer's redesign-aware parity pass (`jaiph run .jaiph/docs_parity_redesign.jh`, a redesign-aware copy of `docs_parity.jh` that lists docs recursively, excludes `docs/_legacy/`, and verifies the Diátaxis structure against the TypeScript/Bash source + `docs/architecture.md` instead of re-consolidating it). With the greenfield pages (tasks 3–7) confirmed to match source on run-dir naming, env-var lists, flag tables, config keys, and error codes, the `docs/_legacy/` quarantine is now obsolete — its content has been fully superseded by the live pages and is recoverable from git history. All 14 quarantined pages (`artifacts.md`, `cli.md`, `configuration.md`, `contributing.md`, `getting-started.md`, `grammar.md`, `hooks.md`, `inbox.md`, `language.md`, `libraries.md`, `sandboxing.md`, `setup.md`, `spec-async-handles.md`, `testing.md`) are deleted from the worktree, and the now-unneeded `- _legacy` entry (plus its explanatory comment) is removed from the Jekyll `exclude:` list in `docs/_config.yml` so the build config no longer carries a vestige of the quarantine. The README's "Docs note" trailing sentence ("Pre-redesign pages that have not been recreated yet stay quarantined under [`docs/_legacy/`](docs/_legacy/) (in git, not published).") is dropped because there are no longer any quarantined pages to disclose. The env-forwarding parity check in `src/runtime/docker.test.ts` is repointed from `docs/_legacy/sandboxing.md` to the published reference page `docs/env-vars.md` (asserting that the `ENV_ALLOW_PREFIXES` allowlist and the `ENV_ALLOW_EXCLUDE_PREFIX` exclude prefix appear verbatim in the live page), and the companion cross-link assertion that required `configuration.md` and `cli.md` to link to the `sandboxing.md#environment-variable-forwarding` section is dropped — the env-vars reference is now self-contained, so the legacy cross-link contract no longer applies. The dedicated quarantine harness `integration/docs-legacy-quarantine.test.ts` is deleted because its invariants ("`_legacy` is build-excluded", "live pages exist alongside quarantined reference copies", "nav never targets a quarantined permalink") no longer have a `_legacy` directory to police, and the matching row is removed from the test-suite table in `docs/contributing.md`. In its place, `integration/docs-structure.test.ts` replaces the prior "pages under `docs/_legacy/` are exempt from publish-side checks" lint with a one-line `docs-lint: docs/_legacy/ no longer exists (post-redesign cleanup)` assertion that fails if anyone re-introduces the directory — the cleanup is now a hard invariant rather than a tolerated state. The docs-lint, internal-link, redirect-coverage, env-var source-parity (`integration/docs-reference-task5.test.ts`), and nav-structure (`integration/docs-nav-structure-task7.test.ts`) tests from tasks 2–7 stay green, and `bundle exec jekyll build` exits 0 with no missing-link / front-matter warnings. No runtime, CLI, language, or behavior changes — this task is docs cleanup only, closing out the eight-task Diátaxis redesign queue.
+- **Docs — Diátaxis IA finalization: nav regrouping, landing entry points, redirect sweep (docs redesign 7/8):** Fifth content task in the [Diátaxis](https://diataxis.fr/) docs rewrite — the structural wiring task that ties together the greenfield Explanation (task 3), How-to (task 4), Reference (task 5), and Tutorials (task 6) pages into the target IA. The Jekyll nav in `docs/_layouts/docs.html` is regrouped into **five labeled `<li class="docs-nav-group">` sections in the documented Diátaxis order — Tutorials → How-to guides → Reference → Explanation → Contributing** — each containing exactly the published pages whose `diataxis:` front-matter matches the section (`tutorial` → Tutorials, `how-to` → How-to guides, `reference` → Reference, `explanation` → Explanation, `contributor` → Contributing). The active-page highlighting (`{% if page.permalink == '/...' %} class="docs-nav-active" aria-current="page"{% endif %}`) is preserved on every entry, and the contributor Agent Skill link continues to point at the in-site permalink `/jaiph-skill` (the raw-`jaiph-skill.md` URL stays in `README.md` and `docs/index.html` because those are the entry points agents themselves consume and they need the unrendered Markdown — that contract is unchanged from task 2). Tutorials lead the panel because they are the entry point for newcomers; Contributing trails because it is in-repo developer surface, not user-facing. The landing page (`docs/index.html`) entry points are repointed to lead with the **first tutorial** and the **how-to index** (not a flat page list): the top-nav `Docs` link is split into `Tutorial` (→ `/tutorials/first-workflow`) and `How-to` (→ `/how-to/install`), and the footer `Architecture` link is replaced with the same `Tutorial` + `How-to` pair so the landing page guides newcomers down the tutorial path and operators down the how-to path rather than dumping them on an explanation page. The live contributor page `docs/contributing.md` (permalink `/contributing`, `diataxis: contributor`, `redirect_from: /contributing.md`) owns the `/contributing` slug alongside `docs/jaiph-skill.md` at `/jaiph-skill` — both under the Contributing nav section (22 published `docs/*.md` pages with `diataxis:` front-matter in total). Every URL in the pre-redesign nav (`/getting-started`, `/setup`, `/libraries`, `/artifacts`, `/language`, `/grammar`, `/cli`, `/configuration`, `/testing`, `/spec-async-handles`, `/inbox`, `/hooks`, `/sandboxing`, `/architecture`, `/contributing`) now resolves to its new home — either directly (the slug is unchanged on a live page) or via a single `jekyll-redirect-from` stub emitted from the absorbing page's `redirect_from:` list. `bundle exec jekyll build` exits 0 with no missing-link / front-matter warnings and emits no page from `docs/_legacy/` (already build-excluded via the `_config.yml` `exclude:` list from task 1). A new integration test `integration/docs-nav-structure-task7.test.ts` (Node `--test`, auto-picked up by `npm test`) graders this task end-to-end as two checks: (1) the nav layout's `<li class="docs-nav-group">` headings are exactly `["Tutorials", "How-to guides", "Reference", "Explanation", "Contributing"]` in that order — drift in heading text or ordering fails the test; (2) every published `docs/*.md` with a `diataxis:` front-matter value appears under the matching section exactly once (no miss / no miscategorisation / no cross-section duplicate), and every section's link list equals the set of permalinks for its diataxis bucket — so adding a new how-to page without nav-wiring it, or accidentally listing a tutorial under Explanation, fails the test. The existing docs-lint harness from task 2 (`integration/docs-structure.test.ts`) continues to enforce the historical-permalink resolution check (`every historical nav permalink still resolves`) — that test mines every `'<url>' | relative_url` reference from `git log -p --all -- docs/_layouts/docs.html` and asserts the URL still resolves via a published page or a `redirect_from:` alias, which is the redirect-coverage backstop for this task. With this task in, the IA is complete: all four user-facing Diátaxis quadrants are nav-grouped under their section heading, plus the in-repo Contributing bucket; the remaining task 8 work is the README/landing sweep (`docs/contributing.md` and nav wiring are in). No runtime, CLI, or language behavior changes; the edits are to `docs/_layouts/docs.html`, `docs/index.html`, `docs/contributing.md`, and `docs/jaiph-skill.md` front-matter.
+- **Docs — Diátaxis Tutorials pass: guided first-success paths (docs redesign 6/8):** Fourth content task in the [Diátaxis](https://diataxis.fr/) docs rewrite. Two learning-oriented pages now land in `docs/` as published Diátaxis tutorials, each authored greenfield from the TypeScript/Bash source plus `docs/architecture.md` first and only then reconciled against `docs/_legacy/getting-started.md` (per the anti-bias protocol in `.jaiph/skills/documentation-writer/SKILL.md`). Both pages walk a newcomer from "have nothing" to a working first-success outcome, with every command copy-pasteable and one happy path only — branching/optional knobs link out to the relevant How-to or Reference page rather than expanding inline: `docs/first-workflow.md` (permalink `/tutorials/first-workflow`, `redirect_from: /getting-started`, `/getting-started.md`) — install → write a five-line script-only `.jh` with one `script` step and one `workflow default(who)` that returns the script's stdout → run with `jaiph run ./hello.jh "Adam"` → read the live progress tree, the printed return value, and the durable files under `.jaiph/runs/<date>/<time>-<entry>/` (`000001-workflow__default.out|.err`, `000002-script__greet.out|.err`, `return_value.txt`, `run_summary.jsonl`, `heartbeat`) → re-run with `exit 7` swapped into the script body to observe the failure footer (`✗ FAIL`, `Logs:` / `Summary:` / `out:` / `err:`, `Output of failed step:` excerpt; no `return_value.txt` on failure); `docs/first-agent-run.md` (permalink `/tutorials/first-agent-run`, no retired slug — genuinely new) — credential prerequisites stated up front per backend (claude → `ANTHROPIC_API_KEY` or `CLAUDE_CODE_OAUTH_TOKEN`; cursor → `CURSOR_API_KEY`; codex → `OPENAI_API_KEY`; Docker is hard-failing for missing env vars because stored CLI logins do not cross the container boundary) → Docker prerequisite (`docker info`, no `--docker` flag, overlay vs copy mode picked from `/dev/fuse`) → add `rule valid_name(name_arg)` with `match` arms plus a triple-quoted `prompt """ … """` step → run `jaiph run ./greet.jh "Adam"`, observing the `(Docker sandbox, fusefs)` / `(tmp workspace)` banner, the backend-and-preview prompt line, and the return value → re-run with empty `name_arg` so `ensure valid_name(name_arg)` aborts the workflow and the `prompt` step is never reached → inspect the `PROMPT_START` record in `run_summary.jsonl` with `jq` for the resolved `backend` / `model` / `model_reason`. Each page declares `diataxis: tutorial` and the matching `permalink: /tutorials/<slug>`. The Jekyll nav in `docs/_layouts/docs.html` gains a new **Tutorials** group at the top of the panel (above Why Jaiph / Architecture, since tutorials are the entry point for newcomers) with one entry per page; the previously flat Explanation block now sits under an explicit **Explanation** group label so the nav reads as four named Diátaxis sections (Tutorials → Explanation → How-to → Reference) ahead of the final IA regrouping in task 7. `docs/architecture.md` is tightened only at the link surface: `/getting-started` is removed from its `redirect_from:` list because the new tutorial owns it now (jekyll-redirect-from emits one canonical stub from the tutorial's `redirect_from:`). A new integration test `integration/docs-tutorials-task6.test.ts` (Node `--test`, auto-picked up by `npm test`) grades this task end-to-end as four checks: (1) each of the two pages declares `diataxis: tutorial` and the expected `permalink: /tutorials/<slug>`; (2) every tutorial permalink is reachable from the nav exactly once, and the nav surfaces a `<li class="docs-nav-group">Tutorials</li>` group heading; (3) `/getting-started` is absorbed by `first-workflow.md`'s `redirect_from:` and **not** by any other live page (the test also asserts `architecture.md` no longer claims the slug so two redirect stubs cannot conflict at build time); (4) the first ```jh fenced block in `first-workflow.md` is *executable* — the test extracts it, writes it to a temp `hello.jh`, runs `node dist/src/cli.js run <entry> Adam` in a clean env with `JAIPH_UNSAFE=true` / `NO_COLOR=1` / `TERM=dumb`, asserts exit 0, and asserts the normalised stdout (with `(\d+(\.\d+)?(s|ms))` timings collapsed to `<time>`) equals the first ```text block on the page after trimming. This is the "happy path is executable, not aspirational" contract — if a future change to the CLI banner / progress tree / return-value-printing path drifts the actual output away from the tutorial, this test fails. README.md is updated to surface the two new tutorials in the top-line link bar and in the "Docs note" callout (now reading "Tutorials, Explanation, How-to, and Reference quadrants have landed"), to drop `getting-started` from the legacy index (the slug is now owned by the live tutorial), and to repoint the three remaining `docs/_legacy/getting-started.md` references (Usage doc-map, Example trailer, Start-here "Human" bullet) at `docs/first-workflow.md` so a reader who lands on README from search keeps reaching live pages. `docs/index.html`'s Language section similarly repoints its `<a href="getting-started">Getting started</a>` link (and the `jaiph.org/getting-started` external link next to it) at `/tutorials/first-workflow`, so the landing page stops naming a slug that now exists only as a redirect stub. With this task in, all four user-facing Diátaxis quadrants are live (Explanation from task 3, How-to from task 4, Reference from task 5, Tutorials here); the final IA / nav regrouping is task 7 and the contributor pages plus the broader README/landing sweep is task 8. No runtime, CLI, or language behavior changes.
+- **Docs — Diátaxis Reference pass: pure lookup pages, code-verified (docs redesign 5/8):** Third content task in the [Diátaxis](https://diataxis.fr/) docs rewrite. Five lookup-oriented pages now land in `docs/` as published Diátaxis reference pages, each authored greenfield from the TypeScript/Bash source plus `docs/architecture.md` first and only then reconciled against its `docs/_legacy/` copy (per the anti-bias protocol in `.jaiph/skills/documentation-writer/SKILL.md`). Each page is information-oriented and table-driven — exhaustive, neutral, no second-person tutorial prose and no how-to recipes (the *how* belongs to the How-to quadrant from task 4 and the *why* belongs to the Explanation quadrant from task 3): `docs/cli.md` (permalink `/reference/cli`, `redirect_from: /cli`, `/cli.md`) — the authoritative inventory of `jaiph` invocation forms (`jaiph`, `jaiph --help`, `jaiph --version`, file-shorthand routing of `*.test.jh` → `jaiph test` / other `*.jh` → `jaiph run`, unknown-command stderr text + exit `1`, the internal `__workflow-runner` marker that is excluded from help/usage), every subcommand (`run`, `test`, `compile`, `format`, `init`, `install`, `use`) with its full flag table and exit behaviour, the progress-marker glyphs (`▸ ✓ ✗ ℹ ! ·` plus the `₁ ₂ …` subscript prefix for `run async` branches), the credential pre-flight skip-on-`--raw` rule, the non-TTY heartbeat env-var pair (`JAIPH_NON_TTY_HEARTBEAT_FIRST_SEC` / `JAIPH_NON_TTY_HEARTBEAT_INTERVAL_MS`), the `__JAIPH_EVENT__`-on-stderr live contract, the `.jaiph/runs/<date>/<time>-<source>/` durable layout, and the `run_summary.jsonl` event types (`WORKFLOW_START` / `WORKFLOW_END` / `STEP_START` / `STEP_END` / `LOG` / `LOGERR` / `INBOX_*` / `PROMPT_START` / `PROMPT_END`); `docs/configuration.md` (permalink `/reference/configuration`, `redirect_from: /configuration`, `/configuration.md`) — the authoritative key inventory: every `agent.*` / `run.*` / `module.*` / `runtime.*` key with its value type, default, environment-variable equivalent, and notes (`agent.default_model`, `agent.command`, `agent.backend`, `agent.trusted_workspace`, `agent.cursor_flags`, `agent.claude_flags`, `run.logs_dir`, `run.debug`, `run.recover_limit`, `module.name`/`version`/`description`, `runtime.docker_image`/`network`/`docker_timeout_seconds`), the precedence ladder (env > workflow-level > module-level > defaults; runtime-level Docker on/off is env-only — in-file `runtime.docker_enabled` is `E_PARSE`), the `${NAME}_LOCKED=1` mechanism (locked names: `JAIPH_AGENT_BACKEND/MODEL/COMMAND/TRUSTED_WORKSPACE/CURSOR_FLAGS/CLAUDE_FLAGS`, `JAIPH_RUNS_DIR`, `JAIPH_DEBUG`), the scoping table across nested calls (root entry / same-module `run` / cross-module `run` / same-module `ensure` / cross-module `ensure`), the credential pre-flight matrix per backend (`cursor`, `claude`, `codex`), the model-resolution order (explicit → flags → backend-default with the special Claude `--model` injection), and the prompt-retry backoff schedule with `JAIPH_PROMPT_RETRY` / `JAIPH_PROMPT_RETRY_DELAYS` overrides; `docs/grammar.md` (permalink `/reference/grammar`, `redirect_from: /grammar`, `/grammar.md`) — the authoritative syntactic reference: lexical rules (identifier shape, comment / blank-line / shebang handling, single-line `"…"` vs triple-quoted `"""…"""`, backtick vs fenced script bodies, required-parentheses rule), top-level EBNF (`file = { top_level }`, the `import` / `import script` / `channel` / `env_decl` / `rule` / `script` / `workflow` productions), the formatter hoist ordering (`import` → `config` → `channel`, other top-level definitions keep source order), the per-statement EBNF (`run_stmt` / `run_catch_stmt` / `run_recover_stmt` / `run_async_stmt` / `ensure_stmt` / `prompt_stmt` / `const_decl_step` / `return_stmt` / `send_stmt` / `match_stmt` / `if_stmt` / `for_lines_stmt`), the inline-script form (`scripts/__inline_<12-hex>` deterministic emission), the typed-prompt `returns "{ field: type, … }"` flat schema rules, the validation catalog (`E_PARSE` / `E_SCHEMA` / `E_VALIDATE` / `E_IMPORT_NOT_FOUND` with each trigger), and the build-artifact table (only per-`script` files emit; workflows/rules/prompts/channels/control flow are interpreted from the AST); `docs/language.md` (permalink `/reference/language`, `redirect_from: /language`, `/language.md`) — the per-step reference: the eight `WorkflowStepDef` variants (`exec`, `const`, `return`, `send`, `say`, `if`, `for_lines`, `trivia`), the eight `Expr` kinds (`literal`, `call`, `ensure_call`, `inline_script`, `prompt`, `match`, `shell`, `bare_ref`), each step's allowed positions and capture rules (workflow callees yield explicit `return`; named/inline scripts yield trimmed stdout; rule `ensure` yields explicit `return`), `run async` resolution semantics (eager start / lazy resolve, the implicit join at end-of-step-list, passthrough vs resolving reads, the `recover` / `catch` interaction), the rule-scope restriction table (`prompt` / `send` / `run async` / `run` to workflow / raw shell are all forbidden in rules), the subprocess-environment contract (runner `process.env` augmented with `JAIPH_WORKSPACE` / `JAIPH_SCRIPTS` / `JAIPH_RUN_DIR` / `JAIPH_ARTIFACTS_DIR` / `JAIPH_RUN_ID` / `JAIPH_RUN_SUMMARY_FILE` plus `JAIPH_AGENT_*` and config-derived keys; module `const` values **not** auto-exported), the step-output contract (status / capture / logs per step type), and the `JAIPH_RECURSION_DEPTH_LIMIT` runtime cap (default `256`); `docs/env-vars.md` (permalink `/reference/env-vars`, `redirect_from: /env-vars`, `/env-vars.md`, NEW page) — a consolidated environment-variable inventory absorbing the sandboxing config/failure-mode tables explicitly excluded from the task-3 explanation page. Three tables: (1) every `JAIPH_*` name read in `src/` (`JAIPH_AGENT_*` / `JAIPH_DOCKER_*` / `JAIPH_INPLACE` / `JAIPH_INPLACE_YES` / `JAIPH_RUNS_DIR` / `JAIPH_RUN_DIR` / `JAIPH_RUN_ID` / `JAIPH_RUN_SUMMARY_FILE` / `JAIPH_ARTIFACTS_DIR` / `JAIPH_SCRIPTS` / `JAIPH_SOURCE_FILE` / `JAIPH_SOURCE_ABS` / `JAIPH_META_FILE` / `JAIPH_MODULE_GRAPH_FILE` / `JAIPH_WORKSPACE` / `JAIPH_TEST_MODE` / `JAIPH_MOCK_*_JSON` / `JAIPH_INBOX_MAX_DISPATCH` / `JAIPH_INBOX_PARALLEL` / `JAIPH_NON_TTY_HEARTBEAT_*` / `JAIPH_CODEX_API_URL` / `JAIPH_PROMPT_RETRY` / `JAIPH_PROMPT_RETRY_DELAYS` / `JAIPH_PROMPT_FINAL_FILE` / `JAIPH_INSTALL_COMMAND` / `JAIPH_REGISTRY` / `JAIPH_SKILL_PATH` / `JAIPH_DEBUG` / `JAIPH_UNSAFE` plus the `*_LOCKED` lock-flags and the stripped-on-launch deprecated names `JAIPH_LIB` / `JAIPH_STDLIB` / `JAIPH_PRECEDING_FILES`) with scope (`host` / `runtime` / `internal`), type, default, related config key, and role columns — the table is delimited by `<!-- begin: src-parity -->` / `<!-- end: src-parity -->` HTML markers so the docs-lint harness can pin it bidirectionally against `src/`; (2) the agent-credential matrix (`ANTHROPIC_API_KEY` / `CLAUDE_CODE_OAUTH_TOKEN` / `CURSOR_API_KEY` / `OPENAI_API_KEY`) with host vs Docker behaviour and the `JAIPH_*` / `ANTHROPIC_*` / `CLAUDE_*` / `CURSOR_*` Docker-forwarding allowlist; (3) the installer / `jaiph use` variables (`JAIPH_REPO_REF` / `JAIPH_BIN_DIR` / `JAIPH_RELEASE_BASE_URL` / `JAIPH_REPO_URL`) — host-shell consumers, **not** read from `src/`, so they sit outside the parity-pinned block; plus the consolidated Docker-failure-mode table (`E_DOCKER_NOT_FOUND` / `E_DOCKER_PULL` / `E_DOCKER_NO_JAIPH` / `E_DOCKER_RUNS_DIR` / `E_DOCKER_OVERLAY` / `E_DOCKER_TIMEOUT` / `E_DOCKER_UID` / `E_DOCKER_SANDBOX_COPY` / `E_DOCKER_INPLACE_NO_CONFIRM` / `E_FLAG_CONFLICT` / `E_CLI_SETUP` / `E_VALIDATE_MOUNT` / `E_TIMEOUT` / `E_AGENT_CREDENTIALS`) with trigger and behaviour columns. Each new page declares `diataxis: reference` and the matching `permalink: /reference/<slug>` in its front-matter, picks up `redirect_from:` entries for its retired permalink (`/cli`, `/configuration`, `/grammar`, `/language`, `/env-vars`) plus the `<slug>.md` form, and links inward to other reference pages and to the relevant How-to / Explanation pages for `Related` reading (with no manual "More Documentation" block — nav is provided by `docs/_layouts/docs.html`). The Jekyll nav in `docs/_layouts/docs.html` gains a new **Reference** group with one entry per page (`/reference/cli`, `/reference/configuration`, `/reference/grammar`, `/reference/language`, `/reference/env-vars`) sitting between the existing How-to quadrant and the Agent Skill contributor link; final IA regrouping still happens in task 7. `docs/architecture.md` is tightened only at the link surface: `/language`, `/grammar`, `/cli`, and `/configuration` are removed from its `redirect_from:` list because those slugs are now absorbed by the new live reference pages' own `redirect_from:`. The legacy quarantine list in `integration/docs-legacy-quarantine.test.ts` graduates `cli.md`, `configuration.md`, `grammar.md`, and `language.md` from `QUARANTINED_PAGES` to `RECREATED_WITH_LEGACY` (env-vars.md is genuinely new — no legacy predecessor — and is not listed in either bucket). A new integration test `integration/docs-reference-task5.test.ts` (Node `--test`, auto-picked up by `npm test`) graders this task end-to-end as four checks: (1) each of the five pages declares `diataxis: reference` and the expected `permalink: /reference/<slug>`; (2) every reference permalink is reachable from the nav exactly once; (3) the env-var reference is source-parity-pinned against `src/` — every `JAIPH_*` name read via `env.JAIPH_*` / `process.env.JAIPH_*` / `process.env["JAIPH_*"]` in `src/` appears between the `<!-- begin: src-parity -->` markers, and no name appears between the markers that is absent from `src/` (drift in either direction fails the test); (4) reference pages contain no tutorial-shaped numbered `## N.` / `### N.` section headings, no `## Verification` / `## Verify` terminal section, no second-person imperative leads (`You will…`, `Now you…`, `Next, you…`), and at most 12 second-person pronouns total (heuristic upper bound against drift back into open-ended prose). With this task in, three of the four Diátaxis quadrants are now live (Explanation from task 3, How-to from task 4, Reference here); the two Tutorials (`first-workflow`, `first-agent-run`) land as task 6, the final IA / nav regrouping is task 7, and contributor pages plus the README/landing sweep are task 8. No runtime, CLI, or language behavior changes.
+- **Docs — Diátaxis How-to pass: task-oriented recipes (docs redesign 4/8):** Second content task in the [Diátaxis](https://diataxis.fr/) docs rewrite. Eight problem-oriented recipes now land in `docs/` as published Diátaxis how-to pages, each authored greenfield from the TypeScript/Bash source plus `docs/architecture.md` first and only then reconciled against its `docs/_legacy/` copy (per the anti-bias protocol in `.jaiph/skills/documentation-writer/SKILL.md`). Each recipe is shaped goal → prerequisites → numbered steps → `Verification` → `Related`, with no conceptual digressions (the *why* belongs to the Explanation quadrant from task 3 and the *what-it-is* belongs to Reference in task 5): `docs/setup.md` (permalink `/how-to/install`, `redirect_from: /setup`) — install the standalone binary via `curl -fsSL https://jaiph.org/install | bash` (downloads the matching `jaiph-{darwin|linux}-{arm64|x64}` plus `SHA256SUMS` from the current stable Release, verifies the checksum, installs to `~/.local/bin/jaiph`, with `JAIPH_BIN_DIR` overriding the install dir), the npm alternative for Node-on-the-host setups, the `jaiph use <ref>` switch (`JAIPH_REPO_REF` + `JAIPH_INSTALL_COMMAND` overrides for forks/offline mirrors), and `jaiph --version` as the verification step; `docs/sandbox-run.md` (permalink `/how-to/sandbox-run`, no retired slug) — the enabling steps that were explicitly out of scope for the task-3 sandboxing explanation: `jaiph run ./flow.jh` is Docker-on by default, overlay mode picks itself when `/dev/fuse` exists on the host and copy mode otherwise (or under `JAIPH_DOCKER_NO_OVERLAY=1`), `--inplace` / `JAIPH_INPLACE=1` opts into live host edits and triggers the per-git-state confirmation prompt (default-no on empty input or EOF), `-y` / `--yes` / `JAIPH_INPLACE_YES=1` skips the prompt in non-TTY environments (without one of these the run aborts with `E_DOCKER_INPLACE_NO_CONFIRM`), `--unsafe` disables Docker entirely, and `--unsafe` + `--inplace` is rejected with `E_FLAG_CONFLICT`. The verification step grounds the recipe in the exact CLI banner lines (`Docker sandbox, fusefs` / `Docker sandbox, tmp workspace` / `Docker sandbox, in-place (live host edits)`) emitted by `src/cli/run/display.ts`; `docs/agent-auth.md` (permalink `/how-to/agent-auth`, NEW page) — the credential pre-flight implemented in `src/cli/run/preflight-credentials.ts` written up as a recipe per backend: claude needs `ANTHROPIC_API_KEY` *or* `CLAUDE_CODE_OAUTH_TOKEN` (with `claude setup-token` as the documented path for the OAuth token), cursor needs `CURSOR_API_KEY`, codex needs `OPENAI_API_KEY`. The host-vs-Docker matrix is explicit: under Docker, stored CLI logins (`~/.claude` / macOS Keychain / `cursor-agent login`) do **not** cross the container boundary so only the env vars on the host's forwarding allowlist reach the agent — claude and cursor are warn-only on host runs but hard `E_AGENT_CREDENTIALS` errors under Docker, while codex is a hard error on both because it has no CLI-login fallback. The page also covers the two escape hatches the pre-flight observes: `JAIPH_UNSAFE=true` skips the check entirely, and a file that neither declares a backend nor uses any `prompt` step is skipped because there is nothing to credential against. `JAIPH_CODEX_API_URL` is named once as the OpenAI-compatible endpoint override; `docs/configure-backend.md` (permalink `/how-to/configure-backend`, no retired slug) — how-to slice of the legacy `configuration.md`: module-level `config { agent.backend = "claude" / agent.default_model = "sonnet-4" }`, the workflow-level `config { … }` override (must be the first non-comment construct, only `agent.*` and `run.*` allowed at workflow scope — `runtime.*` is module-only), and the `JAIPH_AGENT_BACKEND` / `JAIPH_AGENT_MODEL` env overrides that win over both (the CLI marks `JAIPH_AGENT_BACKEND_LOCKED=1` for the run so in-file overrides cannot silently take effect later). The verification step is a copy-paste `jq -c 'select(.type=="PROMPT_START")' .jaiph/runs/<date>/<time>-<entry>/run_summary.jsonl` so the reader can confirm the resolved backend, model, and `model_reason`; `docs/hooks.md` (permalink `/how-to/hooks`, `redirect_from: /hooks`) — recipe form of the legacy hooks page: the two config locations (`~/.jaiph/hooks.json` global, `<workspace>/.jaiph/hooks.json` project, project overrides global per event), the exact four supported events (`workflow_start` / `workflow_end` / `step_start` / `step_end`), the schema (object → event-name → array of shell commands), the fire-and-forget execution model (`sh -c '<command>'` with the JSON payload on stdin, stdout discarded, stderr copied to CLI stderr, failures never change the workflow exit code), the commands hooks do NOT fire for (`jaiph test`, `jaiph compile`, `jaiph format`, `jaiph init`, `jaiph install`, `jaiph use`, `jaiph run --raw`), and the no-op `{"workflow_end": ["true"]}` pattern for disabling a global hook per project. The page anchors the full payload shape to `HookPayload` / `HookEventName` in `src/types.ts` rather than republishing the schema; `docs/libraries.md` (permalink `/how-to/libraries`, `redirect_from: /libraries`) — split into Part A (use) and Part B (publish). Part A covers all four input shapes of `jaiph install` (registry name, registry name `@version`, git URL, git URL `@ref`), the regex that decides registry-vs-URL (`/^[A-Za-z0-9_-]+(@…)?$/` with no `/` and no `:`), the clone destination `<workspace>/.jaiph/libs/<lib-name>/` with the nested `.git` directory stripped, the `.jaiph/libs.lock` lockfile recording the resolved URL, version, and 40-char commit, and the bare `jaiph install` restore-from-lock path (registry never read). Part B covers the publishing model — public git repo with top-level `.jh` modules, the import-prefix-from-clone-name rule, the `export` surface, git tag releases, and the optional `jaiph.org/registry` PR. The verification rejection message is reproduced verbatim from source (`lib "<name>" contains no .jh modules — not a jaiph library?`) so the reader can grep an actual error back to this page; `docs/artifacts.md` (permalink `/how-to/artifacts`, `redirect_from: /artifacts`) — recipe form of the legacy artifacts page: `import "jaiphlang/artifacts" as artifacts` followed by `artifacts.save("./path/to/file")` (single path) or `artifacts.save(newline_separated_list)` (multiple paths, blank lines ignored, returned value is a newline-separated list of absolute destinations), the `./`-prefix-stripped / absolute-paths-flattened-to-basename copy semantics, and the lower-level `script` step alternative writing directly to `$JAIPH_ARTIFACTS_DIR`. The page also names the sibling env vars the runtime always sets (`JAIPH_RUN_DIR`, `JAIPH_RUN_SUMMARY_FILE`, `JAIPH_RUN_ID`) and the three failure modes of `artifacts.save(...)` (empty list after trim / missing source / `JAIPH_ARTIFACTS_DIR` unset) so the reader knows where to wrap the call in `recover` / `catch`; `docs/testing.md` (permalink `/how-to/testing`, `redirect_from: /testing`) — how-to slice of the legacy testing page: write `*.test.jh` files with `import "./under-test.jh" as w` + `test "..." { … }` blocks, queue mock prompt responses (`mock prompt "..."` consumed FIFO, one per `prompt` call; bare-identifier form refers to test-block `const`), the pattern form (`mock prompt { /re/ => "...", _ => "..." }`, mutually exclusive with the queue form in the same test block), `mock workflow` / `mock rule` / `mock script` body-stubs (parentheses required), the `run w.default()` / `run w.default("arg")` / `run … allow_failure` capture forms, the `expect_contain` / `expect_not_contain` / `expect_equal` assertions, and the `jaiph test` discovery rules (`*.test.jh` recursive, zero-matches prints `jaiph test: no *.test.jh files found (nothing to do)` and exits 0, single-file path shorthand). Each new page declares `diataxis: how-to` and the matching `permalink:` in its front-matter, picks up `redirect_from:` entries for any retired permalink the legacy page held (`/hooks`, `/libraries`, `/artifacts`, `/setup`, `/testing`), and links inward to `architecture.md` / `sandboxing.md` / `/how-to/agent-auth` / `/how-to/sandbox-run` for `Related` reading (with no manual "More Documentation" block — nav is provided by `docs/_layouts/docs.html`). The Jekyll nav in `docs/_layouts/docs.html` gains a new **How-to** group with one entry per recipe (`/how-to/install`, `/how-to/sandbox-run`, `/how-to/agent-auth`, `/how-to/configure-backend`, `/how-to/hooks`, `/how-to/libraries`, `/how-to/artifacts`, `/how-to/testing`) sitting between the existing Explanation quadrant (Why Jaiph / Architecture / Sandboxing / Inbox & Dispatch / Async Handles) and the Agent Skill contributor link; final IA regrouping still happens in task 7. `docs/architecture.md` is tightened only at the link surface: `/setup`, `/libraries`, `/artifacts`, `/testing`, and `/hooks` are removed from its `redirect_from:` list because those slugs are now absorbed by the new live how-to pages' own `redirect_from:`. The legacy quarantine list in `integration/docs-legacy-quarantine.test.ts` graduates `artifacts.md`, `hooks.md`, `libraries.md`, `setup.md`, and `testing.md` from `QUARANTINED_PAGES` to `RECREATED_WITH_LEGACY`, the redirect-stub probe is repointed from `/hooks` (no longer quarantined) to `/getting-started` (still quarantined; replacement tutorial lands in task 6), and the internal-link check is upgraded to resolve nav entries against each docs/*.md front-matter `permalink:` rather than path-from-slug — so a how-to at `docs/setup.md` with permalink `/how-to/install` now resolves cleanly. A new integration test `integration/docs-how-to-task4.test.ts` (Node `--test`, auto-picked up by `npm test`) graders this task end-to-end as five checks: (1) each of the eight pages declares `diataxis: how-to` and the expected `permalink: /how-to/<slug>`; (2) every retired permalink is absorbed by the new how-to page's `redirect_from:` (so external links to `/hooks`, `/libraries`, `/artifacts`, `/setup`, `/testing` keep resolving via `jekyll-redirect-from`); (3) every how-to permalink is reachable from the nav exactly once; (4) `docs/agent-auth.md` contains the literal credential names checked by `src/cli/run/preflight-credentials.ts` (`ANTHROPIC_API_KEY`, `CLAUDE_CODE_OAUTH_TOKEN`, `CURSOR_API_KEY`, `OPENAI_API_KEY`), the stable error code (`E_AGENT_CREDENTIALS`), and the `claude setup-token` instruction — so a user who hits the error in their terminal can grep for the literal and land on this page; (5) every how-to page stays recipe-shaped (at least one numbered `## N.` / `### N.` step heading plus a `## Verification` or `## Verify` section), guarding against future drift back into open-ended prose without a verifiable conclusion. With this task in, two of the four Diátaxis quadrants are now live (Explanation from task 3 plus How-to here); Reference lands next as task 5 (`cli`, `configuration`, `grammar`, `language`, env-vars), and the two Tutorials (`first-workflow`, `first-agent-run`) land as task 6. No runtime, CLI, or language behavior changes.
+- **Docs — Diátaxis Explanation pass: concentrate understanding-oriented pages (docs redesign 3/8):** First content task in the [Diátaxis](https://diataxis.fr/) docs rewrite. Four understanding-oriented pages now land in `docs/` as published Diátaxis explanation pages, each authored greenfield from the TypeScript/Bash source plus `docs/architecture.md` first and only then reconciled against its `docs/_legacy/` copy (per the anti-bias protocol in `.jaiph/skills/documentation-writer/SKILL.md`): `docs/why-jaiph.md` (permalink `/why-jaiph`) — short design/philosophy page that explains the orchestration-as-language framing, the four primitives (`rule` / `script` / `prompt` / `workflow`), the three commitments (strict structure around AI steps, sandbox by default, no vendor lock-in), and the deliberate non-goals; `docs/sandboxing.md` (permalink `/sandboxing`) — the sandboxing *model*: the two layers (compile-time `rule` validation vs runtime Docker isolation), the three workspace-presentation modes (overlay, copy, inplace), and an explicit threat model split into "what Docker protects against" (filesystem reach, process isolation, mount safety, env exposure, shell injection safety) and "what Docker does **not** protect against" (default-on network egress, forwarded agent credentials, hooks running on the host, image supply chain, container-escape limits, inplace's opt-out). The enabling procedure and the full `runtime.docker_*` config-key reference are explicitly **out of scope** for this page — they belong to the How-to (task 4) and Reference (task 5); `docs/inbox.md` (permalink `/inbox`) — the channels *model*: drain-driven delivery (not file-watched), routes-on-the-channel-not-on-workflows, sequential dispatch as the only mode, the routed-vs-unrouted distinction, and the three-parameter trigger contract; `docs/spec-async-handles.md` (permalink `/spec-async-handles`) — the `Handle<T>` *value model*: eager start / lazy resolve, passthrough vs resolving reads (and the `for_lines` exception), the implicit join at the end of every step list, how `recover` / `catch` compose on `run async` statement form, and why there is no `await` keyword. Each new page declares `diataxis: explanation` and the matching `permalink:` in its front-matter, picks up `redirect_from: /<slug>.md` where the legacy slug differs, and links inward to `architecture.md` / `language.md` / `grammar.md` for implementation and surface-syntax details (with no manual "More Documentation" block — nav is provided by `docs/_layouts/docs.html`). `docs/architecture.md` stays live and is tightened only at the link surface: `/sandboxing`, `/inbox`, and `/spec-async-handles` are removed from its `redirect_from:` list because those slugs are now owned by the new live pages, and three transitional `…#docker-container-isolation` deep links are simplified to bare `sandboxing.md` links since the new explanation page does not republish the old anchor. The Jekyll nav in `docs/_layouts/docs.html` adds four entries (Why Jaiph, Sandboxing, Inbox & Dispatch, Async Handles) alongside the existing Architecture / Agent Skill links so all four published explanation pages plus the contributor skill are reachable; the final IA regrouping happens in task 7. A new integration test `integration/docs-explanation-task3.test.ts` (Node `--test`, auto-picked up by `npm test`) graders this task end-to-end as five checks: (1) each of the four pages declares `diataxis: explanation` and the expected permalink; (2) the nav links to each new permalink exactly once; (3) `sandboxing.md` contains real threat-model content — both the `What Docker protects against` and `What Docker does **not** protect against` headings, plus concrete claims about dropped capabilities, the env-var allowlist, hooks-on-host, and default-on network egress; (4) `sandboxing.md` has no `Enabling Docker` heading and no numbered enabling procedure under any `enabl*` heading (those move to a how-to in task 4); (5) `sandboxing.md` has no `| Key | …` reference table, no row keyed by ``runtime.docker_*``, and no `Configuration keys` / `Failure modes` heading (reference content lives in task 5). The legacy-quarantine harness `integration/docs-legacy-quarantine.test.ts` is updated in the same step to model the new "recreated-with-legacy-reference" state: `inbox.md`, `sandboxing.md`, and `spec-async-handles.md` move from the `QUARANTINED_PAGES` list to a new `RECREATED_WITH_LEGACY` list (a live page exists at `docs/<name>.md` and the legacy copy stays at `docs/_legacy/<name>.md` for reconciliation), and the publish-side leak check switches its canonical quarantined probe from `/sandboxing` to `/hooks` (which is still quarantined and is now asserted to exist as a redirect stub but never as page content). The structure harness `integration/docs-structure.test.ts` loosens the "legacy pages exempt" assertion to permit a live counterpart at `docs/<name>.md` (the recreated case), since the live + legacy invariant is pinned by the legacy-quarantine harness above. README.md is updated to surface the four new explanation pages in the top-line link bar and in the "Docs note" callout, and to drop `inbox`, `sandboxing`, `spec-async-handles` from the legacy index (the still-quarantined slugs — Getting Started, Setup, Libraries, Language, Grammar, CLI, Configuration, Testing, Hooks, Runtime artifacts, Contributing — stay listed). The Safety-and-inspectability bullet repoints its `Sandboxing` link from `docs/_legacy/sandboxing.md` to `docs/sandboxing.md`. `docs/index.html` is unchanged: its in-site links already use bare relative slugs (`href="inbox"`, `href="sandboxing"`) which now resolve to the live explanation pages instead of bouncing through `architecture.md`'s `redirect_from`. No runtime, CLI, or language behavior changes.
+- **Docs — Diátaxis foundation: front-matter convention + machine-checkable docs-lint harness (docs redesign 2/8):** Lays the backbone the remaining tasks of the [Diátaxis](https://diataxis.fr/) docs redesign (3–8) are graded against. A new front-matter key **`diataxis:`** is defined for every published `docs/*.md` page, valued `tutorial | how-to | reference | explanation | contributor` (the five quadrants of the vendored `.jaiph/skills/documentation-writer/SKILL.md` plus a `contributor` bucket for in-repo contributor docs that fall outside the four user-facing quadrants). The two currently live pages declare their type: `docs/architecture.md` → `diataxis: explanation`, `docs/jaiph-skill.md` → `diataxis: contributor`. A new integration test `integration/docs-structure.test.ts` (Node `--test`, picked up automatically by `npm test` through the existing `find dist/integration -name '*.test.js'` glob in `package.json` — no script change required) wires this into CI as six docs-lint checks: (1) every published `docs/*.md` must carry a valid `diataxis:` value from the allowed set; (2) every `<a href="{{ '/foo' | relative_url }}">` entry in `docs/_layouts/docs.html` must correspond to a published page whose `permalink:` matches; (3) every published page must be linked from nav **exactly once** (catches both dangling nav entries and missing ones); (4) every internal Markdown link, `permalink:`, and `redirect_from:` value must resolve to a known route (a published `permalink:` or a `redirect_from:` alias), and any `#anchor` on a link to a live page must match a heading slug in that page (kramdown / GFM heading slug rules, with kramdown `{:#explicit-id}` / `{: #id}` IALs honored); and (5) every historical nav permalink mined from `git log -p --all -- docs/_layouts/docs.html` must still resolve via a current page or a `redirect_from:` alias — this is the **redirect-coverage** check that prevents removing a page or renaming a permalink without a stub. A sixth test pins the legacy-quarantine boundary by asserting that `docs/_legacy/*.md` are **exempt** from all of the above (they are read from a sibling directory, never enumerated as published pages) and that none of the quarantined filenames also appear at `docs/<name>.md`. Pages excluded from publishing by `docs/_config.yml` (the `_legacy` entry) are likewise outside the lint scope, which keeps the historical pre-redesign prose in git without making it count as "published". Because tasks 3–8 will replace the historical permalinks (`/getting-started`, `/setup`, `/libraries`, `/artifacts`, `/language`, `/grammar`, `/cli`, `/configuration`, `/testing`, `/spec-async-handles`, `/spec-async-isolated`, `/target-design`, `/inbox`, `/hooks`, `/sandboxing`, `/reporting`, `/contributing`) gradually, and they would otherwise fail check 5 the moment the page is quarantined, `architecture.md` and `jaiph-skill.md` now declare every one of them under `redirect_from:` so each historical URL routes to a live destination until the new Diátaxis page owns it (architecture.md absorbs the 16 explanation/reference/how-to slugs as its transitional landing target; jaiph-skill.md picks up `/contributing` since contributor docs co-locate there for now). `jekyll-redirect-from` (already declared in `docs/_config.yml`) emits the per-alias meta-refresh stubs at build time so external links keep working; the docs-lint harness only checks the alias→page mapping, not the generated HTML. The Jekyll nav itself (`docs/_layouts/docs.html`) flips the "Agent Skill" entry from the raw GitHub URL to the in-site permalink `{{ '/jaiph-skill' | relative_url }}` now that the page is a first-class published Diátaxis quadrant; the raw GitHub URL stays in `README.md` and `docs/index.html` because those are the entry points agents themselves consume and they need the unrendered Markdown. The legacy-quarantine integration test `integration/docs-legacy-quarantine.test.ts` is loosened in the same step to reflect the new redirect-stub policy: previously it asserted that quarantined slugs (e.g., `/sandboxing`) **must not** appear in `_site/`; it now permits the small meta-refresh stub emitted by `jekyll-redirect-from` and only fails if the original quarantined prose (`Docker container isolation`, `sandbox mount`) leaks into the stub. The embedded `JAIPH_SKILL_MD_BASE64` in `src/runtime/embedded-assets.ts` (the in-binary fallback for `jaiph init`) is regenerated so the embedded copy includes the new `diataxis: contributor` / `redirect_from: /contributing` front-matter; no behavior change, just a re-encoding to match `docs/jaiph-skill.md` byte-for-byte. No runtime, CLI, or language changes; this is the verification harness the next six redesign tasks will be measured against.
+- **Docs — Quarantine pre-redesign pages under `docs/_legacy/` ahead of the Diátaxis rewrite:** The existing 14 flat-mix pages (Tutorial/How-to/Reference/Explanation blended per page) have been **moved verbatim** from `docs/*.md` into `docs/_legacy/*.md` with `git mv` so the redesign (tasks 3–8 of the docs-redesign queue) can be authored greenfield against the source code without paraphrasing or in-place edits of the old prose. `docs/architecture.md` and `docs/jaiph-skill.md` stay at their original paths — `architecture.md` is a declared source of truth read by `.jaiph/docs_parity.jh` and `jaiph-skill.md` is fetched raw by agents via the canonical GitHub URL. `docs/_config.yml` adds `_legacy` to the Jekyll `exclude:` list so the quarantined pages stay in git but are **not published**; `bundle exec jekyll build` no longer emits `_site/_legacy/**` and the old permalinks (`/cli`, `/sandboxing`, `/getting-started`, etc.) did not yet resolve on `jaiph.org` until greenfield replacements added `redirect_from` stubs (tasks 3–7). The docs sidebar in `docs/_layouts/docs.html` is trimmed to only the still-live pages (landing, Architecture, and the raw Agent Skill link) so the built site has no dangling nav entries. `README.md` doc links are repointed at `docs/_legacy/<page>.md` so the GitHub README still resolves until tasks 3–8 rebuild each quadrant; the env-forwarding parity check in `src/runtime/docker.test.ts` now reads `docs/_legacy/sandboxing.md` and asserts the cross-link from `docs/_legacy/configuration.md` and `docs/_legacy/cli.md`. A new integration test (`integration/docs-legacy-quarantine.test.ts`) asserts the move (live pages still present, every quarantined page moved), that no nav entry points at a quarantined permalink, and — when Bundler is available — that `bundle exec jekyll build` exits 0 with no `_site/_legacy/` directory and no `/sandboxing` page generated, while `/architecture` is still built. No runtime, CLI, or language behavior changes; this is purely a docs-site reorganization to prevent agent anchoring during the redesign.
+
+# 0.10.0
+
+## Summary
+
+- Docker sandbox **`inplace` mode** (edits land live on the host while the machine stays isolated) plus `jaiph run` CLI flags `--workspace`, `--inplace`, `--unsafe`, `-y`/`--yes`.
+- Agent reliability: **prompt retry** with escalating backoff, a **fail-fast credential pre-flight** keyed to the backend, and the default sandbox timeout raised to **4 hours**.
+- **`jaiph install`** gains registry name resolution and commit-SHA pinning; new per-platform **standalone release binaries** + installer and a release-prep workflow that single-sources the CLI version.
+- Parser/compiler **simplification refactors**, language features (`else` branches, dot-notation `if`/`match` subjects, `catch`/`recover` on inline-script `run`), and assorted fixes.
+
+## All changes
+
+- **Feat — Fail fast on missing agent credentials with a host-side pre-flight keyed to the entry file's backend(s):** Before this release, only the **codex** backend checked for a credential, and the check happened **at runtime inside the prompt** (`runCodexBackend` in `src/runtime/kernel/prompt.ts`) — the workflow runner spun up, executed steps, and only blew up at the first `prompt`. The `claude` and `cursor` backends had no credential check at all; missing keys surfaced as opaque CLI failures deep inside the runtime, and under Docker the failure mode was worse because interactive CLI logins (`cursor-agent login`, `claude` interactive auth) do not cross the container boundary (fresh `$HOME`, no Keychain). This release adds a **host-side credential pre-flight** in `runWorkflow` (`src/cli/commands/run.ts`) that runs after the module graph + effective config + Docker mode are resolved but **before** the workflow runner or the container is launched (the `--raw` embedded path is intentionally skipped). The pre-flight scans the **entry `.jh` file's** module-level `config` and each of its workflow-level `config` blocks plus the effective default (`JAIPH_AGENT_BACKEND` env, or `cursor` when unset) to collect the distinct backend(s) the run could reach, then evaluates each against the env that will actually arrive at the agent — `runtimeEnv` on host, or the **forwarded allowlisted** env when Docker is on (via `isEnvAllowed`), so a credential present on the host but stripped by the allowlist counts as missing. The per-backend rule is asymmetric to match the login-friendly host story and the strict container story: **codex** requires `OPENAI_API_KEY` and is a hard error on both host and Docker (no CLI-login fallback exists); **claude** requires `ANTHROPIC_API_KEY` **or** `CLAUDE_CODE_OAUTH_TOKEN` (the latter from `claude setup-token`) — Docker is a hard error, host is a warning (a stored Claude CLI login may still work); **cursor** requires `CURSOR_API_KEY` with the same host/Docker split as claude. In **unsafe mode** (`JAIPH_UNSAFE` / `--unsafe`) the pre-flight is skipped entirely — that is the explicit "run on the host, trust my environment" escape hatch, so a stored CLI login is trusted and even the codex hard error defers to the runtime backend guard (covered by `src/cli/run/preflight-credentials.test.ts`). Every error and warning names (a) the backend, (b) the model when `agent.default_model` is set, (c) the **entry `.jh` file path** and the config scope that selected the backend (`module config`, `workflow <name>`, `JAIPH_AGENT_BACKEND env`, or `default`), and (d) the concrete remedy — e.g. ``Run `claude setup-token` and export CLAUDE_CODE_OAUTH_TOKEN, or set ANTHROPIC_API_KEY.`` For Docker runs the message also notes the var must be set on the **host** so it gets forwarded into the container. Hard failures use a stable error code, `E_AGENT_CREDENTIALS`, and exit non-zero with **no runner or container launched**; warnings stream to stderr and the run proceeds. The pre-flight is **silent** when credentials are present (including when only one of claude's two accepted vars is set) and is **skipped entirely** when the entry file neither declares an explicit backend nor uses any `prompt` step — so workflows that do no agent work get no false-positive warning for an unused default backend. The pre-flight runs for **all Docker modes including `inplace`**, and the late codex-only check inside `runCodexBackend` is kept as defense in depth (the pre-flight catches it first with the better message). Deeper per-import-module backend overrides resolved at runtime are out of scope — entry-file scan is the documented contract. New: `src/cli/run/preflight-credentials.ts` and `src/cli/run/preflight-credentials.test.ts`; new E2E `e2e/tests/139_agent_credentials_preflight.sh`; CLI wiring in `src/cli/commands/run.ts` ahead of the Docker check and runner spawn. `e2e/lib/common.sh` now seeds dummy `CURSOR_API_KEY` / `ANTHROPIC_API_KEY` values for the shared E2E context so existing tests using mock agent binaries stay silent under the new warn-only host path (tests that exercise the missing-key contract explicitly unset them via `env -u`). Docs updated in `docs/configuration.md` (new **Credential pre-flight** subsection under **Backend selection** with the per-backend / per-mode rule matrix, the message-content contract, and the `E_AGENT_CREDENTIALS` code; the **Backend selection** intro now names the accepted credentials and CLI-login alternatives per backend; **Codex setup** cross-references the pre-flight), `docs/sandboxing.md` (a new **Credential pre-flight** callout under **Enabling Docker** explains why claude / cursor fail hard under Docker — the CLI login does not cross the container boundary — and that the check uses the post-forwarding env via `isEnvAllowed`), and `docs/cli.md` (the `jaiph run` synopsis gains a **Credential pre-flight** paragraph; the env-var list updates `JAIPH_AGENT_BACKEND` / `OPENAI_API_KEY` with the pre-flight semantics and adds `ANTHROPIC_API_KEY` / `CLAUDE_CODE_OAUTH_TOKEN` / `CURSOR_API_KEY` entries naming the host-warn vs Docker-hard-fail split).
+- **Feat — Retry `prompt` steps on transient transport failure with an escalating backoff schedule:** A backend invocation in `runPromptStep` (`src/runtime/kernel/node-workflow-runtime.ts`) used to surface `result.status !== 0` from `executePrompt` as an immediate step failure, so any rate limit, API outage, network blip, or agent-CLI crash aborted the step (and the workflow, absent `recover` / `catch`). This release adds an **automatic retry loop around the prompt execution** with a fixed escalating backoff: after the initial attempt fails, the runtime waits `15s → 1m → 10m → 30m → 2h` between subsequent attempts and then gives up — five retry delays, **six total attempts**, ~2h41m wall-clock for a full failure run. Only the **transport** path is retried (`result.status !== 0` — spawn failure, non-zero backend exit, codex HTTP error); deterministic post-processing failures in the same function — invalid JSON (`prompt returned invalid JSON`) and schema validation (`prompt response failed schema validation`) — keep returning `{ ok: false }` immediately, because retrying them would just repeat the same parse with the same captured output. Retry composes **below** `recover` / `catch`: backoff is exhausted first, then the failure reaches the enclosing recover loop. Each attempt is a fresh `executePrompt` call with its own `PROMPT_START` / `PROMPT_END` and surrounding `STEP_START` / `STEP_END` pair (live `__JAIPH_EVENT__` and durable `run_summary.jsonl`). Every failed attempt and the final termination emit a `LOGERR` through `RuntimeEventEmitter.emitLog` (the same facility as the `logerr` keyword — live stderr event plus a durable summary line), carrying the attempt number, the backend, a single-line error summary, and — for retries — the human delay before the next attempt (`retrying in 15s`, `retrying in 2h`); the termination line notes that retries are exhausted before the step fails. Logging happens regardless of whether the step is wrapped in `recover` / `catch`. The schedule, sleep, and abort surfaces are all **testable and cancellable**: the new module `src/runtime/kernel/prompt-retry.ts` exports `DEFAULT_PROMPT_RETRY_DELAYS_MS`, `resolvePromptRetryDelays(env)`, `defaultPromptSleep(ms, signal)` (a `setTimeout` that races against an `AbortSignal` and rejects with a `PromptRetryAbortError` on abort), and `formatRetryDelay` / `summarizeError` helpers; `NodeWorkflowRuntime` accepts `sleep` and `promptRetryDelays` constructor options so tests can pass a recording stub and a short delay array to assert the exact sequence with zero real wall-clock wait. The runtime owns an internal `AbortController` and exposes `abort()` / `isAborted()`; aborting clears the pending timer and halts the loop without further `executePrompt` calls. Both knobs are environment-only — there is no in-file key. **`JAIPH_PROMPT_RETRY=0`** disables retry entirely (one attempt, fail on transport failure exactly as before; the sleep is never called). **`JAIPH_PROMPT_RETRY_DELAYS`** is a comma-separated list of non-negative integer milliseconds (e.g. `"500,1000,5000"`) that replaces the default schedule; invalid entries (non-numeric, negative, empty list, trailing junk) abort the prompt with a clear error rather than silently falling back to the default. The validated schedule (or its parse error) is resolved once per run and cached on the runtime so a misconfiguration surfaces the same way for every prompt and is not re-thrown per attempt. `jaiph test` (`src/runtime/kernel/node-test-runner.ts`) defaults `JAIPH_PROMPT_RETRY=0` for every test block so a failing mock prompt (e.g. no matching arm, or no queued response) fails fast instead of waiting through the ~2h41m production schedule; tests that intentionally exercise the retry loop can opt in by setting the variable explicitly. Two test-only orthogonal touch-ups for the same reason: `integration/sample-build/run-prompt-agent.test.ts` (the missing-`claude` pre-flight check) and `src/runtime/kernel/node-workflow-runtime.artifacts.test.ts` (failed-prompt stderr capture) both set `JAIPH_PROMPT_RETRY=0` for their single-attempt failure assertions — neither test belongs to the retry feature, but each would otherwise wait through the default schedule on a non-zero exit. Under Docker, the full default backoff (~2h41m) fits inside the default container timeout (`runtime.docker_timeout_seconds = 14400` = 4h) with thin headroom; the schedule constant in `prompt-retry.ts` carries an inline note pointing at `JAIPH_DOCKER_TIMEOUT` for workflows that need the full retry budget plus their own workload time. Tests in `src/runtime/kernel/prompt-retry.test.ts` cover the env parser (default schedule, disable, custom comma list, every invalid-input variant) and the abort-aware sleep; tests in `src/runtime/kernel/node-workflow-runtime.prompt-retry.test.ts` pin the loop end-to-end with mock backends — exact sleep sequence equals the schedule, six-attempts-then-fail terminates with the final error, mid-loop success short-circuits, recover/catch composes below retry, invalid-JSON / schema failures are not retried (one call, sleep never invoked), `JAIPH_PROMPT_RETRY=0` produces a single attempt, custom delays are honored, invalid delays surface as a step error with a `LOGERR`, and `runtime.abort()` during a pending backoff exits without a further `executePrompt` call. Docs updated in `docs/configuration.md` (new **Prompt retry on transport failure** subsection under **Backend selection** documenting the default schedule, what is and is not retried, per-attempt eventing, logging, cancellation, both env knobs, and the `jaiph test` default; the env-only table at the end of the page lists `JAIPH_PROMPT_RETRY` and `JAIPH_PROMPT_RETRY_DELAYS`), `docs/cli.md` (the **Agent and prompt configuration** env-var list gains both names with the default schedule and the `jaiph test` carve-out), `docs/architecture.md` (the **Node Workflow Runtime** bullet documents the transport-failure retry, the injectable sleep and abort seams, and the compose-below-`recover` ordering), `docs/testing.md` (the harness env-var table lists the default `JAIPH_PROMPT_RETRY=0` and the parent-env opt-out for retry-exercising tests), and `docs/sandboxing.md` (the **Timeout** paragraph gains a note that a full default backoff fits inside the default container timeout with thin headroom and points at the configuration knobs for raising it or shortening the schedule).
+- **Feat — `jaiph run` flags `--workspace`, `--inplace`, `--unsafe`, `-y` / `--yes` as CLI front-ends for the sandbox env switches:** Sandbox/runtime selection has historically been configured purely by env vars — `JAIPH_UNSAFE=true` turns Docker off entirely (read in `resolveDockerConfig` in `src/runtime/docker.ts`), `JAIPH_INPLACE=1`/`true` opts into the in-place sandbox mode (read in `selectSandboxMode`), and `JAIPH_INPLACE_YES=1` auto-confirms the in-place destructive-edit prompt — with no CLI surface. Workspace root was likewise auto-detected only: `runWorkflow` in `src/cli/commands/run.ts` called `detectWorkspaceRoot(dirname(inputAbs))` with no override path (while the sibling `jaiph compile` already exposed a `--workspace <dir>` flag). This task gives `jaiph run` a first-class CLI surface for those four switches so users do not have to set env vars for one-off runs, while keeping env vars working unchanged. `parseArgs` in `src/cli/shared/usage.ts` (and its exported `ParsedArgs` type) now also recognizes `--workspace <dir>` (requires a value; missing value throws `--workspace requires a directory path`, matching the existing `--target` style), `--inplace`, `--unsafe`, and `--yes` / `-y` — all four stop at `--` exactly like the existing flags, so `run --inplace -- --inplace` parses as `inplace:true` plus the literal `--inplace` in `positional`. `runWorkflow` resolves the workspace via `workspace ? resolve(workspace) : detectWorkspaceRoot(dirname(inputAbs))` (explicit path wins; the path must exist and be a directory or the run fails with `--workspace path does not exist: <path>` / `--workspace path is not a directory: <path>` before any container starts) and threads the three boolean flags through a new helper `applySandboxFlags(env, flags)` in `src/cli/run/env.ts` that **mutates the local runtime env map only** — never `process.env`, which would leak flag choices into every child process globally — setting `JAIPH_INPLACE=1` / `JAIPH_UNSAFE=true` / `JAIPH_INPLACE_YES=1` on for the duration of one run. The mutation happens right after `resolveRuntimeEnv` (which already returns a fresh spread of `process.env`) and **before** `resolveDockerConfig` / `selectSandboxMode` consume the env — i.e. the env layer remains the **single source of truth** for sandbox mode and there is no parameter threading through `spawnDockerProcess` / `buildDockerArgs` or duplication of the mode-selection logic. Flag and env agree on enablement (both paths just turn the env var ON), so setting only the env var still works (regression-tested) and setting both flag and env is not an error. The two contradictory enabling paths — `--inplace` (sandbox on, workspace mounted rw) and `--unsafe` (sandbox off entirely) — fail fast inside `applySandboxFlags` with a new `E_FLAG_CONFLICT` error (the same check catches the mixed `--inplace + JAIPH_UNSAFE=true` and `--unsafe + JAIPH_INPLACE=1` cases) before any container is launched. The new flags are an **intentional ergonomic asymmetry**: they only affect `jaiph run`, while the corresponding env vars still influence other entry points (e.g. `jaiph test`) — documented in both `printUsage` and the per-command `RUN_USAGE`, plus an explicit `Note:` line in both. A new `--workspace` *env* equivalent is **out of scope**: the name `JAIPH_WORKSPACE` is already taken as the in-container remap **output** in `remapDockerEnv` and is not repurposed as an input. The raw `--raw` code path (`runWorkflowRaw`) accepts the same flags via a `sandboxFlags` parameter so the env normalization runs there too. `printUsage` in `src/cli/shared/usage.ts` and `RUN_USAGE` in `src/cli/commands/run.ts` both list the four new options under `jaiph run` with at least one example (`jaiph run --inplace --workspace ./app ./flows/fix.jh`). New tests in `src/cli/shared/usage.test.ts` pin the parser contract (each new field returned correctly, `--workspace` value-required error, post-`--` routing unchanged, regression for `--target` / `--raw` / `--`), `src/cli/run/sandbox-flags.test.ts` pins the env-normalization contract (each flag sets the matching env var; flag-only is sufficient for `selectSandboxMode === "inplace"` and `resolveDockerConfig().enabled === false`; flag and env agree; `E_FLAG_CONFLICT` thrown for the mixed cases), and `src/cli/commands/run.test.ts` pins the end-to-end behavior (missing `--workspace` value error, non-existent / non-directory `--workspace` errors, `--inplace --unsafe` fails before launching any container, `--yes` skips the in-place prompt). Docs updated in `docs/cli.md` (the `jaiph run` synopsis and **Flags** section list the four new options with the env-var equivalence noted on each, an explicit asymmetry note about `jaiph test`, and a new example; the env-var entries for `JAIPH_UNSAFE`, `JAIPH_INPLACE`, and `JAIPH_INPLACE_YES` now cross-reference the matching CLI front-end) and `docs/sandboxing.md` (the **Enabling Docker** section gains a top-of-section pointer at the new CLI flags; the **Inplace mode** *Enabling* and *Skipping the prompt* bullets name `--inplace` / `-y` / `--yes` as alternatives to the env vars; the **Failure modes** table gains an `E_FLAG_CONFLICT` row for the contradictory-flag case).
+- **Fix — `jaiph run` accepts the `--flag=value` form, not just `--flag value`:** `parseArgs` in `src/cli/shared/usage.ts` matched flags by exact token, so `--workspace=/path` (and `--target=/path`) fell through to `positional` and was misread as the workflow file / an argument — the symptom being a path that looked like it "lost" everything after the `=`. Long options are now split on the **first** `=` (so values may themselves contain `=`), accepting both `--flag value` and `--flag=value` for the value-taking flags (`--target`, `--workspace`); boolean flags (`--raw`, `--inplace`, `--unsafe`, `--yes`) reject an `=value` form with a clear `<flag> does not take a value` error, and `--workspace=` with an empty value still errors. `--` passthrough is unchanged (a `--flag=value` token after `--` stays a literal workflow arg). New regression tests in `src/cli/shared/usage.test.ts`.
+- **Feat — Docker sandbox `inplace` mode: live host edits with the machine still isolated:** Docker sandboxing previously had exactly two modes (`SandboxMode = "overlay" | "copy"` in `src/runtime/docker.ts`), both of which **protect the host workspace from the run** — overlay mounts the workspace read-only and uses `fuse-overlayfs` so edits die with the container; copy clones the workspace and mounts the disposable clone read-write. Neither persists workflow edits to the real checkout. This release adds a **third mode**, `inplace`, for the iterate-on-real-files dev loop: the host workspace is bind-mounted `:rw` directly at `${CONTAINER_WORKSPACE}` so the run's edits land **live on the host**, while the container boundary still prevents access to the rest of the machine (only the workspace + runs dir mounts, `--cap-drop ALL`, `--security-opt no-new-privileges`, and the `JAIPH_*` / `ANTHROPIC_*` / `CURSOR_*` / `CLAUDE_*` env allowlist remain in place). The posture is **"trusted workspace, untrusted machine"** — a different axis from `JAIPH_UNSAFE` (which turns the sandbox off entirely): `JAIPH_INPLACE` keeps the sandbox **on** and only removes workspace isolation, so `resolveDockerConfig`'s `enabled` logic is unchanged. Mode selection is **explicit opt-in only** — `selectSandboxMode(env)` returns `"inplace"` iff `JAIPH_INPLACE` is `1`/`true`, and that opt-in **takes precedence over** both `JAIPH_DOCKER_NO_OVERLAY` and the `/dev/fuse` heuristic; without the env var, overlay/copy selection is byte-for-byte unchanged. `buildDockerArgs` in `inplace` mode bind-mounts `resolve(opts.workspaceRoot)` at `${CONTAINER_WORKSPACE}:rw` via `validateMountHostPath`, omits `overlay-run.sh`, `--device /dev/fuse`, and the overlay-only capability set (`SYS_ADMIN`, `SETUID`, `SETGID`, `CHOWN`, `DAC_READ_SEARCH`, `apparmor=unconfined`), and on Linux runs as `--user ${hostUid}:${hostGid}` (reusing `_uidDetect.getHostUidGid()` and the existing `E_DOCKER_UID` failure) so files created by the run are owned by the user, not root. `spawnDockerProcess` in `inplace` mode does **not** call `allocateSandboxWorkspaceDir`/`cloneWorkspaceForSandbox` and does not require `sandboxWorkspaceDir`; the `.jaiph/runs` mount (`${CONTAINER_RUN_DIR}:rw`) is still created independently so the nested-under-workspace case keeps working. A new test seam `_dockerSpawn.run(args, opts)` (a thin wrapper around `spawn("docker", …)`) lets spawn-level tests assert that the clone path is never taken in `inplace` mode. **Destructive-edit safeguard.** Because a crashed/killed `inplace` run leaves the real workspace half-mutated with no rollback, the CLI must **warn + interactively confirm** before launching the container. The new helper module `src/runtime/docker-inplace.ts` exposes `detectGitTreeState(workspaceRoot)` (returns `"clean" | "dirty" | "no-repo"`, never throws — `git` missing on PATH, the directory not being a git repo, and permission errors all collapse to `"no-repo"`), `formatInplaceWarning(workspaceRoot, state)` (three friendly, developer-oriented warning variants — *clean git tree* → reversible via `git restore .` / `git reset --hard`; *dirty git tree* → edits mix in with uncommitted work and cannot be cleanly undone, suggest committing or stashing first; *no git repo* → no safety net, suggest `git init` and a baseline commit — each variant names the actual workspace directory and ends with the "Everything outside this directory stays sandboxed" reassurance), a minimal readline-based yes/no prompt (`defaultPromptYesNo`, defaults to "no" on empty input / EOF / any non-`y` answer), and the orchestrator `confirmInplaceRun(workspaceRoot, env, isTTY)`. `runWorkflow` in `src/cli/commands/run.ts` calls `confirmInplaceRun` between `prepareImage` and the banner when `selectSandboxMode === "inplace"`; on a "no" answer the run aborts cleanly with a non-zero exit and `jaiph in-place mode: aborted by user.` on stderr — no container is launched. The prompt is **skippable** via `JAIPH_INPLACE_YES=1` / `"true"` (CI / automation path); when set, `_inplacePrompt.ask` is never called. **Non-TTY behavior.** When stdin is not a TTY (`isTTY=false`, already threaded through `run.ts`), the run requires `JAIPH_INPLACE_YES`; if it is absent, `confirmInplaceRun` throws `E_DOCKER_INPLACE_NO_CONFIRM jaiph in-place mode requires interactive confirmation, but stdin is not a TTY. Set JAIPH_INPLACE_YES=1 to auto-confirm.` and the run exits before the container is launched — inplace mode never silently proceeds unconfirmed. **Env-leak prevention.** `JAIPH_INPLACE` and `JAIPH_INPLACE_YES` are `JAIPH_`-prefixed and would otherwise pass `isEnvAllowed` (the only built-in exclusion prefix is `JAIPH_DOCKER_`). A new explicit name set `ENV_ALLOW_EXCLUDE_NAMES = Set(["JAIPH_INPLACE", "JAIPH_INPLACE_YES"])` is checked in `isEnvAllowed` so neither variable is forwarded into the container — this prevents a nested `jaiph run` inside the workflow from re-triggering inplace mode and keeps host control flags out of script environments. **Run banner surfacing.** `formatJaiphRunningBannerLines` in `src/cli/run/display.ts` now distinguishes all three modes: overlay → `Docker sandbox, fusefs`, copy → `Docker sandbox, tmp workspace`, **inplace → `Docker sandbox, in-place (live host edits)`**, and `no sandbox` when Docker is disabled. **macOS performance note (informational, no code change):** the `:rw` bind-mount goes through Docker Desktop's virtiofs file-sharing layer, so write throughput is slower than the APFS `cp -cR` clone copy mode uses; acceptable for the dev-loop use case. **Known sharp edges (called out in code comments, not implemented in this change):** concurrent runs on the same workspace in `inplace` mode are not locked — two parallel runs will write into the same directory simultaneously. Tests live in `src/runtime/docker.test.ts` (regression coverage that `selectSandboxMode` is unchanged without the env var, `inplace` precedence over `JAIPH_DOCKER_NO_OVERLAY` and `/dev/fuse`, `buildDockerArgs` produces `:rw` workspace mount with no `:ro` mount / no `--device /dev/fuse` / no `overlay-run.sh` / none of the overlay-only `--cap-add` flags while still emitting `--cap-drop ALL`, `--security-opt no-new-privileges`, `${CONTAINER_RUN_DIR}:rw`, and Linux `--user ${uid}:${gid}`; spawn-level proof via `_dockerSpawn.run` spy that `cloneWorkspaceForSandbox`/`allocateSandboxWorkspaceDir` are never invoked; a filesystem-level test that a write inside `inplace` mode is visible at the host path while overlay/copy leave the host path unchanged; the env-leak assertion that `-e JAIPH_INPLACE` / `-e JAIPH_INPLACE_YES` never appear in `buildDockerArgs` output and `isEnvAllowed` returns `false` for both names) and a new file `src/runtime/docker-inplace.test.ts` (covers all three warning variants — clean / dirty / no-repo — assert each names the directory and states the correct recovery posture; TTY + "no" answer aborts with no container launched; TTY + "yes" answer proceeds; `JAIPH_INPLACE_YES=1` proceeds without calling the prompt; non-TTY without the flag throws `E_DOCKER_INPLACE_NO_CONFIRM`; banner test in `src/cli/run/display.test.ts` asserts the `in-place (live host edits)` paren-string). Docs in `docs/sandboxing.md` updated with a dedicated **Inplace mode (trusted workspace, untrusted machine)** section (when to use it, what the warning does on clean / dirty / no-git states, automation/CI auto-confirm via `JAIPH_INPLACE_YES`, non-TTY abort with `E_DOCKER_INPLACE_NO_CONFIRM`, env-leak protection, banner distinction, macOS virtiofs caveat, and the concurrent-runs / no-rollback sharp edges); the threat-model **Filesystem access** and **Process isolation** bullets now name all three modes; **What Docker does NOT protect against** explicitly calls out the inplace opt-out; the sandbox-primitive selection in **Runtime behavior** describes the three-rule precedence (`JAIPH_INPLACE` → `inplace`; `JAIPH_DOCKER_NO_OVERLAY` or no `/dev/fuse` → `copy`; otherwise `overlay`); the **Workspace immutability contract** names `inplace` as the explicit opt-out; the **Failure modes** table gains `E_DOCKER_INPLACE_NO_CONFIRM`; **Environment variable forwarding** documents the new explicit-name exclusions; and a third **Container layout** block shows the inplace mount layout. `docs/cli.md` gains `JAIPH_INPLACE` and `JAIPH_INPLACE_YES` entries under the **Docker sandbox** env-var section (with the env-leak and non-TTY rules), and the banner-format reference now lists all four parenthetical strings. `docs/architecture.md`'s Docker-runtime-helper **Workspace immutability** bullet now names `inplace` as the explicit opt-out.
+- **Change — Default Docker container timeout raised to 4 hours:** `DEFAULTS.timeoutSeconds` in `src/runtime/docker.ts` goes from `3600` (one hour) to `14400` (four hours), so long agent-backed sandboxed runs — including a full prompt-retry backoff (~2h41m) — no longer hit the host-side kill timer by default. Still overridable via `runtime.docker_timeout_seconds` (in-file) or `JAIPH_DOCKER_TIMEOUT` (env); `0` disables it. Docs in `docs/configuration.md` and `docs/sandboxing.md` updated to "four hours".
+- **Tooling — `.jaiph/prepare_release.jh` workflow single-sources the CLI version through `package.json` and drives a clean release-prep with displayed-version check + registry build:** The CLI version was declared twice — once as `package.json` `"version"` and once as a **hardcoded string** in `src/cli/index.ts` (`process.stdout.write("jaiph 0.9.4\n")`) — with nothing keeping them in sync, so a release that bumped `package.json` but missed the source literal would silently ship the old display string. Standalone bun-compiled builds (`bun build --compile`) cannot read `package.json` from disk at runtime, so the version literal must be resolved at **build time** in both build forms. The build step `tools/embed-assets.js` (run by `npm run build` and by `npm install` via a new `prepare` lifecycle script in `package.json` so `src/version.ts` exists on a fresh checkout before `tsc` runs) now codegens **`src/version.ts`** — an auto-generated module exporting `export const VERSION = "<package.json version>";` — alongside the existing `src/runtime/embedded-assets.ts` regeneration; `src/cli/index.ts` imports `VERSION` from `"../version"` and prints `` `jaiph ${VERSION}\n` `` for `--version` / `-v`, so the literal is statically baked into both the `tsc` and `bun build --compile` outputs without a runtime `package.json` read. `src/version.ts` is added to `.gitignore` with a top-of-file comment naming the generator and explaining why it is single-sourced through `package.json`. A new release-prep workflow `.jaiph/prepare_release.jh` (callable as `jaiph run .jaiph/prepare_release.jh -- 0.9.5` or with no arg to auto-bump the next patch) runs the full pre-tag pipeline as a single command: (1) **resolve version** — empty arg → next patch computed from `package.json` (e.g. `0.9.4` → `0.9.5`), non-empty arg must match `^[0-9]+\.[0-9]+\.[0-9]+$` (digits only); anything else fails with the offending value in the error; (2) **preflight** — fails if the git tree is dirty (the workflow's own edits must be the only diff a reviewer sees) or if tag `v<version>` already exists; (3) **apply the version change** — `npm version <version> --no-git-tag-version` (updates `package.json` + `package-lock.json`) and replaces the hardcoded `v<old>` default in `docs/install`'s `REPO_REF` fallback with `v<new>` (the installer's curl-pipe entry point must work standalone and cannot single-source); (4) **displayed-version check** — `npm run build` then `node dist/src/cli.js --version`; output must equal `jaiph <version>` exactly, on mismatch the script prints both expected and actual strings before failing — an **end-to-end check on the built artifact** that catches a stale build or a broken version import/codegen, not just literal drift; (5) **build the registry** — `npm run registry:build` so the release ships a current `docs/registry`; (6) **summary** — logs the changed files and the remaining manual steps (review the diff, commit, `git tag v<version>`, push branch + tag — tag push triggers the docker-publish CI job and `release.yml`'s standalone-binary upload, then `jaiph use <version>` for a smoke check). The workflow itself **creates no commits and no tags** — every edit is left staged for the operator to review. A companion test file `.jaiph/prepare_release.test.jh` (discovered by `jaiph test`) covers the load-bearing branches via mocked scripts: next-patch default from a pinned `package.json` (`1.2.3` → `1.2.4`); explicit `X.Y.Z` arg accepted verbatim; non-`X.Y.Z` arg fails with the offending value (`not-a-version`, `1.2.3.4`); the `check_displayed_version` workflow prints both expected and actual strings on mismatch (`expected: jaiph 9.9.9` / `actual:   jaiph 0.0.0`); preflight rejects a dirty git tree; and preflight rejects an existing `v<version>` tag. The standalone-binary E2E (`e2e/tests/210_standalone_binary.sh`) now reads the expected `--version` literal from `package.json` (`node -p "require('${ROOT_DIR}/package.json').version"`) instead of pinning `jaiph 0.9.4`, so the test does not need an update on every bump and a divergence between the displayed string and `package.json` fails the E2E. `src/cli/commands/use.ts` — whose error message previously named `0.9.4` as the example version — is updated to use the generic `X.Y.Z` placeholder. The `--version` unit test in `src/cli/index.test.ts` asserts the displayed output equals `jaiph ` + `package.json`'s `version` field, so a future bump of `package.json` without rebuilding `src/version.ts` fails CI immediately. Docs updated in `docs/contributing.md` (the **Version tags, releases, and npm** section gains a top paragraph naming `.jaiph/prepare_release.jh` as the supported release-prep path with the explicit / next-patch invocation forms, the preflight / version-bump / displayed-version-check / registry-build contract, the **no commits or tags** guarantee, and the single-sourcing note that `src/version.ts` is codegen'd by `npm run embed-assets`; the **Typical commands** table rows for `npm run build` and `npm run embed-assets` are updated to call out the `src/version.ts` generation and the new `prepare` lifecycle hook so fresh checkouts type-check before the first `npm run build`) and `docs/architecture.md` (the **Distribution: Node vs Bun standalone** section's npm-build bullet now names `src/version.ts` as an embed-assets output and the standalone-build bullet documents that the displayed `jaiph --version` literal is statically baked into both build forms via the generated module — no runtime `package.json` read).
+- **Tooling — `npm run registry:build` regenerates `docs/registry` from the upstream `jaiphlang/registry` repo, with a shipped-file unit test that fails on schema drift:** `jaiph install <name>` loads its registry index from `https://jaiph.org/registry` (or `JAIPH_REGISTRY`), but `jaiph.org` is GitHub Pages serving the static files under `docs/` in this repo while the **source of truth** for the index lives in the separate `jaiphlang/registry` repo — maintained manually, with package PRs landing there, not here. There was no path to refresh `docs/registry` from upstream: a maintainer who merged a registry PR had to hand-copy the JSON into this repo, with no validation that it still matched the shape the CLI's `loadRegistryIndex` accepts. A new build script `scripts/build-registry.mjs` does the copy in one step: it fetches the index from `https://raw.githubusercontent.com/jaiphlang/registry/main/registry.json` (overridable via the first positional argv or `JAIPH_REGISTRY_SOURCE` so tests can point at a local fixture), writes the bytes to a sibling tmp file alongside `docs/registry`, runs them through the built `loadRegistryIndex` (imported from `dist/src/cli/commands/registry.js`, so the script requires `npm run build` first), and only on success renames the tmp file onto `docs/registry`. On any failure — unreachable source, invalid JSON, schema mismatch — the script exits non-zero and the previous `docs/registry` is left untouched, and the tmp file is removed so no stale `*.tmp-build-*` siblings accumulate. An npm script **`registry:build`** chains `npm run build` and the script call. This is a **regular command callable anytime**: after merging a registry PR in `jaiphlang/registry`, run `npm run registry:build`, commit the regenerated `docs/registry`, push — Pages redeploys jaiph.org automatically. `docs/registry` is seeded with an initial index (entry `jaiphlang` → `https://github.com/jaiphlang/jaiphlang.git`, description "Jaiph standard library: artifacts, git, queue") so `jaiph.org/registry` serves a valid document before the first build run. Two new tests pin the contract: `src/cli/commands/registry.test.ts` loads the **shipped** `docs/registry` through `loadRegistryIndex` (schema drift between the file and the CLI fails the test) and asserts the file parses as JSON with no Jekyll front matter (a leading `---\n…\n---` block would make Pages treat the file as a Jekyll page and break `loadRegistryIndex` on the live URL); `scripts/build-registry.test.mjs` exercises `buildRegistry` against local fixtures — valid JSON produces a byte-identical output, invalid JSON / schema mismatch / missing source all reject without touching the existing `docs/registry`, and no stale `*.tmp-build-*` siblings are left on failure. `package.json` adds the `registry:build` npm script and threads `scripts/build-registry.test.mjs` into the `test` script so the build-script contract runs alongside the rest of the suite. `docs/libraries.md` gains a **Publishing a library** section covering repo layout (top-level `.jh` modules, `export` visibility, companion scripts like `queue.py`), git-tag-based versioning, installing by name (`jaiph install jaiphlang@v0.1.0`), the publishing flow (PR to `jaiphlang/registry` → maintainer runs `npm run registry:build` → entry live on jaiph.org at the latest with the next release), plus a separate **Lockfile semantics** section calling out commit pinning and an **Overriding the registry source** section documenting the `JAIPH_REGISTRY` override. `docs/cli.md` already shows the bare-name install form and lists `JAIPH_REGISTRY` in the env-var table; no further changes were needed there.
+- **Feature — `jaiph install` pins commit SHAs in `.jaiph/libs.lock`, strips `.git` from installed libs, and rejects clones with no `.jh` modules:** `gitCloneRunner` in `src/cli/commands/install.ts` shallow-cloned each lib into `.jaiph/libs/<name>/` and left `.git` in place, so every installed library showed up as a nested git repo inside the consumer workspace (noisy `git status`, IDE confusion about which tree was being viewed, accidental commits inside the lib's repo). The lockfile recorded only `{ name, url, version }`, where `version` is a git ref — and refs can be moved — so "restore from lockfile" was not actually reproducible: a re-tag in the upstream repo silently swapped which commit the consumer pulled. And nothing validated that the cloned tree was a jaiph library at all, so a typoed URL pointing at an unrelated repo happily landed in `.jaiph/libs/` and got a lock entry written for it. The CLI now runs a **post-clone hygiene** step (`postCloneHygiene` in `src/cli/commands/install.ts`) after every successful clone: (1) walk the cloned tree (skipping `.git`) via `hasJhFileRecursive` and assert at least one `*.jh` file exists — if not, the lib dir is removed and the command fails with `lib "<name>" contains no .jh modules — not a jaiph library?` and **no lock entry is written for it**; (2) run `git -C <libDir> rev-parse HEAD` (via `revParseHead`) and capture the resulting 40-char SHA; (3) delete `<libDir>/.git` recursively, so the installed lib is plain files on disk and the lockfile is the source of truth for what was cloned. The captured SHA is added to the `LockEntry` shape as a new optional `commit?: string` field and written via `specToLockEntry(spec, commit)`. The clone runner is wrapped in `runInstall` (`wrappedRunner`) so the SHA is collected from every successful clone before lock entries are upserted; warm-skipped libs preserve any prior `commit` via the existing-entry lookup before `upsertLockEntry`. **Restore verification.** Each lock entry now also seeds `InstallSpec.expectedCommit` on the way back into the clone path. When restore re-clones a lib whose lock entry carries `commit`, the same `postCloneHygiene` step compares the freshly cloned HEAD SHA against `spec.expectedCommit` after stripping `.git`; on mismatch the lib dir is removed and the command fails non-zero with a message naming both SHAs and the explicit remedy — ``lib "<name>" commit mismatch: locked <SHA>, cloned <SHA> — the ref may have moved; re-run `jaiph install <name>@<version>` explicitly to accept the new commit``. Lock entries without `commit` (older lockfiles) restore without the comparison, so existing checkouts keep working unchanged. New unit tests in `src/cli/commands/install.test.ts` use **local fixture repos** (a small `makeFixtureRepo(parent, name, opts)` helper that `git init`s a temp dir, commits a seed `main.jh` file or a non-`.jh` file depending on `opts.withJh`, and optionally `git tag`s the seed commit) and exercise the contract against real `git clone` invocations — no network. The four new tests pin the acceptance criteria: (1) installing from a local fixture removes `.git` from the installed lib dir and records a 40-char `commit` in the lockfile that equals the fixture's `git rev-parse HEAD`; (2) tag-moved scenario — install at `@v1`, retag `v1` to a new commit upstream, remove the local lib dir, restore — fails non-zero with **both SHAs** present in the error message and removes the lib dir; (3) cloning a repo with no `.jh` files exits non-zero with `lib "<name>" contains no .jh modules — not a jaiph library?`, leaves no `.jaiph/libs/<name>/` dir, and writes no lock entry; (4) a hand-written lockfile **without** a `commit` field still restores (no `.git` after restore, exit 0) — backward-compatibility contract. Existing tests that supply a mock `CloneRunner` were updated to drop a placeholder `lib.jh` file alongside the mocked clone so the `.jh` validation passes (the tests already mock the clone step itself; the hygiene step still inspects the on-disk tree the mock produces). Docs updated in `docs/cli.md` (the `## jaiph install` section gains a **Post-clone hygiene** explainer covering the `.jh` check, commit capture, and `.git` strip; the **Without arguments** subsection gains a **Commit verification on restore** paragraph with the mismatch error template; the **Lockfile** subsection now shows `commit` in the JSON example and documents the backward-compat behavior for older lockfiles) and `docs/libraries.md` (the "Installing third-party libraries" section now calls out that installed libs are plain files with no nested `.git`, names the `.jh`-module validation, and points at the new CLI hygiene contract for the commit-mismatch error).
+- **Feature — `jaiph install <name>[@version]` resolves through a lib registry:** `runInstall` in `src/cli/commands/install.ts` only accepted git clone URLs, and the lib directory name was derived from the URL's last path segment via `deriveLibName(url)`. Because the import resolver (`src/transpile/resolve.ts`) maps `import "<prefix>/<rest>"` to `.jaiph/libs/<prefix>/<rest>.jh`, the directory name **is** the import prefix — which silently required every git repo to be named exactly like the import prefix the lib exposes, and there was no way to write `jaiph install jaiphlang` without first knowing the underlying URL. The CLI now accepts a **registry name** form alongside the existing URL form. A new module `src/cli/commands/registry.ts` defines the **registry index format** — a single JSON document `{ "libs": { "<name>": { "url": "<git clone url>", "description": "<one line>" } } }` where names must match `/^[A-Za-z0-9_-]+$/` (single path segment, since the name becomes the `.jaiph/libs/<name>` directory and the import prefix) — and exports `loadRegistryIndex(source)`, `isRegistryNameArg(arg)`, `parseNameArg(arg)`, `registrySource(env)`, and a `DEFAULT_REGISTRY_URL` constant of `https://jaiph.org/registry`. `runInstall` classifies each positional arg by shape: an arg matching `/^[A-Za-z0-9_-]+(@[A-Za-z0-9._+/-]+)?$/` with no `/` and no `:` is a **registry name** (with optional `@version`); everything else takes the existing URL path unchanged. When at least one bare-name arg is present the index is loaded at most once per invocation from `JAIPH_REGISTRY` (or `DEFAULT_REGISTRY_URL` when the env var is unset or empty); when the source has no `://` prefix or uses `file://` it is read from disk (enables unit tests and air-gapped use), otherwise it is fetched with global `fetch`. The **registry key** (not `deriveLibName(url)`) names the `.jaiph/libs/<name>` directory and the lock entry, so a registry entry like `{ "mylib": { "url": "https://example.com/some-other-repo-name.git", … } }` installs into `.jaiph/libs/mylib/` and is imported as `import "mylib/…"`. The lock entry stores the resolved clone URL exactly as today, so **restore-from-lock (`jaiph install` with no args) never contacts the registry** — even when the registry source is unreachable or has changed. Errors all exit non-zero with a message naming the registry source: unknown name → `lib "<name>" not found in registry <source>`; read/fetch/parse failures → `failed to read registry <source>: <cause>` / `failed to fetch registry <source>: HTTP <status>` / `failed to parse registry <source>: <cause>` (including shape errors like `entry "<name>" missing string "url"` and `invalid name "<name>"`). `INSTALL_USAGE` and the global `printUsage` overview in `src/cli/shared/usage.ts` document the name form, the `JAIPH_REGISTRY` env var, and the new examples. New unit tests in `src/cli/commands/install.test.ts` pin the acceptance criteria: (1) installing `mylib` via a path-based `JAIPH_REGISTRY` whose entry points at a repo whose URL last segment is *different* from `mylib` installs into `.jaiph/libs/mylib/` and writes lock entry name `mylib` with the resolved URL; (2) `mylib@v1.2` forwards `v1.2` as the version to the clone runner and records it in the lock entry; (3) unknown registry name fails with `lib "missing" not found in registry <path>`; (4) unreadable registry source fails with `failed to read registry <path>: …`; (5) invalid registry JSON fails with `failed to parse registry <path>: …`; (6) restore-from-lock succeeds with `JAIPH_REGISTRY` pointing at a nonexistent path (proves restore never reads the registry). URL-based installs behave exactly as before — existing install tests pass unmodified. Docs updated in `docs/cli.md` (the `## jaiph install` section gains an **Argument dispatch** explainer, a **Registry** subsection with the index format and source-resolution rules, an **Errors** list, and clarifies that the lock entry stores the **resolved** clone URL; the env-var entry for `JAIPH_REGISTRY` is added under **Install and `jaiph use`**), `docs/libraries.md` (the **Installing third-party libraries** section now shows both name and URL forms, names the shape-based dispatch, calls out that restore never reads the registry, and replaces the "directory name is `deriveLibName(url)`" line with the registry-key-vs-URL-last-segment split), and `docs/jaiph-skill.md` (the `jaiph install` row in the commands table covers both arg forms and points at `JAIPH_REGISTRY`).
+- **Installer — Rewrite `docs/install` to download a per-platform release binary; update `docs/install-from-local.sh` to build the standalone binary from source:** The previous installer required `git`, `node`, and `npm` on every user host: `docs/install` cloned the repo at a tag, ran `npm install` + `npm run build`, and installed a small `node …` shim at `~/.local/bin/jaiph` plus a `~/.local/bin/.jaiph/` (`LIB_DIR`) tree containing the compiled CLI tree (`src/`), `package.json`, and `jaiph-skill.md`. Now that `npm run build:standalone` produces a fully self-contained bun-compiled binary (overlay-run.sh + jaiph-skill.md embedded; self-spawn via the `__workflow-runner` argv marker) and `.github/workflows/release.yml` publishes per-platform binaries + `SHA256SUMS` under the fixed asset contract (`jaiph-{darwin|linux}-{arm64|x64}`, see [Contributing — Release asset naming contract](docs/contributing.md#release-asset-naming-contract)), the installer no longer needs to build anything on the user's machine. `docs/install` now detects the host via `uname -s` / `uname -m` (mapping `Darwin`→`darwin`, `Linux`→`linux`, `arm64|aarch64`→`arm64`, `x86_64|x64`→`x64`); unsupported platforms exit non-zero with `Unsupported platform: <s> <m>` and a pointer at the from-source instructions in `docs/contributing.md#installing-from-source`. The ref is resolved as first arg → `JAIPH_REPO_REF` env → default `v0.9.4` (current stable tag); `nightly` resolves to the rolling prerelease published by `release.yml`. The installer downloads `https://github.com/jaiphlang/jaiph/releases/download/<ref>/jaiph-<os>-<arch>` and `SHA256SUMS`, computes the digest with whichever of `sha256sum` / `shasum -a 256` is present (one is required; the installer fails fast otherwise), and **verifies the checksum against the matching `SHA256SUMS` entry** — a mismatch fails hard with `Checksum mismatch for <bin>` printing both expected and actual hashes and **leaves no file on disk**. On success the binary is installed to `${JAIPH_BIN_DIR:-$HOME/.local/bin}/jaiph` with mode 755; the PATH-hint UX at the end is preserved. End-user prerequisites shrink from `git` + Node.js 20 + `npm` to `curl` + (`sha256sum` or `shasum`). A new env var **`JAIPH_RELEASE_BASE_URL`** overrides the GitHub Release base URL — useful for mirrors, offline bundles, or `file://` paths in tests; documented under [CLI — Install and `jaiph use`](docs/cli.md#install-and-jaiph-use). **Local-source parity.** The `JAIPH_FROM_LOCAL` branch (taken when either `JAIPH_REPO_URL` env or the first positional arg is a directory containing `package.json` — the path `docs/install-from-local.sh` and the E2E install tests use, since neither can depend on GitHub Releases) now **builds the standalone binary from source** instead of installing a node shim: `cp -R <repo> <tmp>` (excludes `.git` and `node_modules`), then `npm install`, then `npm run build:standalone` (requires `bun`), then `cp <tmp>/dist/jaiph ${TARGET}` + `chmod 755`. The result is byte-identical in *shape* to the release-asset path — a single executable at `${JAIPH_BIN_DIR:-$HOME/.local/bin}/jaiph`, no shim script, no `LIB_DIR`, no runtime tree; only the origin of the binary differs (compiled locally vs. downloaded). `docs/install-from-local.sh` is updated accordingly (top-of-file comment names the new build + install contract and the bun prerequisite). **Removed:** the `LIB_DIR` constant, the `JAIPH_LIB_DIR` env var, the release-path `npm install` / `npm run build` invocations, the `node -p "require(...).version"` version probe, the `git clone --depth 1` for the network case, and the node-shim heredoc that used to write `#!/usr/bin/env bash` + `exec node "${LIB_DIR}/src/cli.js" "$@"` to `${TARGET}`. `grep -n "npm run build" docs/install` now matches only the local-source branch (acceptance criterion). New e2e `e2e/tests/07_installer_binary.sh` (registered in `e2e/test_all.sh`) pins three acceptance properties without touching the network: (1) **checksum mismatch** — points the installer at a `file://` release directory via `JAIPH_RELEASE_BASE_URL` with a hand-crafted `SHA256SUMS` whose hash does not match the binary; asserts non-zero exit, the output contains `Checksum mismatch`, and the install target is left empty; (2) **unsupported platform** — prepends a fake `uname` shim to `PATH` reporting `AIX powerpc`; asserts non-zero exit, the error names the detected platform, contains a `contributing` token, and leaves no binary; (3) **local-install parity** (skipped when `bun` is absent on the host) — runs `docs/install-from-local.sh`, asserts the install dir contains exactly one entry named `jaiph`, the installed file is not a `#!` shebang shim, then strips `node`/`npm`/`bun` from `PATH` and asserts `jaiph --version` returns `jaiph <version>` and `jaiph run sample.jh` prints `hello-from-local` against a deterministic mock-free workflow. `e2e/tests/05_jaiph_use_pinned_version.sh` is updated so `jaiph use` exercises the binary path (no longer the build-on-host path). Docs updated in `docs/install` (the new installer logic with a top-comment pointer at the **Release asset naming contract** as the source of asset names), `docs/install-from-local.sh` (top-of-file comment documents the build-from-source contract and the single-binary outcome), `docs/setup.md` (prerequisites list now names `curl` + sha tooling and notes Node/npm are **not** required to run `jaiph`; the "what `curl -fsSL … | bash` does" paragraph, the `jaiph use` paragraph, the `jaiph init` SKILL.md resolution paragraph, and the "Building from source" paragraph all describe the download-and-verify flow), `docs/contributing.md` (the **Installing from source** section names the new `npm install` + `npm run build:standalone` pipeline and lists `bun` as a from-source prerequisite; the **Developing in the repository** prerequisites note that end-user installs need only `curl` + sha tooling), and `docs/cli.md` (the `jaiph use` reference now describes "downloads the matching per-platform binary, verifies the checksum, replaces `~/.local/bin/jaiph`"; the **Install and `jaiph use`** env-var list documents `JAIPH_RELEASE_BASE_URL` and tightens the wording of `JAIPH_REPO_URL` and `JAIPH_REPO_REF` to mark which path each applies to — local-source vs. binary-download).
+- **CI — Add per-platform standalone-binary release workflow (`.github/workflows/release.yml`):** `npm run build:standalone` (bun-compiled binary) had no publish path — nothing in `.github/workflows/` cross-compiled or uploaded the artifact. The forthcoming binary-installer rewrite downloads release assets by fixed name, so without a release pipeline `jaiph use nightly` would break the moment that installer landed. A new `release.yml` workflow now runs on `v*` tag pushes, pushes to the **`nightly`** branch, and `workflow_dispatch`. Using `oven-sh/setup-bun`, it cross-compiles four `bun build --compile --target=…` outputs — `bun-darwin-arm64`, `bun-darwin-x64`, `bun-linux-x64`, `bun-linux-arm64` — into assets named **`jaiph-darwin-arm64`**, **`jaiph-darwin-x64`**, **`jaiph-linux-x64`**, **`jaiph-linux-arm64`** (the **fixed naming contract** the installer depends on verbatim — written down in [`docs/contributing.md`](docs/contributing.md) under **Release asset naming contract**). The `release` job downloads all four binary artifacts, runs `sha256sum` over them into a fifth asset **`SHA256SUMS`**, then executes a sanity gate on the runner: `chmod +x jaiph-linux-x64 && ./jaiph-linux-x64 --version`; for stable channel (`v*` tag) the output must equal `jaiph <tag-without-v>`, for the nightly channel it only asserts the output matches `^jaiph [0-9]+\.[0-9]+\.[0-9]+`. On stable, `gh release create` (or `gh release upload --clobber` if the tag already has a release) attaches all five assets to the tag; on `nightly`, the same five assets are pushed to a **rolling prerelease** tagged `nightly` via `gh release upload nightly --clobber` (created with `--prerelease --target ${GITHUB_SHA}` on first run). A separate `ci-gate` job in the same workflow polls `gh run list --workflow CI --commit "${GITHUB_SHA}"` every 30 s for up to 60 minutes and only declares success when that run's `conclusion=success`; both `build` and `release` declare `needs: ci-gate`, so a broken main-CI run on the same SHA cannot publish binaries. Full first-time release verification still happens on the first real `v*` tag — until then, `workflow_dispatch` on a test tag is the documented dry-run path.
+- **Feature — `bun --compile` standalone binary is fully self-contained (self-spawn + embedded assets):** `npm run build:standalone` (`bun build --compile ./src/cli.ts --outfile ./dist/jaiph`) used to produce a single-file executable that could not actually run a workflow. Two reasons. (1) `buildRunModuleLaunch` in `src/runtime/kernel/workflow-launch.ts` launched the workflow leader as `spawn(process.execPath, [join(__dirname, "node-workflow-runner.js"), …])`. Under node `execPath` is the node binary and the runner script ran; in a bun-compiled executable `process.execPath` is the **jaiph binary itself**, which always runs its embedded `cli.ts` entrypoint — the runner path was interpreted as CLI argv and the workflow leader never started. (2) The CLI read assets relative to its install at runtime: `runtime/overlay-run.sh` (`src/runtime/docker.ts`, Docker overlay sandboxing) and `docs/jaiph-skill.md` (resolved by `jaiph init`, see `src/cli/commands/init.ts` and the install-relative lookup in `docs/cli.md`). A bare binary has no such siblings on disk. Both problems are now fixed. (1) An internal argv marker — exported as **`WORKFLOW_RUNNER_ARG`** = `"__workflow-runner"` from `src/runtime/kernel/node-workflow-runner.ts` — is recognized at the top of `main` in `src/cli/index.ts` **before** help / version / file-shorthand parsing; when the second argument equals `__workflow-runner`, the CLI dispatches the remaining positional args to a new exported `runWorkflowRunner(positional: string[])` (extracted from what used to be the runner script's `main`). `buildRunModuleLaunch` now spawns `process.execPath` with `[WORKFLOW_RUNNER_ARG, metaFile, sourceAbs, builtScript, "default", ...runArgs]` argv for the bun-compiled standalone (detected by `typeof globalThis.Bun !== "undefined"`) and `[join(__dirname, "..", "..", "cli.js"), WORKFLOW_RUNNER_ARG, …]` for the tsc/node build, so both forms route through the same dispatcher. The reserved marker is excluded from `printUsage` (so `jaiph --help` and the overview never mention it) and the file-shorthand resolver (so it cannot be mistaken for a `.jh` path). (2) A new build step `npm run embed-assets` (driven by `tools/embed-assets.js`, registered in `package.json` and run automatically by `npm run build`) generates **`src/runtime/embedded-assets.ts`** — a TS module exporting `OVERLAY_RUN_SH_BASE64` and `JAIPH_SKILL_MD_BASE64` plus a `decodeEmbeddedAsset` helper — from the on-disk `runtime/overlay-run.sh` and `docs/jaiph-skill.md`. `loadOverlayScript` in `src/runtime/docker.ts` now resolves the overlay script in order: (a) sibling `overlay-run.sh` next to the compiled module (npm `dist/src/runtime/`), (b) repo-root `runtime/overlay-run.sh` three hops up (dev `src/runtime/`), (c) the embedded base64 baked into the executable — so the bun-compiled binary works with no sibling files and the npm/disk install behavior is byte-for-byte unchanged. A new `loadInstalledSkillContent` in `src/cli/shared/paths.ts` does the same for the skill: disk lookup (`JAIPH_SKILL_PATH`, install-relative `jaiph-skill.md` / `docs/jaiph-skill.md`, then `docs/jaiph-skill.md` under cwd) wins, with the embedded copy as fallback. `runInit` in `src/cli/commands/init.ts` now always writes `.jaiph/SKILL.md` (the old "skill file not found; set `JAIPH_SKILL_PATH` and run again" warn-and-skip branch is removed — there is no longer a case where the body cannot be resolved). The earlier lazy-load `E_CLI_SETUP` error contract for `overlay-run.sh` remains for the **node** build when the script is genuinely missing from a broken install; the **standalone** binary never hits that path because the embedded fallback always succeeds. New unit test `src/cli/index.test.ts` asserts the `__workflow-runner` argv dispatch routes to `runWorkflowRunner` and that the reserved marker does not appear in `--help` output; `src/runtime/embedded-assets.test.ts` asserts the generated base64 constants decode bit-for-bit to the on-disk `runtime/overlay-run.sh` and `docs/jaiph-skill.md` (any drift between source and embedded copy fails the test). New CI-runnable e2e `e2e/tests/210_standalone_binary.sh` (registered in `e2e/test_all.sh`; skipped when `bun` is not installed on the host) builds `dist/jaiph`, stages **only** the binary in an isolated temp dir (deliberately no sibling `runtime/` or `docs/`), strips `node` / `npm` / `bun` from `PATH`, and runs `jaiph --version`, `jaiph init` (asserting `.jaiph/SKILL.md` matches `docs/jaiph-skill.md` byte-for-byte), `jaiph compile sample.jh`, and `jaiph run sample.jh` against a deterministic mock-free workflow to completion. Docs updated in `docs/architecture.md` (the **Distribution: Node vs Bun standalone** section now describes the `embed-assets` build step, the `__workflow-runner` self-spawn marker, and the fully-self-contained standalone artifact — `dist/runtime` next to `dist/jaiph` is kept for npm-layout parity but no longer required), `docs/cli.md` (the `jaiph init` SKILL.md resolution paragraph adds the embedded-copy fallback and notes that the command always writes the file — no more skip-and-warn — and the `JAIPH_SKILL_PATH` env-var entry under **Environment variables** lists the embedded fallback alongside the existing search), `docs/setup.md` (the npm-install caveat that warned users to set `JAIPH_SKILL_PATH` when `jaiph init` "did not write" SKILL.md is replaced with the new always-writes contract and the same disk-then-embedded resolution order), `docs/contributing.md` (the **Typical commands** table gains a row for `npm run embed-assets` and the `npm run build:standalone` row describes the self-contained binary and the `__workflow-runner` self-spawn), and `README.md` (the `jaiph init` paragraph under **Install** matches the new contract).
+- **Docs — Document Docker env-var allowlist workarounds and pin the doc list to the source constants:** Users hitting Docker sandboxing were surprised when custom host environment variables (e.g. `MY_TOOL_TOKEN`, `AWS_*`, `SSH_*`) vanished inside the container with no diagnostic. `isEnvAllowed` in `src/runtime/docker.ts` forwards only variables matching the `ENV_ALLOW_PREFIXES` allowlist (`JAIPH_`, `ANTHROPIC_`, `CURSOR_`, `CLAUDE_`) and excludes `JAIPH_DOCKER_*` to prevent nested Docker config from leaking in. `docs/sandboxing.md` already named those prefixes in **Environment variable forwarding**, but it gave no actionable workaround when the host variable a script needs falls outside the allowlist. The section now ends with a **Workarounds for variables outside the allowlist** subsection that lists two supported approaches — (1) `export` the value inside the `script` body so it never has to cross the host/container boundary (with a small `script run_with_token = \`\`\`…\`\`\`` example), (2) bake the value into a derived image via `ENV` / `RUN` in a `FROM ghcr.io/jaiphlang/jaiph-runtime:nightly` Dockerfile (cross-links to [Extending the official image](#extending-the-official-image)) — and notes that variables that *must* come from the host on each run should be renamed with a `JAIPH_` prefix so the allowlist forwards them, with the existing "treat anything forwarded as fully disclosed" caveat preserved via a link to the threat-model section. Cross-links added: `docs/configuration.md` (the "Inspecting effective config at runtime" section gains a paragraph pointing readers to the allowlist explanation when a custom host variable goes missing inside the container) and `docs/cli.md` (the **Docker sandbox** env-var section gains a one-line summary of the allow-prefix list and a link to the sandboxing section). To prevent the doc list from drifting away from the source, `ENV_ALLOW_PREFIXES` and `ENV_ALLOW_EXCLUDE_PREFIX` in `src/runtime/docker.ts` are now exported (previously module-private) and a new docs-parity test in `src/runtime/docker.test.ts` reads `docs/sandboxing.md`, locates the `### Environment variable forwarding` section, and asserts that every prefix from the source constants appears as a `` `<PREFIX>*` `` bullet and that the excluded prefix is mentioned; a second test asserts that both `docs/configuration.md` and `docs/cli.md` contain the `sandboxing.md#environment-variable-forwarding` cross-link. A reviewer diff between the doc list and the source constants is no longer necessary — the test fails first.
+- **Refactor — Remove dead `formatDiagnosticLine` indirection in the stderr parser:** `handleLine` in `src/cli/run/stderr-handler.ts` took a `formatDiagnosticLine: (line: string) => string` parameter that only the `emitter.emit("stderr_line", { line: formatDiagnosticLine(line) })` call applied, and the single caller (`createStderrParser` in the same file) always passed the identity function `(ln) => ln`. The parameter was never wired to any non-identity transform — pure dead indirection. Removed: `handleLine`'s fourth parameter is gone (`line` is now passed straight into `emitter.emit("stderr_line", { line })`), and the `const formatDiagnosticLine = (ln: string) => ln;` line in `createStderrParser` is deleted along with the corresponding argument at the `handleLine` call site. No other call sites existed (`handleLine` is module-private), and `createStderrParser`'s exported signature `(emitter: RunEmitter) => (line: string) => void` is unchanged, so every consumer (the `run` command, the parser unit tests in `src/cli/run/stderr-handler.test.ts`) compiles and behaves identically. Behavior is byte-for-byte preserved: `stderr_line` events still carry the raw line, so `capturedStderr` accumulation in `registerStateSubscriber`, TTY passthrough in `registerTTYSubscriber`, and the failed-run summary path that reads the last non-empty stderr line are all untouched. Verified by `grep -rn "formatDiagnosticLine" src/` returning nothing and `npm test` passing; existing integration tests cover the stderr passthrough behavior. No docs change is needed — `formatDiagnosticLine` was never named in user-facing documentation (the references to `src/cli/run/stderr-handler.ts` in `docs/architecture.md` and `docs/hooks.md` describe `RunState.workflowRunId`, `resolveEventId`, and the `isRoot` skip in `registerTTYSubscriber`, none of which involve this parameter).
+- **Fix — Docker overlay script loads lazily so non-Docker commands survive a broken install:** `src/runtime/docker.ts` previously read `runtime/overlay-run.sh` with `readFileSync` at **module load time** (top-level `const OVERLAY_SCRIPT = readFileSync(...)`). The docker module is imported transitively by non-Docker CLI paths — `jaiph compile` and `jaiph format` pull in symbols like `CONTAINER_RUN_DIR` from this module via `src/cli/shared/errors.ts` — so a missing `overlay-run.sh` in the installed package crashed **every** CLI invocation with a raw `ENOENT` stack trace, even commands that never touch Docker. The read is now lazy and lives in a new exported `loadOverlayScript()` helper called only from `writeOverlayScript()` (which itself runs only on the overlay-mode branch of `spawnDockerProcess`, i.e. when Docker is enabled **and** `/dev/fuse` is present). The first successful read is cached in a module-level `overlayScriptCache`; on a missing file the helper wraps the read in `try` / `catch` and rethrows `` `E_CLI_SETUP: runtime/overlay-run.sh not found at <path> — the Jaiph installation is incomplete; reinstall with "jaiph use <version>"` ``, where `<path>` is the resolved candidate path (either the dist-layout `dist/src/runtime/overlay-run.sh` or the source-layout `runtime/overlay-run.sh`). Importing the docker module no longer touches the filesystem at all; `jaiph compile`, `jaiph format`, and other non-Docker subcommands now run unaffected when `overlay-run.sh` is missing from the install. Copy mode (`/dev/fuse` absent, or `JAIPH_DOCKER_NO_OVERLAY=1`) also no longer needs the script and is unaffected. The new error code surfaces only on the overlay path. New unit test in `src/runtime/docker.test.ts` (`loadOverlayScript: import does not read overlay-run.sh; writeOverlayScript throws E_CLI_SETUP when missing`) spawns a child Node process via `spawnSync(process.execPath, ["-e", script], …)` that temporarily renames `overlay-run.sh` at **both** candidate paths (the dist-layout `dist/src/runtime/overlay-run.sh` next to the compiled module **and** the source-layout `runtime/overlay-run.sh` reached via `resolve(__dirname, "..", "..", "..", "runtime", "overlay-run.sh")`), then `require()`s the docker module to prove the import itself succeeds (asserts the re-exported `CONTAINER_RUN_DIR === "/jaiph/run"` constant — the same symbol non-Docker CLI paths pull in transitively), then calls `mod.writeOverlayScript()` and asserts the thrown message starts with `E_CLI_SETUP` and contains one of the two candidate paths; the test restores the renamed files in a `finally` block on both pass and fail paths. Docker e2e overlay flow is unchanged when the file exists (the existing `writeOverlayScript: creates executable script with fuse-overlayfs setup` / `mounts as root and then drops to host uid via setpriv` / `contains no in-container rsync/cp fallback` tests still pass, and the module-load-time `const TEST_OVERLAY = writeOverlayScript()` shared by other tests still succeeds because the file is present in the build output). Docs updated in `docs/sandboxing.md` — the **Image contract** subsection's `overlay-run.sh` paragraph now describes the lazy-load behavior and the `E_CLI_SETUP` error contract; the **Failure modes** table gains an `E_CLI_SETUP` row and the table intro notes the new code alongside the existing non-`E_DOCKER_*` entries (`E_TIMEOUT`, `E_VALIDATE_MOUNT`).
+- **Fix — Three runtime error messages now name the missing context users need to act on:** Three failure paths returned messages that told the user *something* went wrong without saying *what* or *where*. (1) `resolveHandleResult` in `src/runtime/kernel/node-workflow-runtime.ts` returned `error: "invalid handle"` with no handle id — the user had no way to grep `run_summary.jsonl` for the offending step. (2) The Docker timeout path in `src/cli/commands/run.ts` appended the literal string `E_TIMEOUT container execution exceeded timeout` with no duration and no remedy — the user did not know which timeout had been exceeded or how to raise it. (3) `summarizeError` in `src/cli/shared/errors.ts` fell back to `"Workflow execution failed."` when stderr was empty, hiding the run directory and exit code that were already known to the caller. Each message now carries the missing context: (1) `invalid async handle "<handleId>" — the handle was never created or was already consumed` via a new exported `formatInvalidAsyncHandleError(handleId)` in `node-workflow-runtime.ts`; (2) `` `E_TIMEOUT container execution exceeded <N>s — increase runtime.docker_timeout_seconds or JAIPH_DOCKER_TIMEOUT` `` via a new exported `formatDockerTimeoutMessage(timeoutSeconds)` in `src/cli/shared/errors.ts`, where `<N>` is the **actual** `activeDockerConfig.timeoutSeconds` value (the same value the timer was armed with), so the message is self-consistent with the config; (3) `summarizeError(stderr, fallback?, opts?)` and `resolveFailureDetails(stderr, summaryPath?, opts?)` gain an optional `{ code?, runDir? }` argument — when stderr is empty and at least one of the two is known, the summary is now `Workflow execution failed (exit <code>) with no error output; inspect run_summary.jsonl and step artifacts under <run_dir>`, with each clause omitted gracefully when its field is missing (code-only → `(exit N) with no error output`, run-dir-only → `Workflow execution failed with no error output; inspect … under …`); the old `"Workflow execution failed."` text remains only as the terminal fallback when neither field is known. `reportResult` in `src/cli/commands/run.ts` threads `{ code: exitStatus, runDir }` through to `resolveFailureDetails`. New unit tests in `src/cli/shared/errors.test.ts` pin the four summary shapes (empty-stderr with both fields, code only, runDir only, and non-empty stderr ignoring both opts) and the formatted timeout message (configured seconds + both env-var / config-key remedies present); new kernel tests in `src/runtime/kernel/node-workflow-runtime.handle.test.ts` (added by this change) pin the handle-id-in-message shape for both `resolveHandleResult` and `formatInvalidAsyncHandleError`. The single existing e2e expectation that asserted the old empty-stderr text (`e2e/tests/61_ensure_recover.sh`) is updated to assert the new exit-code + run-dir form. Docs updated in `docs/sandboxing.md` (the **Timeout** paragraph under **Docker runs** now quotes the new message shape with the `<N>s` placeholder and the `runtime.docker_timeout_seconds` / `JAIPH_DOCKER_TIMEOUT` remedy clause) and `docs/cli.md` (the **Failed run summary (stderr)** section gains a new paragraph describing the summary-line source: last non-empty trimmed stderr line, the new empty-stderr fallback that names exit code and run directory, and the terminal `"Workflow execution failed."` fallback when neither is known).
+- **Fix — `jaiph format` preserves quotes on top-level `const` string values:** `jaiph format` rewrote `const x = ".jaiph/tmp/x.md"` to the unquoted bare-token form `const x = .jaiph/tmp/x.md` whenever the value contained no whitespace; values with a space kept their quotes. The rewrite was value-preserving and idempotent, but it silently changed the author's chosen delimiter and produced inconsistent output within one file — quoted and unquoted `const` declarations side by side, depending on whether each value happened to contain a space. A formatter should canonicalize to one stable form, not toggle forms based on value content. The canonical rule is now: a top-level `const` value written as a **double-quoted string** in the source is emitted **double-quoted**, always — regardless of whether the value contains spaces. Values written as **bare tokens** (e.g. `const MAX = 3`) stay bare. Values written as `"""…"""` are emitted verbatim as before. `EnvDeclDef` (`src/types.ts`) gains an optional `wasQuoted?: boolean` field; `parseEnvDecl` (`src/parse/env.ts`) sets it to `true` on both the single-line `"…"` and triple-quoted `"""…"""` paths and leaves it `undefined` on the bare path; `emitEnvDecl` (`src/format/emit.ts`) checks `wasQuoted` first — when set, the value is re-emitted with `JSON.stringify` (or as `"""…"""` if the value contains a `"` or `\` that would need escaping), and the value-content shape check (`^[A-Za-z0-9_./@+#%^&=*:~?-]+$`) that drove the bare emission only runs on the bare branch. New formatter tests in `src/format/emit.test.ts` pin the invariants: a quoted no-space value (`const q = ".jaiph/tmp/x.md"`) survives `jaiph format` with quotes intact, a quoted value with spaces also survives, a bare numeric token (`const MAX = 3`) stays bare, formatting twice produces identical output for all three cases (idempotency), and a parse-then-format-then-parse round-trip preserves `envDecls[i].value` bit-for-bit so `${q}` interpolation yields the same value before and after formatting. No existing golden AST fixture under `test-fixtures/golden-ast/fixtures/` carries a top-level `const`, so the `wasQuoted` field addition does not require regenerating goldens. Docs updated in `docs/cli.md` (new "Top-level `const` quoting" paragraph under `## jaiph format` describing the canonical rule), `docs/grammar.md` (the **Top-Level `const`** section and the trailing formatter-impact bullet list both note that the source delimiter is preserved), `docs/language.md` (the Constants section gains the same preservation note), and `docs/architecture.md` (the formatter description adds the original quotedness of top-level `const` values to the list of round-tripped discriminators alongside `"""…"""` and `bareSource`).
+- **Fix — Mixing `mock prompt { … }` with queued `mock prompt "…"` is now a compile-time error:** When a single `test "…" { … }` block contained both a pattern-dispatch `mock prompt { … }` and one or more queue-style `mock prompt "…"` / `mock prompt <const>` lines, the queue entries were **silently ignored** at runtime — the block won, the queued lines did nothing, and the test could pass for the wrong reason. `docs/testing.md` documented this as a limitation ("Do not combine … ignored") rather than the compiler enforcing it. `validateTestBlocks` in `src/transpile/validate.ts` now scans each `TestBlockDef`'s steps for the first `test_mock_prompt_block` and the first `test_mock_prompt`; when both are present in the same block, it emits a single `E_VALIDATE` diagnostic — `cannot mix "mock prompt { … }" with queued "mock prompt …" in one test block; choose one style` — at the location of whichever offending mock appears **second** in source order (so the message points at the line the author should remove or convert). The check is per test block: separate `test "…" { … }` blocks in the same file may still use different styles. Surfaced through the standard validation path, so `jaiph compile path/to/file.test.jh` (test files are validated when passed explicitly) and `jaiph test path/to/file.test.jh` (loads + validates before running) both fail with the new diagnostic instead of silently dropping the queued mocks. New txtar fixtures pin the invariants: `test-fixtures/compiler-txtar/validate-errors.txt` adds two cases — block-first then queue, and queue-first then block — each asserting the `E_VALIDATE` code and the exact message via `validate-diagnostics-snapshot.json`; `test-fixtures/compiler-txtar/valid.txt` adds a "block and queued mock prompt in separate test blocks" case proving the per-block scope. Docs updated in `docs/testing.md` (the "Mock prompt (content-based dispatch)" section and the **Limitations (v1)** bullet now describe the compile-time error and the per-block scope rule instead of the "silently ignored" caveat) and `docs/jaiph-skill.md` (the test-authoring bullet that said "Don't mix queued … and a `mock prompt { … }` block in one test" now states the error and quotes the message).
+- **Feature — `jaiph test` discovery with zero matches exits 0:** Previously, `jaiph test` (no args) and `jaiph test <dir>` exited **1** with `jaiph test: no *.test.jh files found` when discovery matched nothing (`src/cli/commands/test.ts:25,43`), forcing every CI pipeline and agent loop to guard the call (`run jaiph test only if test files exist`) and obliging the bootstrap skill doc (`docs/jaiph-skill.md`) to carry a matching caveat. In **discovery mode** (no path, or a directory path), zero matches now write `jaiph test: no *.test.jh files found (nothing to do)` to stderr and exit **0**, so `jaiph test` is safe to call unconditionally. Passing an explicit **file** path that does not exist or is not a `*.test.jh` file remains an error (exit **1**) — a named target must exist. Implementation: the two zero-match branches in `runTest` in `src/cli/commands/test.ts` now share a single `(nothing to do)` notice and `return 0` instead of returning `1`; the explicit-file branch is unchanged so `fs.statSync` still throws ENOENT on a missing named target. Tests: `e2e/tests/125_test_discovery_errors.sh` is restructured into three sections — empty directory exits 0 with the notice (assert_equals), `jaiph test` with no args in a workspace without test files exits 0 with the notice, and `jaiph test missing.test.jh` (nonexistent file) still exits non-zero with an error message referencing the missing path. `e2e/tests/50_cli_and_parse_guards.sh` is updated to expect exit 0 and the new notice for the empty-directory case it covered. Docs: `docs/cli.md` and `docs/testing.md` describe the new discovery-vs-named-target split; `docs/jaiph-skill.md` drops the "only if `*.test.jh` files exist" caveat from both "Your authoring loop" (step 4) and the final commands block.
+- **Feature — Per-subcommand `-h` / `--help`:** Only `jaiph compile -h` / `jaiph compile --help` printed command-specific usage; for every other subcommand the help flag fell through to positional / file-path resolution and produced confusing errors. `jaiph run --help` tried to resolve `--help` as a `.jh` file (`requires a .jh file` / ENOENT path); `jaiph test --help`, `jaiph format --help`, `jaiph init --help`, `jaiph install --help`, and `jaiph use --help` were similarly parsed as ignored tokens or stray paths. The CLI dispatcher (`src/cli/index.ts`) recognized `-h` / `--help` only as the **first** token after `jaiph`, and `docs/cli.md` documented this limitation instead of fixing it. Every subcommand now recognizes `-h` / `--help` anywhere in its argument list **before positional processing**, prints its own usage block (flags + one example) to stdout, and exits **0**. `jaiph --help` and bare `jaiph` still print the overview; the change is additive at the subcommand layer. Each subcommand owns its own usage string: `RUN_USAGE` in `src/cli/commands/run.ts`, `TEST_USAGE` in `src/cli/commands/test.ts`, `FORMAT_USAGE` in `src/cli/commands/format.ts`, `INIT_USAGE` in `src/cli/commands/init.ts`, `INSTALL_USAGE` in `src/cli/commands/install.ts`, `USE_USAGE` in `src/cli/commands/use.ts`, and a renamed `COMPILE_USAGE` in `src/cli/commands/compile.ts` (the existing `printUsage` helper there was split into the constant plus a `printUsageError` wrapper that keeps writing the same text to stderr for argument-shape errors). A shared `hasHelpFlag(args: string[]): boolean` helper in `src/cli/shared/usage.ts` scans the argument list for `-h` / `--help`, stopping at `--` so `jaiph run flow.jh -- --help` still forwards `--help` to `workflow default` instead of intercepting it. Each subcommand entry function (`runWorkflow`, `runTest`, `runFormat`, `runInit`, `runInstall`, `runUse`) calls `hasHelpFlag(rest)` as its first step and short-circuits to `process.stdout.write(<CMD>_USAGE)` + `return 0` when true; the `compile` entry keeps its existing inline `--help` / `-h` check (now writing to stdout for the help case and falling through to `printUsageError` only on actual argument-shape errors). The overview usage text in `printUsage()` (`src/cli/shared/usage.ts`) drops the "only as the first argument" caveat from the global-options section and notes that each subcommand also accepts `-h` / `--help`. New integration test `integration/subcommand-help.test.ts` iterates all seven subcommands × both flag forms (14 cases) asserting exit **0** and that stdout contains both the substring `Usage` and the subcommand name; a dedicated case for `jaiph run --help` further asserts that stderr does **not** contain `ENOENT`, `no such file`, or `requires a .jh file` — pinning the regression that the old code would attempt to resolve `--help` as a path. Docs updated in `docs/cli.md`: the **Global options** paragraph is rewritten to describe the per-subcommand help flag (overview vs. command-specific usage, listing all seven subcommands) instead of documenting the old first-token-only limitation.
+- **Feature — `if` and `match` accept `IDENT.IDENT` dot-notation subjects on typed prompt captures:** Typed prompt captures already exposed their fields via dot notation in interpolation contexts (`${r.verdict}` resolved against the `returns "{ verdict: string, … }"` schema), but `if` and `match` subjects had to be plain identifiers — `if r.verdict == "reject" { … }` failed with `E_PARSE invalid if syntax; expected: if <identifier> <op> <operand> …`, forcing every typed-prompt-then-branch workflow to insert a boilerplate `const verdict = "${r.verdict}"` rebind before the condition. The single most common typed-prompt pattern (ask for a verdict, branch on it) paid that tax on every use. The parser now accepts `IDENT.IDENT` as the subject of `if` and `match` (both statement and expression forms): the `if`-line regex in `tryParseIf` (`src/parse/workflow-brace.ts`) is widened from `[A-Za-z_][A-Za-z0-9_]*` to `[A-Za-z_][A-Za-z0-9_]*(?:\.[A-Za-z_][A-Za-z0-9_]*)?`, and `validateMatchSubject` (`src/parse/match.ts`) now accepts a new `DOT_IDENT_RE` (`^IDENT\.IDENT$`) alongside the existing bare-ident regex. The `$` / `${}`-as-subject parse error is unchanged. Compile-time validation reuses the same dot-notation schema check already implemented for `${var.field}` interpolation: a new `validateDotSubject(subject, loc, ctx)` in `src/transpile/validate-step.ts` parses the subject, and a new shared `validateDotFieldRef(varName, fieldName, loc, ctx)` (extracted from the body of `validateDotFieldRefs`) emits the same two `E_VALIDATE` diagnostics — `"<var>" is not a typed prompt capture; dot notation requires a prompt with "returns" schema` when the base is not a `const … = prompt … returns "{ … }"` capture, and `field "<field>" is not defined in the returns schema for "<var>"; available fields: …` when the base is typed but the field is not in its schema. So a plain unknown `a.b` subject (non-typed-capture base, or unknown field) is now a structured `E_VALIDATE` at the same line/col as `${a.b}` would be — not the old `E_PARSE` "invalid if syntax". Runtime semantics mirror `${var.field}` interpolation exactly: a new private `resolveSubjectValue(scope, subject)` in `src/runtime/kernel/node-workflow-runtime.ts` splits the subject on the first `.`, resolves any handle on the base variable (same `isHandle` / `resolveHandleVar` path the bare-identifier subject already used), then for the dot form parses the base value as JSON and reads the field — falling back to the empty string when the JSON parse fails or the field is missing (the same fallback `${var.field}` uses). The `if` step in `runStep` and `runMatchExpr` both now route their subject resolution through `resolveSubjectValue` (the two previously-duplicated handle-resolution + scope-lookup blocks collapse into one helper); bare-identifier behavior is preserved byte-for-byte. AST: no new variant — `subject` on the `if` step and `MatchExprDef` stays a `string` that now optionally contains a single `.`. New txtar fixtures (`test-fixtures/compiler-txtar/valid.txt`) cover `if r.verdict == "ok" { … }` and `const x = match r.verdict { "ok" => "approved"; _ => "rejected" }` on a typed prompt capture; four new `validate-errors.txt` cases pin the `E_VALIDATE` shape for `if` and `match` dot subjects on both a non-typed-capture variable (`const r = "plain"`) and a typed capture with an unknown field, with the diagnostic snapshot (`validate-diagnostics-snapshot.json`) recording the exact `{ line, col, code, message }`. A new golden AST fixture pair (`test-fixtures/golden-ast/fixtures/if-dot-subject.jh` + `expected/if-dot-subject.json`) pins the tree shape for an `if` with a dot-notation subject (the AST node carries `"subject": "r.verdict"`). New runtime e2e `e2e/tests/138_if_match_dot_subject.sh` exercises both `if` and `match` against the same typed-capture workflow under three mocked prompt JSON payloads (`{"verdict":"ok"}`, `"reject"`, `"maybe"`), asserting the `if`/`else` arms and the matching `match` arms all select correctly by field value; `e2e/test_all.sh` registers the test. Docs updated in `docs/grammar.md` (the `if` and `match` subject bullets now describe the dot-notation form and the typed-capture / `returns` schema requirement, with a forward reference to the `E_VALIDATE` parity with `${var.field}`; the EBNF gains a `subject_ref = IDENT | IDENT "." IDENT` production used by `if_stmt`, `match_stmt`, and `match_expr`), `docs/language.md` (the `match` and `if` subject sentences in §`match` / §`if — Conditional Guard` now describe both forms inline with the same `E_VALIDATE` parity caveat), `docs/jaiph-skill.md` (the control-flow bullet that previously said "a dot-notation field (`if r.verdict == …`) is a parse error; rebind first" is replaced with the new rule — dot subjects work on typed prompt captures without rebinding — and the prompt-driven example with the typed verdict capture drops its boilerplate `const verdict = "${r.verdict}"` rebind; a workflow-triage example also drops the same rebind), and `docs/index.html` (the `match` primitive entry in the orchestration overview notes the new dot-subject form and that `if` accepts the same shape).
+- **Feature — `catch` / `recover` on inline-script `run` steps:** Named-ref `run` calls already supported failure handling (`run deploy() catch (err) { … }` / `run deploy() recover(err) { … }`), but inline scripts did not: `` run `test -z "$(git status --porcelain)"`() catch (err) { … } `` failed with `E_PARSE unexpected content after anonymous inline script: 'catch (err) {'`, forcing authors to declare a named `script` solely to attach failure handling to a one-liner. The grammar EBNF in `docs/grammar.md` previously showed `run_catch_stmt = "run" call_ref "catch" …` (call_ref only); the inline-script parse path rejected any trailing tokens after the closing `)`. The inline-script `run` parse path (single-backtick and fenced forms) now accepts the same optional `catch (name) <body>` / `recover (name) <body>` suffix as named-ref `run`, with identical semantics — `catch` runs the body once on failure, `recover` retries the inline script up to `run.recover_limit` (default 10), and the two remain mutually exclusive on a single step. The restriction that `run async` does not combine with inline scripts is unchanged. Parser entry: `parseAnonymousInlineScript` in `src/parse/inline-script.ts` gains an `allowTrailing = false` parameter and exposes `closingLineIdx` / `trailing` on its result so callers can resume parsing after the closing `)`. `tryParseRun` in `src/parse/workflow-brace.ts` calls `parseAnonymousInlineScript` with `allowTrailing: true` and delegates to a new `parseInlineScriptTail` helper that recognizes a leading `recover` or `catch` keyword on the trailing text and hands the bindings/body off to the existing `parseAttachedBlock` (same helper named-ref `run` / `ensure` already use) — so every body shape (`{ … }`, inline `{ stmt[; stmt]* }`, single-statement) and every binding/body parse-error message is shared with the named-ref path. AST: no new variant — the inline-script `exec` step's existing `catch?` / `recover?` step-level attributes (added with the `Expr` collapse refactor) are now populated for inline-script bodies, matching named-ref `run`. Runtime: the inline-script branch of `runStep` in `src/runtime/kernel/node-workflow-runtime.ts` now mirrors the named-ref `runOnce` / `runRecoverBody` loop: on `step.recover`, retry the inline script up to `resolveRecoverLimit(scope.filePath)` times with the merged stdout+stderr bound to the recover binding between attempts; on `step.catch`, run once and on non-zero status invoke the catch body once with the merged output bound; a `return` from the catch/recover body propagates through the existing `mergeStepResult` path. The `run async` rejection path is untouched (the inline-script `run async` form still fails parse before reaching this code). New txtar fixtures (`test-fixtures/compiler-txtar/valid.txt`) cover inline-script `catch` and `recover` in both workflow and rule bodies, the fenced (triple-backtick) form with `catch`, an inline script with positional args plus `catch`, and the single-statement `catch` body shape. The same `recover` + `catch` mutual-exclusion guard is asserted by a new `parse-errors.txt` case where `run \`false\`() recover(e) { log "r" } catch (e) { log "c" }` fails with the existing "unexpected content after log string" parse error (the recover clause consumes through its body, and the trailing `catch` falls through to the next-statement parser). Runtime e2e `e2e/tests/137_inline_script_catch_recover.sh` covers (a) a failing inline script's `catch` body runs once with the merged output bound (`run \`echo "bad" 1>&2; exit 3\`() catch (err) { log "caught: ${err}" }` logs `caught: bad` and the workflow passes), (b) a failing inline script under `recover` retries until a counter-file-based repair makes it pass (`run \`test -f .done\`() recover(err) { run \`\`\`…\`\`\`() }` runs the repair body exactly **2** times before the check passes), and (c) the same `catch` shape works in a rule body via `ensure`. Docs updated in `docs/grammar.md` (new "**`catch` / `recover` on inline scripts**" paragraph and example under **Inline Scripts**; EBNF `run_catch_stmt` / `run_recover_stmt` now read `( call_ref | inline_script )`; an aside on `inline_script` clarifies that the optional catch/recover suffix is permitted only via `run_catch_stmt` / `run_recover_stmt`, not via `log` / `logerr` / `return` / `const` RHS), `docs/language.md` (new "**`catch` / `recover` on inline scripts**" paragraph and example under **Inline Scripts**, plus the explicit note that `const … = run \`…\`()`, `return run \`…\`()`, and `log run \`…\`()` / `logerr run \`…\`()` do *not* accept these suffixes), and `docs/jaiph-skill.md` (replaces the "they do **not** accept `catch`/`recover` suffixes" caveat with the new rule and points to wrapping in a standalone `run` step for the other inline-script positions).
+- **Feature — `if` now supports an `else` branch:** `if subject <op> <operand> { … }` previously had no `else` arm. The documented workarounds — `match` (which forces a wildcard arm and value-shaped bodies) or a `catch`-as-failure-branch — were the single biggest ergonomic gap agents hit when authoring workflows and rules. `if` now accepts an optional `else { … }` clause that runs when the condition is false. Surface syntax: `} else {` must sit on the **same line** as the closing `}` of the `if` body — `else` on its own line is `E_PARSE` (`"else" must appear on the same line as the closing "}" of an "if" block`); `else` without a preceding `if` is the same `E_PARSE`; and `else if` chaining is rejected with a dedicated `E_PARSE` (`"else if" chaining is not supported; nest an "if" inside the "else" block, or use "match" for multi-way branching`) — a bare `else` containing a nested `if` is fine. `if` / `else` remains a **statement** (no value production); `const x = if …` and `return if …` are still parse errors, and value-shaped branching is still expressed with `match`. The `else` body uses a brace block of the same step forms allowed in the surrounding workflow / rule body — rule scope still rejects `prompt`, channel sends, `run async`, and `run` to a workflow inside `else`, exactly as it does inside the `if` body. The parser entry is the `if` row of the `STATEMENT` dispatch table in `src/parse/workflow-brace.ts`: `tryParseIf` calls `parseBraceBlockBody` with a new `allowElseTerminator: true` opt that recognizes `} else {` as a block terminator and signals it via a new `closedWithElse` field on the return tuple, then `tryParseIf` parses the else body with a second `parseBraceBlockBody` call (without the opt, so the else body terminates only on `}`). A dedicated `tryParseElseError` row on `else` produces the same two error messages when a stray `else` appears as a top-level statement (outside an `if` body), so the diagnostic doesn't depend on which side of the `}` the parser hits. AST: `WorkflowStepDef`'s `if` variant gains an optional `elseBody?: WorkflowStepDef[]` (absent when there is no `else`, preserving the old shape byte-for-byte). Validator (`src/transpile/validate.ts`'s `walkStepTree`) descends into `elseBody` with the same scope as `body`, so binding rules and per-step rule/workflow gates apply uniformly to both arms. Runtime (`src/runtime/kernel/node-workflow-runtime.ts`): the `if` case picks `step.body` when the condition is met and `step.elseBody` otherwise, executes only the chosen branch's steps in order, and propagates any non-zero status or `return` value through the existing `mergeStepResult` path — the false-with-no-else path is still a no-op. Formatter (`src/format/emit.ts`'s `emitStep`): emits canonical `} else {` between the two arms when `elseBody` is set; `jaiph format` is idempotent on `if/else` (formatter test in `src/format/emit.test.ts`). New txtar fixtures cover (a) `if/else` in a workflow, in a rule, and a nested `if` inside an `else` block (`test-fixtures/compiler-txtar/valid.txt`); (b) the three parse-error shapes — `else` on its own line, bare `else` without a preceding `if`, and `else if (…)` chaining (`test-fixtures/compiler-txtar/parse-errors.txt`); and (c) rule-scope validation rejecting `const … = prompt …` inside an `else` block in a rule (`test-fixtures/compiler-txtar/validate-errors.txt`). A golden AST fixture pair (`test-fixtures/golden-ast/fixtures/if-else.jh` + `test-fixtures/golden-ast/expected/if-else.json`) pins the tree shape for an `if/else` statement. New runtime E2E `e2e/tests/136_if_else_branch.sh` runs the same `.jh` source twice: with `status="ok"` the then-branch logs `healthy` and `done`, with `status="bad"` the else-branch logs `unhealthy: bad` and `done` — proving only the chosen arm executes — plus the same shape inside a rule (then-branch fails the workflow on empty input; else-branch passes the rule and the workflow continues to `log "validated"`). Docs updated in `docs/grammar.md` (rewrote the `if` section to document `else`, added the `else_clause` production to the EBNF), `docs/language.md` (updated the **`if` — Conditional Guard** section: dropped the "No `else` branch" claim and added a `} else {` example), and `docs/jaiph-skill.md` (replaced the "`if` has **no `else`**" bullet with the new `} else {` rules and the no-`else if` chaining caveat); `docs/contributing.md` bumps the golden AST fixture count from 9 to 10 and names the new `if-else` fixture.
+- **Fix — Workflow-level `run.recover_limit` now applies:** A workflow body may open with a `config { … }` block that overrides `agent.*` and `run.*` keys, and the precedence chain (workflow-level > module-level > defaults) was already documented for every other run key. But `resolveRecoverLimit` in `src/runtime/kernel/node-workflow-runtime.ts` read only `moduleMeta?.run?.recoverLimit ?? 10`, so a workflow-level `run.recover_limit = 3` parsed and validated fine but was silently ignored at retry time — a `run … recover` step inside that workflow still used the module-level cap (or the default of 10). `docs/configuration.md` documented this as an explicit exception ("`run.recover_limit` is an exception: only **module-level** values affect `run … recover`"), making it a trap: config that validates but does nothing. `NodeWorkflowRuntime` now resolves `run.recover_limit` through the same precedence as other run keys: it consults the **active workflow's** metadata scope first (the top of `workflowCtxStack`, whose `workflowMeta` is captured when the workflow frame is pushed), then falls back to the module-level metadata of the file owning the current step's scope, then to the default of `10`. The workflow-frame side of the wiring is a new `workflowMeta?: WorkflowMetadata` field on `WorkflowContext` populated at frame-creation time from `resolved.workflow.metadata`, so cross-module `run` calls correctly see the callee workflow's own config (the cross-module call already pushes a new frame). New tests in `integration/sample-build/recover-handle.test.ts` pin the invariants: (a) a workflow with `config { run.recover_limit = 2 }` calling a failing script via `run failing() recover(e) { … }`, with module-level `run.recover_limit = 50` set as a deliberately wrong fallback, executes the script exactly **3 times** (1 initial + 2 retries) — verified by reading a counter file that the failing script increments and exits non-zero on every attempt; (b) a sibling workflow in the same module without its own `config` block still uses the module-level value (`config { run.recover_limit = 2 }` at module level → 3 attempts), proving workflow-level config is correctly scoped per-workflow and does not bleed into siblings (an unrelated sibling workflow's own `config { run.recover_limit = 50 }` is also present in the fixture to prove it does not leak into `default`). Both tests run `dist/src/cli.js` end-to-end under `JAIPH_DOCKER_ENABLED=false`. Docs updated to delete the exception text from `docs/configuration.md` (three places: the "Three ways to configure" intro, the "Run keys" table row, and the "Workflow-level config" rules) and to refresh `docs/grammar.md`, `docs/jaiph-skill.md`, `docs/language.md`, and `docs/spec-async-handles.md` so the retry-limit override description matches the now-standard precedence (workflow-level > module-level > default 10). `grep -rn "workflow-level run.recover_limit" docs/` returns nothing stale.
+- **Feature — Inbox dispatch iteration cap:** `drainWorkflowQueue` in `src/runtime/kernel/node-workflow-runtime.ts` walked the in-memory channel queue with `while (cursor < queue.length)` and had no upper bound — dispatched targets that sent on the same (or a routed) channel could append to the same queue indefinitely, so a circular send (A routes to B, B sends back to A's channel) looped until the host OOM'd. `docs/inbox.md` previously *documented* the footgun ("Avoid unbounded circular sends") rather than the runtime enforcing a bound. The runtime now caps the number of messages a single workflow frame may drain. The default cap is **1000**; override via the environment variable **`JAIPH_INBOX_MAX_DISPATCH`** (positive integer; non-numeric, empty, or non-positive values fall back to the default — resolved by a new `resolveInboxDispatchLimit(env)` helper at the top of `node-workflow-runtime.ts`). When the cap is exceeded `drainWorkflowQueue` aborts the owning workflow with status `1` and the error message `E_INBOX_DISPATCH_LIMIT: drained <N> messages without quiescing — likely a circular send (channel "<name>"); raise JAIPH_INBOX_MAX_DISPATCH if intentional`, where `<name>` is the next un-drained message's channel (typically the channel involved in the cycle). New kernel tests in `src/runtime/kernel/node-workflow-runtime.artifacts.test.ts` pin the invariants: (a) a two-workflow circular send (`on_ping` enqueues on `pong`; `on_pong` enqueues on `ping`) fails the workflow with `E_INBOX_DISPATCH_LIMIT` instead of hanging, and the error names one of the cycle channels and the limit; (b) `JAIPH_INBOX_MAX_DISPATCH=5` against a self-loop triggers the cap after **exactly 5** `INBOX_DISPATCH_START` records in `run_summary.jsonl`; (c) multi-message fan-out below the cap (one producer enqueues 3 messages on a channel with 3 routed targets, cap = 5) still succeeds with no `E_INBOX_DISPATCH_LIMIT` in the summary. Existing inbox tests pass unchanged. Docs updated in `docs/inbox.md` (new **Dispatch cap** paragraph under [Dispatch loop](docs/inbox.md#dispatch-loop); the circular-sends bullet under [Error semantics](docs/inbox.md#error-semantics) now describes `E_INBOX_DISPATCH_LIMIT` and the env override instead of the old "no built-in iteration cap" warning), `docs/cli.md` (new `JAIPH_INBOX_MAX_DISPATCH` entry under **Execution behavior**), and `docs/jaiph-skill.md` (the inbox paragraph now states the 1000-message default cap and the env override).
+- **Fix — Imported-channel sends now dispatch:** Channel routes are registered in `NodeWorkflowRuntime`'s `ctx.routes` keyed by the **bare** channel name from `channel <name> -> …` lines, but the send step looked the channel up with `this.workflowCtxStack[i].routes.has(step.channel)` where `step.channel` was the **verbatim token** left of `<-` (`src/runtime/kernel/node-workflow-runtime.ts`). So a validated cross-module send like `lib.topic <- "msg"` never matched the route registered as `topic` — the message was enqueued unrouted and silently dropped. `docs/inbox.md` previously documented this as a known footgun ("Module scope" paragraph) and steered users to bare-channel sends from the entry module. The send step in `node-workflow-runtime.ts` now normalizes `step.channel` once, at send time: after the validator (`validateChannelRef` in `src/transpile/validate.ts`) has already proven that an `alias.name` token refers to an existing imported channel, the runtime strips the `alias.` prefix and uses the bare name as `channelKey` for both the `routes.has(channelKey)` walk up the workflow stack and the `InboxMsg.channel` field. `lib.topic <-` and a bare `topic <-` therefore resolve to the same route key. The `INBOX_ENQUEUE` record in `run_summary.jsonl` carries the bare channel name; the audit copy is written to `inbox/NNN-<bare>.txt`. New E2E coverage in `e2e/tests/91_inbox_dispatch.sh` ("Imported channel send: lib.topic normalizes to topic for routing") writes the failing-today scenario as a test first — entry module declares `channel topic -> handler` and imports `lib`, `lib` declares `channel topic`, the entry workflow sends `lib.topic <- "x"` — then asserts `handler` is invoked with payload `"x"`, the inbox audit file is `inbox/001-topic.txt` containing `x`, and the `INBOX_ENQUEUE` line in `run_summary.jsonl` records `channel: "topic"` (bare, alias prefix stripped). Docs updated in `docs/inbox.md` — the "Module scope" paragraph under [Who registers routes and who drains](docs/inbox.md#who-registers-routes-and-who-drains) is rewritten to describe the normalized behavior (and references `validateChannelRef` as the guarantee that any `alias.` prefix the runtime strips already names a real imported channel), the imported-channel bullet under **Send operator** drops the "literal token" caveat, and the [Send operator](docs/inbox.md#send-operator--channel_ref-rhs) paragraph clarifies that `sendChannel` is the bare channel name used for both the route lookup and the audit filename.
+- **Fix — Docker-run path no longer leaks the `process.on("exit")` cleanup guard:** In `src/cli/commands/run.ts` (`runWorkflow`), when `spawnExec` returned a `dockerResult`, an `exitGuard` callback was registered with `process.on("exit", exitGuard)` so that, if the host CLI crashed before the run finished, `cleanupDocker(dockerResult)` would still tear down the copy-mode sandbox directory and clear the timeout timer. The matching `process.removeListener("exit", exitGuard)` only ran inside the `if (dockerResult)` block *after* `await waitForRunExit(...)` resolved normally — so if anything between registration and removal threw (stream wiring, the awaited child exit, buffer draining), the listener stayed on the `process` object for the rest of the host CLI's lifetime and `cleanupDocker` would fire again at process exit on an already-cleaned container, also fattening the `exit`-listener list across nested or repeated runs. Registration and removal are now paired in a `try { … } finally { … }` block via a new helper `withDockerExitGuard(dockerResult, body)` exported from `src/runtime/docker.ts`. The helper registers the guard, runs the spawn-to-exit body inside `try`, and in `finally` — on both normal return *and* on throw — removes the listener and calls `cleanupDocker(dockerResult)`. The guard itself stays registered for the abnormal-exit case (that is its purpose); only the normal and thrown-body paths now deterministically remove it. When `dockerResult` is `undefined` (non-Docker run), no listener is registered at all. `cleanupDocker` was already idempotent through the `cleaned` flag on `DockerSpawnResult` (so both the finally path and any surviving guard / signal handler can call it without double-`rmSync` warnings); its JSDoc now states that contract explicitly because the exit-guard + finally pairing relies on it. New tests in `src/runtime/docker.test.ts` pin the invariants: (a) `cleanupDocker` invoked twice on the same `DockerSpawnResult` is a no-op the second time — sentinel files recreated under the overlay tempdir and sandbox tempdir after the first call survive the second call, and the cleared timeout timer never fires; (b) after a successful `withDockerExitGuard` body, `process.listenerCount("exit")` returns to its pre-run value and no new listener identity remains in `process.listeners("exit")`; (c) the same holds when the body throws — `await assert.rejects(...)` confirms the listener is still removed and `cleanupDocker` ran exactly once; (d) when `dockerResult` is `undefined`, the helper registers no listener and just returns the body's value. Existing E2E / run tests pass unchanged. Docs updated in `docs/sandboxing.md` (extended the **Signal-safe cleanup** paragraph under **Runtime behavior** to describe the `withDockerExitGuard` try/finally pairing, the abnormal-exit role of the guard, the no-op behavior for non-Docker runs, and `cleanupDocker`'s idempotency contract).
+- **Fix — Cross-module `run` applies the callee module's config:** Previously, when a workflow in module A reached a callee in module B via `run alias.workflow()`, both module B's module-level `config { … }` and the callee workflow's `config { … }` block were silently ignored — the caller's effective env carried through as-is. This was inconsistent with the other three call types (root entry, same-module `run`, cross-module `ensure`) and bit `.jaiph/ensure_ci_passes.jh` in particular: that module declares `agent.backend = "cursor"`, but when `engineer.jh` (backend `claude`) called `run ci.ensure_ci_passes()`, the CI-fix prompts silently ran on `claude`. A module's `config` should describe how *that* module's workflows run, regardless of who called them. `NodeWorkflowRuntime` now layers the callee's module-level metadata then the callee's workflow-level metadata on top of the caller's effective env when entering a cross-module `run` — same mechanics as the root-entry path, respecting `${NAME}_LOCKED` env flags (environment still always wins). The caller's scope is restored exactly when the call returns, so sibling isolation still holds. New / updated tests: `src/runtime/kernel/node-workflow-runtime.artifacts.test.ts` adds three cases — (a) module A (`agent.default_model = "model-a"`) runs `run b.show()` where module B sets `agent.default_model = "model-b"` and `show` logs the model: callee logs `model-b`, the next step in A's workflow logs `model-a` again (scope restored); (b) callee workflow-level config wins over callee module-level config on the cross-module path; (c) with `JAIPH_AGENT_MODEL` exported in the environment (locked), the callee's config does NOT override it. `e2e/tests/86_metadata_scope_nested.sh` and `e2e/tests/87_workflow_config.sh` are updated where they previously asserted the old (ignore) behavior — the nested call now sees the callee's backend during execution and the caller's backend is restored after. The now-stale `NOTE` comment at the top of `.jaiph/ensure_ci_passes.jh` (which warned that cross-module callers' config would win) is removed. Docs updated in `docs/configuration.md` ("Scoping across nested calls" table — the cross-module row no longer says the callee's config is ignored; "Module-level config" paragraph rewritten to describe nested `run` as same- *or* cross-module and to flag same-module `ensure` as the one remaining caller's-scope-as-is case).
+- **Tooling — Documentation prompts follow a vendored Diátaxis skill:** The three prompts in `.jaiph/docs_parity.jh` (`update_from_task`, `docs_page`, `docs_overview`) used to inline the same ad-hoc "expert technical writer" `role` const and repeat its guiding principles in prose. Each prompt now opens with an instruction to read and follow `.jaiph/skills/documentation-writer/SKILL.md` **before doing anything else**; the skill is referenced by explicit path so both the Claude and Cursor backends can `Read` it directly without depending on agent-specific skill auto-discovery directories. The skill is vendored from `github/awesome-copilot` at `.jaiph/skills/documentation-writer/SKILL.md` (committed, not gitignored; the file header records the upstream URL, blob SHA, and copy date so it can be re-synced) — vendoring rather than `npx skills add` at runtime keeps docs runs offline-safe and reproducible. It supplies the **Diátaxis** framework's four document types (tutorial / how-to / reference / explanation), the clarify → outline → write workflow, and the four guiding principles (clarity, accuracy, user-centricity, consistency). The inline `role` const is slimmed to project-specific context the skill does not cover — TypeScript / Bash fluency for verifying docs against the implementation, `docs/architecture.md` as the single source of truth (do not trust existing docs blindly), and the constraint that navigation between docs pages is provided by the Jekyll template in `docs/_layouts/docs.html` (no manual "More Documentation" blocks). `jaiph compile .jaiph` and `jaiph format --check .jaiph/docs_parity.jh` stay green.
+- **Refactor — Replace the `parseBlockStatement` keyword cascade with a `STATEMENT` dispatch table:** `parseBlockStatement` in `src/parse/workflow-brace.ts` used to dispatch each statement form via a long ordered cascade of `startsWith` + regex tests (`"run async "` before `"run "`, `"prompt "` before bare assignment, etc.), so adding a new keyword meant finding the right slot in the cascade and any reordering risked changing which branch fired. The cascade is replaced by a `STATEMENT: Record<string, BlockHandler>` table keyed by the leading keyword: the dispatcher tokenizes the first identifier on the trimmed line, looks it up in the table, and invokes the matching handler — which returns a `{ step, nextIdx }` result, returns `null` to fall through, or calls `fail(...)` to abort. The current rows are `if`, `for`, `const`, `fail`, `wait`, `ensure`, `run`, `prompt`, `log`, `logerr`, `return`, and `match`; each handler (`tryParseIf`, `tryParseFor`, `tryParseConst`, `tryParseFail`, `tryParseWait`, `tryParseEnsure`, `tryParseRun`, `tryParsePrompt`, `tryParseLog`, `tryParseLogerr`, `tryParseReturn`, `tryParseStandaloneMatch`) carries the same regex / `startsWith` checks that used to live inline in the cascade — body shapes are unchanged. After dispatch, two non-keyword fallbacks fire in order: `trySend` (matches `channel <- rhs` via `matchSendOperator`) and `shellFallthrough` (everything else becomes a shell `exec` step). Assignment-shape error guards (`name = prompt …`, `name = run …` without `const`) live in a separate `applyAssignmentGuards(c)` helper that runs before the table lookup and either calls `fail(...)` or returns; the `forRule` rejection of `prompt …` inside rules also moves here. The shared per-line context (`filePath`, `lines`, `idx`, `innerRaw`, `inner`, `innerNo`, `trivia`, `forRule`, `opts`) is now a `BlockCtx` record threaded into every handler, so handlers take one argument instead of nine. Surface syntax is unchanged, every existing parse-error message / line / col is preserved, and the full golden corpus passes byte-for-byte. New tests pin the invariants: `src/parse/parse-error-snapshot.test.ts` walks every `=== name` block in `test-fixtures/compiler-txtar/parse-errors.txt`, parses each via `loadModuleGraph`, and asserts the captured `{ file, line, col, code, message }` matches the snapshot stored at `test-fixtures/compiler-txtar/parse-errors-snapshot.json` bit-for-bit — any drift in parser error wording or location fails the test (refreshable with `UPDATE_SNAPSHOTS=1` only after confirming the change is intentional). `src/parse/parse-synthetic-keyword.test.ts` pins the two-file extension contract: it patches `STATEMENT` at runtime with a synthetic `zzznoop` handler, asserts `parseBlockStatement` dispatches to it, asserts the same input falls through to the shell handler when the row is absent, and greps `src/parse/workflow-brace.ts` and `src/parse/core.ts` to confirm the `STATEMENT` table and the `JAIPH_KEYWORDS` reserved set each live in exactly one file. Adding a new top-level keyword is now a two-place change: one row in `STATEMENT` (`workflow-brace.ts`) and one entry in `JAIPH_KEYWORDS` (`core.ts`). `BlockCtx`, `BlockResult`, `BlockHandler`, and `STATEMENT` are exported so external test files can stage synthetic handlers without forking the parser. Out of scope: the wider tokenizer rewrite (the seven independent `inDoubleQuote` / `inTripleQuote` / `braceDepth` scanners across `src/parse/`, the line-walking `{ step, nextIdx }` contract, and the per-handler regex bodies are deferred — this refactor only changes the *dispatch shape* inside `parseBlockStatement`, not the scanning underneath). User-visible contracts — surface syntax, CLI behavior, `jaiph format` round-trip, run artifacts, banner, hooks, exit codes, `__JAIPH_EVENT__` streaming — are unchanged. Docs updated in `docs/architecture.md` (extended **Parser** bullet with a new **Keyword dispatch table** paragraph), `docs/contributing.md` (new **Statement-dispatch-table shape** row in the test-layer table), and `docs/grammar.md` (extended the EBNF aside to name the `STATEMENT` table). Implements `design/2026-05-15-parser-compiler-simplification.md` § Refactor 1 AC3 / AC4 / AC5 (the full tokenizer rewrite remains future work).
+- **Refactor — Unify `catch` / `recover` parsing into a single attached-block routine sharing the top-level statement parser:** `src/parse/steps.ts` used to contain three near-identical 100+ line functions — `parseEnsureStep`, `parseRunCatchStep`, and `parseRunRecoverStep` — that parsed the same syntactic shape (`<host-step> <keyword> (binding) { body } | single-stmt`) and differed only in which host step they decorated (`ensure` vs `run`) and the literal keyword (`catch` vs `recover`). Their body parser, `parseCatchStatement` (~280 lines), was a stripped-down copy of `parseBlockStatement` that recognized only a fixed subset of statement forms (e.g. a `for … in …` head fell through to a shell command) and diverged in subtle ways — the same fix had to land in two places, and divergence wasn't always caught by tests. All four functions and every helper that existed only to serve them are deleted from `src/parse/steps.ts`. The file drops from **757 → ~140 lines**. The new shape: one entry point `parseAttachedBlock(filePath, lines, idx, innerNo, innerRaw, keyword: "catch" | "recover", textAfterKeyword, trivia)` in `src/parse/steps.ts` parses the bindings (`(<binding>)` — exactly one identifier, with the same too-many / too-few / non-identifier errors as before) and dispatches on the body shape: a `{` at end of host line walks the existing brace-block scanner and delegates each body statement to `parseBraceBlockBody`, an inline `{ stmt[; stmt]* }` splits on `;` via the shared `splitStatementsOnSemicolons` and dispatches each fragment, and a bare single statement is parsed in-place. In all three cases the body statements run through the **same** `parseBlockStatement` (`src/parse/workflow-brace.ts`) that handles top-level statements — there is no mini parser for catch/recover bodies anymore. The host side moves to one helper `parseRunOrEnsure(filePath, lines, idx, …, host: "run" | "ensure", hostBody, isAsync, captureName, trivia)` in `src/parse/workflow-brace.ts`, called from `parseBlockStatement`'s three call sites (`ensure ref(...)`, `run ref(...)`, `run async ref(...)`). It scans `hostBody` once for a trailing ` recover` (run-only) then ` catch ` segment, parses the host call before the keyword, and delegates the attached clause to `parseAttachedBlock`. "Is this statement allowed inside a catch/recover body?" is now a validator concern — `WORKFLOW_SCOPE` and `RULE_SCOPE` in `validate-step.ts` already gate which step types are accepted in each scope, so rules still reject unstructured shell inside `catch` / `recover` bodies; workflows still accept it. New tests in `src/parse/parse-attached-block.test.ts` pin the invariants: AC1 — an LoC test caps `src/parse/steps.ts` at **≤200 lines** and a grep test fails if any function named `parse(Run)?(Catch|Recover|EnsureStep)` reappears; AC2 — a `for line in items { log "$line" }` statement (a `parseBlockStatement`-only form historically) is parsed as a `for_lines` step at the top level, inside `ensure check() catch (e) { … }`, and inside `run target() recover(e) { … }` — proving `parseBlockStatement` is the single entry point for any statement inside a catch / recover body and there is no separate mini parser; AC3 — a 10-case error-snapshot battery asserts every existing parse error message and column (bindings missing, too many bindings, empty inline / multiline block, unterminated multiline block, missing-paren for both `catch` and `recover` on both `run` and `ensure` hosts) is preserved bit-for-bit. The full parser / validator / emitter golden corpus (`src/transpile/compiler-golden.test.ts`, `src/transpile/compiler-edge.acceptance.test.ts`, `parse-steps.test.ts`, `parse-bare-call.test.ts`, `parse-run-async.test.ts`, and the txtar / golden-AST fixtures) passes byte-for-byte (AC4). User-visible contracts — surface syntax for `catch` / `recover`, CLI behavior, `jaiph format` round-trip, run artifacts, banner, hooks, exit codes, `__JAIPH_EVENT__` streaming — are unchanged. Out of scope: the wider tokenizer rewrite (Refactor 1, deferred); validator changes beyond the per-keyword scope rules that already exist. Docs updated in `docs/architecture.md` (extended **Parser** bullet with a new **Unified `run` / `ensure` host parsing** paragraph), `docs/contributing.md` (new **Attached-block parser shape** row in the test-layer table), and `docs/grammar.md` (replaced the stale `parseCatchStatement` reference in the EBNF aside with a note that `parseAttachedBlock` delegates to `parseBlockStatement`). Implements `design/2026-05-15-parser-compiler-simplification.md` § Refactor 2.
+- **Refactor — Decouple the validator from runtime semantics:** `src/transpile/validate.ts` (now `validate-step.ts`) used to `import { tripleQuotedRawForRuntime } from "../runtime/orchestration-text"` so it could compute "what the runtime will see" when checking the content of a triple-quoted `match`-arm body. That was a one-way dependency from compile-time on runtime semantics — a layering inversion that would have kept biting as the runtime grew more such helpers. The canonicalization helper moves into the parser layer as `canonicalizeTripleQuotedString` in `src/parse/triple-quote.ts` (same algorithm: validate the outer `"…"` shape, unescape DSL-quoted inner with `\"` → `"` and `\\` → `\`, then re-wrap via `tripleQuoteBodyToRaw(dedentCommonLeadingWhitespace(inner))`). Both the validator (`validate-step.ts`'s `validateMatchExpr`) and the runtime (`src/runtime/kernel/node-workflow-runtime.ts`'s match-arm dispatch in `runMatchExpr`) now import that helper from `src/parse/`; the wrapper file `src/runtime/orchestration-text.ts` is deleted. New tests pin the invariants: `src/transpile/no-runtime-imports.test.ts` (AC1) greps every non-test `*.ts` under `src/transpile/` and fails if any `from "…/runtime/…"` import reappears, so compile-time code can no longer reach into runtime semantics; `src/parse/canonicalize-triple-quoted.test.ts` (AC2) parses every `.jh` under `test-fixtures/` and `examples/`, collects every triple-quoted `match`-arm body across workflow / rule step trees, and asserts `canonicalizeTripleQuotedString(body) === legacyTripleQuotedRawForRuntime(body)` bit-for-bit (the legacy implementation is inlined in the test as the parity baseline). Existing `validate-string.test.ts` cases and the golden corpus pass unchanged (AC3); `npm run build` passes with zero TypeScript strict-mode errors (AC4). User-visible contracts — CLI behavior, `jaiph format` round-trip, run artifacts, banner, hooks, exit codes, `__JAIPH_EVENT__` streaming, and the full golden corpus — are unchanged byte-for-byte. Out of scope: rethinking what the canonical form *is* — this refactor only relocates the helper. Docs updated in `docs/architecture.md` (new **No compile-time → runtime imports** bullet under **Validator**; extended **Parser** bullet to document `canonicalizeTripleQuotedString` alongside `parseTripleQuoteBlock`) and `docs/contributing.md` (new **Compile-time / runtime layering** row in the test-layer table). Implements `design/2026-05-15-parser-compiler-simplification.md` § Appendix E.
+- **Refactor — Replace the 1,441-line validator switch with a per-step visitor table indexed by scope:** `src/transpile/validate.ts` used to be one ~1,441-LoC function with two near-identical inner walkers (`validateRuleStep` ~250 lines, `validateStep` ~350 lines): every step type's validation was written twice with subtle differences, and the five-check call-shape sequence (`validateNoShellRedirection` → `validateNestedManagedCallArgs` → `validateRef` → `validateArity` → `validateBareIdentifierArgs`) was repeated by hand at 6+ sites per side — at least 12 places to keep in sync. Both inner walkers and every duplicated check site are gone. The validator now spans two files. `validate.ts` (~430 LoC) keeps the **outer** layer: import / channel-route / test-block checks and `walkStepTree` (the single descent that builds `{ knownVars, promptSchemas, flat }`). `validate-step.ts` (~1,025 LoC) holds the **per-step** visitor: a single `validateStep(step, ctx)` entry, a `VALIDATORS: Record<WorkflowStepDef["type"], StepValidator>` table with one row per step variant (`trivia`, `const`, `return`, `send`, `say`, `exec`, `if`, `for_lines`), one `validateExpr(expr, …)` dispatcher over the 8 `Expr.kind` values, and one `validateCallable(expr, ctx)` helper that runs the five managed-call-shape checks once for both `call` (`run`) and `ensure_call` (`ensure`) — parameterized by the scope's `runRefExpect` and the target kind. Rule-vs-workflow differences are captured in a `Scope` value (`WORKFLOW_SCOPE` / `RULE_SCOPE`) with three fields: `allowSteps: Set<WorkflowStepDef["type"]>` (single set-lookup gate at the top of `validateStep` — rules reject `send` outright; rules also reject `prompt` and `run async` from inside `exec` bodies), `runRefExpect: RefExpectMessages` (workflow vs rule semantics for `run ref(…)`), and `withPromptSchemas: boolean` (workflows collect prompt-returning bindings, rules skip schema collection). `ValidatorCtx` threads the scope plus the precomputed `knownVars`, `promptSchemas`, and `recoverBindings` into every visitor — none of which are re-derived per step. Every existing `E_VALIDATE` error message and source location is preserved bit-for-bit: the entire `validate-*.test.ts` suite, `src/transpile/compiler-golden.test.ts`, `src/transpile/compiler-edge.acceptance.test.ts`, and the txtar / golden-AST corpora all pass unchanged. New acceptance tests in `src/transpile/validate-visitor.test.ts` pin the invariants: an LoC test caps `validate.ts` at **≤700 lines** so new per-step logic lands in `validate-step.ts` (AC1); a JSON snapshot over every `validate-*` txtar fixture (`test-fixtures/compiler-txtar/validate-errors.txt` + `validate-errors-multi-module.txt`) stored in `test-fixtures/compiler-txtar/validate-diagnostics-snapshot.json` asserts each diagnostic's `{ code, line, col, message }` against `collectDiagnostics(graph)` bit-for-bit (AC3 — refreshable via `UPDATE_SNAPSHOTS=1` only after confirming the message change is intentional); and an "unknown step type" test casts a synthetic step variant into `WorkflowStepDef`, runs `validateStep` in both `WORKFLOW_SCOPE` and `RULE_SCOPE`, and asserts each call produces exactly one diagnostic with the documented `internal: no validator for step type "…"` message (AC4 — proving that adding a new step type costs exactly one row in `VALIDATORS`). The existing `src/transpile/validate-single-walk.test.ts` still passes — `walkStepTree`'s internal `descend` remains the only recursive `WorkflowStepDef[]` walker in `validate.ts` (AC2). The `diagnostics-collector.test.ts` "fatal allowlist" scan now sums `throw jaiphError(` counts across `validate.ts` + `validate-step.ts` (both files are zero) and `diag.error(` counts likewise (≥40). User-visible contracts — CLI behavior, `jaiph format` round-trip, run artifacts, banner, hooks, exit codes, `__JAIPH_EVENT__` streaming, and the full golden corpus — are unchanged byte-for-byte. Out of scope: changes to validation rules (the *what* — this refactor only changes the *how*), parser changes, AST changes. Docs updated in `docs/architecture.md` (rewrote the **Validator** section to describe the two-file split, `VALIDATORS` table, `Scope` value, and the single `validateCallable` helper), `docs/contributing.md` (new **Validator visitor-table shape** row in the test-layer table), and `docs/grammar.md` (refreshed two stale `validateRuleStep` references to point at the new visitor / `RULE_SCOPE`). Implements `design/2026-05-15-parser-compiler-simplification.md` § Refactor 4.
+- **Refactor — Replace fail-fast errors with a `Diagnostics` collector that aggregates every recoverable error per compile:** Today `fail()` (in `src/parse/core.ts`) and `jaiphError()` (in `src/errors.ts`) both throw on the first error, so a user fixed one error, recompiled, hit the next, recompiled, and so on. The validator also pre-ordered some checks defensively because it knew it would only get to surface one error per run. That model is replaced. A new `Diagnostics` class lives in `src/diagnostics.ts` and exposes `add(d)`, `error(file, line, col, code, message)` (records the diagnostic and short-circuits the current unit through a `BailoutError`), `capture(fn)` (runs `fn` and absorbs both `BailoutError` and any thrown legacy `jaiphError` whose message parses as `path:line:col CODE message` — turning the throw into a recoverable entry without re-throwing), `hasErrors()` / `hasFatal()`, `sorted()` (stable order by file, then line, then column), `formatLines()` (one `path:line:col CODE message` per line), and a legacy `throwFirstIfAny()` bridge that throws the first sorted diagnostic via `jaiphError` so existing single-error call sites and per-error tests are unchanged. `src/transpile/validate.ts` exposes a new `collectDiagnostics(graph): Diagnostics` entry that walks the import closure and never throws on user-level errors; the previous `validateReferences(graph)` is now a thin wrapper that calls `collectDiagnostics` and then `throwFirstIfAny()`, preserving the throw-on-first contract for `emitScriptsForModuleFromGraph` / `buildScriptsFromGraph` and for every existing `parse-*.test.ts` / `validate-*.test.ts` fixture that asserts one specific `{ message, line, col, code }`. Inside `validate.ts` every `throw jaiphError(...)` site at user-level (~50 sites across import resolution, channel-route validation, per-rule and per-workflow step walks, prompt schema checks, and `validateTestBlocks`) is migrated to `diag.error(...)`; each top-level unit is wrapped in `diag.capture(...)` (per-import block, per-channel route, per-rule walk, per-rule step, per-workflow walk, per-workflow step, per-test-block step) so the bailout from one error unwinds only that unit and the next sibling still runs. The four leaf validation helpers (`validate-ref-resolution.ts`, `validate-string.ts`, `validate-prompt-schema.ts`, `shell-jaiph-guard.ts`) still throw via `jaiphError`, but every caller wraps them in `diag.capture(...)`, which converts the thrown error into a recoverable diagnostic and returns. The CLI command `jaiph compile` (`src/cli/commands/compile.ts`) is rewritten to route through `collectDiagnostics`: it accumulates every error from every entry's import closure, sorts them by `(file, line, col)`, and prints the full set — as a single JSON array on stdout under `--json`, or as one `path:line:col CODE message` line per diagnostic on stderr otherwise — exiting **1** on any non-empty diagnostic set. Fatal aborts during graph load or parsing (unterminated triple-quote, unterminated brace block, missing imports during graph build) are reported as a single diagnostic for the affected entry; the command then continues with the next entry. New tests in `src/transpile/diagnostics-collector.test.ts` pin the invariants: a fixture with three independent errors (duplicate import alias, undefined channel, unknown `run` target in one workflow body) asserts `collectDiagnostics(graph)` returns all three in source order (AC1); a source-tree scan asserts `validate.ts` holds **zero** `throw jaiphError(` sites and **≥40** `diag.error(` sites, and that every remaining `throw jaiphError(` under `src/` lives in the documented fatal allowlist — `src/diagnostics.ts` (legacy bridge), `src/parse/core.ts` (parser `fail()`), `src/cli/commands/test.ts` (test-file shape fatal), `src/transpile/module-graph.ts` (loader), `src/transpile/validate-string.ts`, `src/transpile/validate-prompt-schema.ts`, `src/transpile/validate-ref-resolution.ts`, `src/transpile/shell-jaiph-guard.ts` (leaf helpers, each captured) (AC3); and a CLI test runs `jaiph compile --json` against the same fixture and asserts the returned array has all three diagnostics and `status !== 0` (AC4). Existing single-error tests (every `parse-*.test.ts` and `validate-*.test.ts` that pins one specific `{ message, line, col, code }`) still pass because `validateReferences` continues to throw the first sorted diagnostic (AC2); `npm test` and `npm run build` pass (AC5). User-visible contracts on the `jaiph run` / `jaiph test` paths — banner, hooks, run artifacts, exit codes, `__JAIPH_EVENT__` streaming, and golden corpus — are unchanged. Out of scope: changing what counts as an error (this refactor only changes the *how*); LSP integration follows in a separate task. Docs updated in `docs/architecture.md` (new **Diagnostics collector (recoverable errors)** bullet under **Validator**; updated **System overview** to describe the two entry points and the new `jaiph compile` behavior), `docs/cli.md` (new **Multiple-error reporting** paragraph and refined **`--json`** description under **`jaiph compile`**), and `docs/contributing.md` (new **Diagnostics collector shape** row in the test-layer table). Implements `design/2026-05-15-parser-compiler-simplification.md` § Appendix B.
+- **Refactor — Fold the validator's three workflow pre-passes into a single step-tree walk:** `src/transpile/validate.ts` used to descend each workflow's / rule's step tree four times before its main check loop finished — `collectKnownVars`, `collectPromptSchemas`, `validateImmutableBindings`, and the per-step validator itself — each re-implementing the same recursion over `if` / `for_lines` / `catch` / `recover` with subtly different rules, so "what counts as a binding here" fixes had to land in two or three walkers. The three pre-pass helpers are deleted. One new helper `walkStepTree(filePath, steps, envDecls, params, declLoc, moduleScripts, parseSchemaFieldNames, { withPromptSchemas })` descends the tree once and returns `{ knownVars, promptSchemas, flat }`: it accumulates `knownVars` (env decls + params + every nested `const` / capture / `for_lines` iterator), `promptSchemas` (top-level prompt-returning bindings — workflow walks set `withPromptSchemas: true`, rule walks set it `false`), enforces immutable-binding and `script`-collision rules inline through a shared `bindings` map (with a fresh inner map under each `for_lines` body so loop iterators only shadow inside the body), and emits a flat `FlatStepEntry[]` of every step in tree order with the enclosing `catch` / `recover` failure binding (`recoverBindings: Set<string> | undefined`) attached. The per-workflow and per-rule validator loops now iterate that flat list non-recursively — the `if` / `for_lines` / `catch` / `recover` recursion that used to live inside `validateStep` / `validateRuleStep` is gone. `walkStepTree`'s internal `descend` is the only recursive helper in the file that takes a `WorkflowStepDef[]`. Failure order matches the prior "binding errors first, then per-step errors" behavior because binding checks fire during the descent, before any flat-list iteration starts. Every existing `E_VALIDATE` error message and location is preserved bit-for-bit: the full `validate-*.test.ts` suite, `src/transpile/compiler-golden.test.ts`, `src/transpile/compiler-edge.acceptance.test.ts`, and the txtar / golden-AST corpora all pass unchanged. New tests pin the invariants: `src/transpile/validate-single-walk.test.ts` greps `validate.ts` and fails if any of `collectKnownVars`, `collectPromptSchemas`, or `validateImmutableBindings` reappear by name (AC1), and a textual AST scan asserts that at most one recursive helper whose parameter list mentions `WorkflowStepDef[]` exists in the file (AC2). User-visible contracts — CLI behavior, `jaiph format` round-trip, run artifacts, banner, hooks, exit codes, `__JAIPH_EVENT__` streaming, and the full golden corpus — are unchanged. Out of scope: the visitor-table refactor (Refactor 4) and any change to validation rules. Docs updated in `docs/architecture.md` (new **Single workflow walk** bullet under **Validator**) and `docs/contributing.md` (new **Validator single-walk shape** row in the test-layer table). Implements `design/2026-05-15-parser-compiler-simplification.md` § Appendix C.
+- **Refactor — Collapse the AST around a single `Expr` type, eliminating the three "managed call" encodings:** The same concept "a managed call that yields a value" used to be encoded three different ways: as a statement (`{ type: "run", workflow, args }`), as a const RHS (`{ kind: "run_capture", ref, args }`), and as a `managed:` sidecar on `return` / `log` / `logerr` whose `value` / `message` carried a placeholder string (`"__match__"`, `"run inline_script"`, etc.). Inline scripts added a fourth (`run_inline_script_capture`); `prompt`, `match`, and `ensure` captures repeated the same dual representation. The validator, formatter, emitter, and runtime each had to handle both branches at every site. All three encodings are gone. The semantic AST now has a single `Expr` tagged union — `literal | call | ensure_call | inline_script | prompt | match | shell | bare_ref` — used everywhere a value can appear: `const name = <Expr>`, `return <Expr>`, `send channel <- <Expr>`, the message of `log` / `logerr` / `fail`, and the body of an `exec` step (the new statement-form managed call, where the value is consumed for its side effects plus optional capture). `ConstRhs` and `SendRhsDef` are deleted as separate types. The `managed:` sidecar field is deleted from `WorkflowStepDef`. The placeholder strings `"__match__"`, `"run inline_script"`, and `"__JAIPH_MANAGED__"` no longer appear anywhere under `src/`. `WorkflowStepDef` collapses from 14 variants to **8** (`exec`, `const`, `return`, `send`, `say`, `if`, `for_lines`, `trivia`): `exec` is the new managed-statement form covering the prior `run` / `ensure` / `run_inline_script` / `prompt` / `shell` / standalone `match` cases (the discriminator now lives inside `body.kind`, with `captureName` / `catch` / `recover` as step-level attributes); `say` covers the prior `log` / `logerr` / `fail` cases (`level: "fail"` aborts the workflow with the message, otherwise the message is written to the corresponding stream); `comment` / `blank_line` collapse into a single `trivia` variant (formatter-only, skipped by validator and runtime). The parser builds `Expr` nodes directly: `parseConstRhs` returns `{ value: Expr }`; `parseSendRhs` returns `{ value: Expr }`; `parsePromptStep` returns an `exec` step whose `body` is an `Expr.prompt`; `return run …` / `return ensure …` / `return match …` / `return run \`…\`(…)` build `Expr.call` / `Expr.ensure_call` / `Expr.match` / `Expr.inline_script` directly with no sidecar; `log run \`…\`(…)` and `logerr run \`…\`(…)` build `say` steps whose `message` is an `Expr.inline_script`. Downstream consumers compress accordingly: the validator switches on the 8-variant `WorkflowStepDef.type` and the 8-kind `Expr.kind` with no "literal value vs managed sidecar" fork; the formatter renders each `Expr` through one `emitExpr` helper instead of branching on a sidecar; the runtime has one private `evaluateExpr(scope, expr, …)` dispatcher that `const` / `return` / `send` / `say` / `exec` all delegate to (which runs the managed call for `call` / `ensure_call` / `inline_script`, walks `match` arms, schema-checks `prompt`, and interpolates `literal` via `interpolateWithCaptures`); the script-emit walk in `src/transpile/emit-script.ts` finds inline-script bodies by recursing into each step's `Expr` payload rather than enumerating the four legacy carriers. New tests pin the invariants: `src/types-shape.test.ts` is a compile-time exhaustive `switch` plus runtime tuple assertion that `WorkflowStepDef` has exactly **8** variants and `Expr` has exactly **8** kinds (AC2), a `grep` over every non-test `.ts` file under `src/` that fails if any of the placeholder strings (`"__match__"`, `"run inline_script"`, `"__JAIPH_MANAGED__"`) reappear (AC1), and an export-surface check that fails if `ConstRhs` or `SendRhsDef` are re-exported from `src/types.ts` (AC3). Updated parser tests in `src/parse/parse-return.test.ts`, `src/parse/parse-const-rhs.test.ts`, `src/parse/parse-prompt.test.ts`, `src/parse/parse-send-rhs.test.ts`, `src/parse/parse-steps.test.ts`, `src/parse/parse-inline-script.test.ts`, and `src/parse/parse-bare-call.test.ts` assert the new `Expr` shape directly for `return run …`, `return ensure …`, `return match … { … }`, `return run \`…\`(…)`, `log run \`…\`(…)`, and `const x = prompt …` (AC4). The golden corpus (`src/transpile/compiler-golden.test.ts`, `src/transpile/compiler-edge.acceptance.test.ts`) passes byte-for-byte against the emitted bash output; `src/format/roundtrip.test.ts` round-trips bit-for-bit on every fixture; `npm run build` passes with zero TypeScript strict-mode errors (AC5 / AC6). Golden AST fixtures under `test-fixtures/golden-ast/expected/` are regenerated to reflect the new step shapes (`exec` wrapping every managed call, `say` replacing `log` / `logerr` / `fail`, `trivia` replacing `comment` / `blank_line`, `Expr` value/message/body payloads). User-visible contracts — CLI behavior, `jaiph format` round-trip, run artifacts, banner, hooks, exit codes, `__JAIPH_EVENT__` streaming, and the full golden corpus — are unchanged byte-for-byte. Out of scope: surface syntax, the validator's deeper structural rewrite (Refactor 4), and parser internals (Refactors 1 & 2). Docs updated in `docs/architecture.md` (rewrote the **AST / Types** bullet to describe the single `Expr` sum and the 8-variant `WorkflowStepDef`; updated **Validator**, **Formatter**, **Node Workflow Runtime**, and **Trivia / CST layer** bullets to drop the dual-representation language; rewrote the `match_expr` mention in **CLI progress reporting pipeline** to use `Expr.kind === "match"`) and `docs/contributing.md` (new **`Expr` / step-variant shape** row in the test-layer table). Implements `design/2026-05-15-parser-compiler-simplification.md` § Refactor 3.
+- **Refactor — Collapse `bareIdentifierArgs` into a typed `Arg[]` on every call site:** Every call-bearing AST node used to carry the call arguments twice — `args: string` (the raw source between the parens) and `bareIdentifierArgs?: string[]` (a re-parse of which of those arguments happened to be bare identifiers). The validator had to remember to check both fields and call a hand-rolled `validateBareIdentifierArgs` helper at every site; the emitter re-parsed `args` from scratch because it didn't trust either field on its own. Both fields are gone. The parser now classifies each argument once, at parse time, into a new typed sum `type Arg = { kind: "literal"; raw: string } | { kind: "var"; name: string }` and stores it on every call-bearing node as `args?: Arg[]`. Affected nodes: `run` / `ensure` workflow steps, `run_inline_script` steps, the `managed` sidecar on `return` / `log` / `logerr` (in all four shapes — `run`, `ensure`, `run_inline_script`, `match`), the `run_capture` / `ensure_capture` / `run_inline_script_capture` const RHS variants, and the `run` send RHS. Downstream consumers walk the typed list directly: the validator's per-call check sequence is now arity (`args.length`), shell-redirection rejection on `literal` raws, nested-unmanaged-call rejection on `literal` raws, ref resolution, and `var`-arg resolution against in-scope bindings via a new `validateArgVarRefs` (the standalone `validateBareIdentifierArgs` helper is deleted); the formatter renders each `Arg` directly (`var` → bare name, `literal` → raw) instead of re-tokenizing a `${ident}`-rewritten string; the runtime turns `Arg[]` back into the space-separated argv string via `argsToRuntimeString` in `src/parse/core.ts` (`var` → `${name}`, `literal` → raw) so the existing handle-resolution / interpolation path is unchanged. New tests pin the invariants: `src/parse/arg-ast-shape.test.ts` is a compile-time assertion that `bareIdentifierArgs` does not appear on `WorkflowStepDef` (`ensure`, `run`, `run_inline_script`, `log.managed`, `logerr.managed`, `return.managed` in `run` / `ensure` / `run_inline_script` shapes), `ConstRhs` (`run_capture`, `ensure_capture`, `run_inline_script_capture`), or the `run` `SendRhsDef` variant (AC1); `src/parse/arg-grep.test.ts` walks every non-test `.ts` under `src/parse/` and `src/transpile/` and fails if any production file matches `args.split(",")` or the bare token `bareIdentifierArgs` (AC2), and separately fails if any file under `src/transpile/` references `validateBareIdentifierArgs` (AC3). The golden compiler corpus, `validate-*.test.ts` files, and the golden AST corpus pass byte-for-byte (AC4); `npm run build` passes with zero TypeScript strict-mode errors (AC5). User-visible contracts — CLI behavior, `jaiph format` round-trip, run artifacts, banner, hooks, exit codes, `__JAIPH_EVENT__` streaming, and the full golden corpus — are unchanged. Out of scope: the full `Expr` collapse (next task) and surface syntax. Docs updated in `docs/architecture.md` (extended **AST / Types** bullet documenting the typed `Arg` sum; updated **Validator** and **Formatter** bullets to drop the dual representation), `docs/contributing.md` (new **Call-args AST shape** row in the test-layer table), and `docs/spec-async-handles.md` (replaces the stale `commaArgsToSpaced` reference with `argsToRuntimeString`). Implements `design/2026-05-15-parser-compiler-simplification.md` § Appendix D.
+- **Refactor — Split source-fidelity data from the semantic AST into a `Trivia` (CST) layer:** Around ten fields whose only consumer was the formatter — `leadingComments` on imports / script imports / channels / `const` decls / `test` blocks, `configLeadingComments`, `trailingTopLevelComments`, `configBodySequence` (both module- and workflow-scoped), `topLevelOrder`, `bareSource` on `return`, the `tripleQuoted` flags on `literal` / `return` / `log` / `logerr` / `fail` / `send` / `const`, and the prompt / script `bodyKind` / `bodyIdentifier` discriminators — are removed from `jaiphModule`, `WorkflowStepDef`, `ConstRhs`, `SendRhsDef`, `WorkflowMetadata`, `ImportDef`, `ScriptImportDef`, `ChannelDef`, `ScriptDef`, and `TestBlockDef`, and re-homed in a new parallel `Trivia` store (`src/parse/trivia.ts`) keyed by AST-node identity (per-node `WeakMap`) plus a small `ModuleTrivia` record for module-level data. The parser exposes `parsejaiphWithTrivia(source, filePath) → { ast, trivia }`; the legacy `parsejaiph(source, filePath)` is now a thin wrapper that drops trivia for callers that don't care (validator, transpiler, runtime, `loadModuleGraph`). The formatter (`emitModule(ast, trivia, opts?)`) is the only consumer of `Trivia`; validator, emitter, transpiler, and runtime never import from `src/parse/trivia.ts`. New tests pin the invariants: `src/parse/trivia-ast-shape.test.ts` is a compile-time assertion (with runtime echo) that none of the listed fields reappear on any semantic AST type (AC1); `src/parse/trivia-grep.test.ts` greps validator and emitter source files and fails if any of them references `Trivia` / `createTrivia` / `NodeTrivia` / `ModuleTrivia` or imports from `parse/trivia` (AC2); `src/format/roundtrip.test.ts` walks every `.jh` under `examples/` and `test-fixtures/golden-ast/fixtures/` and asserts `parse → format → parse → format` converges bit-for-bit (AC3). Golden AST fixtures under `test-fixtures/golden-ast/expected/` are regenerated to drop the moved fields. User-visible contracts (CLI behavior, `jaiph format` round-trip, run artifacts, banner, hooks, exit codes, `__JAIPH_EVENT__` streaming) are unchanged. `npm test` and `npm run build` pass with zero TypeScript strict-mode errors (AC4 / AC5). Out of scope: the `Expr` collapse — this refactor only relocates source-fidelity fields without changing the semantic AST's shape. Docs updated in `docs/architecture.md` (new **Trivia / CST layer** section with anchor `#trivia-cst-layer`, plus updated **Parser**, **AST / Types**, and **Formatter** bullets) and `docs/contributing.md` (new row in the test-layer table). Implements `design/2026-05-15-parser-compiler-simplification.md` § Appendix A.
+- **Refactor — `ModuleGraph` is the single representation of "all `.jh` modules reachable from an entry point, parsed once":** The previous three traversal strategies for compile-time module discovery (validator re-reading imports through `ValidateContext`, `emitScriptsForModule` re-wrapping the same callbacks with an optional `prep` cache, and `buildScripts` walking the filesystem directly) collapse to one path. `parsejaiph(source, filePath)` is now strictly I/O-pure — it can no longer reach `fs`. The single discovery routine `loadModuleGraph(entry, workspaceRoot?)` (`src/transpile/module-graph.ts`) walks the entry plus its transitive `import` closure and returns `{ entryFile, workspaceRoot?, modules: Map<absPath, { filePath, ast, imports }> }`; every other compile-time consumer takes the graph and never re-reads `.jh` from disk. `validateReferences(graph)` and `emitScriptsForModuleFromGraph(graph, file, rootDir)` operate entirely in-memory. The `ValidateContext` interface (`resolveImportPath` / `existsSync` / `readFile` / `parse` / `workspaceRoot` callbacks) is deleted from `src/transpile/validate.ts`; the validator consumes the graph and uses `existsSync` only to resolve `import script` paths (non-`.jh` bodies). `CompilePrep` / `prepareCompile` / `writeCompilePrep` / `readCompilePrep` and the optional `prep?` parameter on `emitScriptsForModule` / `buildScripts` are gone; `buildScripts(input, outDir, ws?)` now loads a graph internally and `buildScriptsFromGraph(graph, outDir, rootDir?)` is the entry point for callers that already loaded one. `buildRuntimeGraph` accepts either an entry file path (legacy) or an already-loaded `ModuleGraph` — `RuntimeGraph` is a type alias for `ModuleGraph` (the only "all reachable modules" representation in the codebase). The cross-process cache file moves to `<outDir>/.jaiph-module-graph.json` (deterministic JSON: entries sorted by absolute path, ASTs included verbatim) via `writeModuleGraph` / `readModuleGraph`, and the internal env var the spawned `node-workflow-runner.js` reads is renamed `JAIPH_MODULE_GRAPH_FILE` (replacing `JAIPH_COMPILE_PREP_FILE`). Scope of the env-var hand-off is unchanged: set only for the default local non-Docker `jaiph run` path; `jaiph run --raw`, `jaiph test`, and Docker launches fall back to `loadModuleGraph` from the source file. User-visible contracts — banner, hooks, run artifacts, `run_summary.jsonl`, `return_value.txt`, exit codes, `__JAIPH_EVENT__` streaming, CLI usage, and the full golden corpus (`compiler-golden.test.ts`, `compiler-edge.acceptance.test.ts`) — are unchanged byte-for-byte. New tests (`src/transpile/module-graph.test.ts`, `src/transpile/pipeline-io-purity.test.ts`) stub `node:fs` to throw on any `.jh` read and run the full pipeline against `test-fixtures/` to pin the I/O-purity invariant; another test instruments `parsejaiph` with a call counter to assert no duplicate parses across `loadModuleGraph` → `validateReferences` → `emit` → `buildRuntimeGraph` for fixtures with transitive imports. `src/transpile/compile-prep.ts` and `compile-prep.test.ts` are removed. Docs updated in `docs/architecture.md`, `docs/cli.md`, and `docs/testing.md`. Implements `design/2026-05-15-parser-compiler-simplification.md` § Refactor 5.
+- **Performance — `jaiph install` parallelism:** Missing-library clones now run in parallel through a small bounded-concurrency executor (default 4 in flight), replacing the previous sequential `execSync` loop. The user contract is unchanged: warm-path libraries (target directory exists and `--force` is absent) still skip without invoking `git` for both explicit args and restore-from-lock; failed clones still exit non-zero and do not produce a lock entry; restore-from-lock still does not invent new lock entries. The default clone runner now uses `spawn("git", ["clone", "--depth", "1", …])` so multiple clones can overlap network and process latency. `runInstall` is now `async` and exposes injectable `CloneRunner` / `concurrency` options for testing. Tests cover concurrent overlap (peak in-flight ≥ 2), warm-path skipping for explicit args and restore, invalid-remote and unknown-ref failure paths, mixed success/failure lockfile bookkeeping, and the existing corrupt/missing-lockfile behavior. Docs updated in `docs/cli.md` and `docs/libraries.md`.
 
 # 0.9.4
 
 ## Summary
 
-Maintenance and simplification:
-- **Breaking:** Inbox dispatch is sequential only (parallel config/env removed). Stricter grammar: multiline `config` blocks only; no one-line braced workflows; no semicolon-separated statements in workflow/rule bodies.
-- **Runtime:** Single-line shell steps run in the Node runtime (`sh -c`); script capture only on success; async `run` + `recover` return propagation fixed; mock prompts use JSON arm dispatch and an in-memory response queue; inbox artifact files are written only when a route consumes the channel.
-- **CLI / install:** Failure footers use the **last** failed step in `run_summary.jsonl`; curl install ships `package.json` so stable installs resolve the correct default Docker image tag.
-- **Language:** RHS bare identifiers and bare dotted identifiers are treated as interpolation sugar where applicable.
-- **Library:** `artifacts.save(paths)` in single-argument form (path or newline-separated list); `git format-patch` workflows use `--stdout` so patch bytes are captured.
-- **Repo:** `node-workflow-runtime` split into arg-parser, event-emitter, and mock modules; test directories consolidated under `integration/`, `test-fixtures/`, `test-infra/`; `JAIPH_TEST_MODE` no longer suppresses stderr events in runtime code (constructor option instead).
-- **Docs / DX:** Agent-proxy design note; explicit parse error for `test` blocks outside `*.test.jh`; architecture/inbox corrections; getting-started shortened.
+- Feature: `for <line> in <string> { ... }` loop.
+- Simplifying: Sequential inbox only; stricter grammar (multiline `config`, no one-line braced workflows, no `;` in workflow/rule bodies).
+- Hardening, test refactoring and bug fixes
 
 ## All changes
 
+- **Language:** `for <id> in <id> { … }` in workflows and rules iterates newline-delimited lines of a string binding. Newlines normalize `\r\n` to `\n`; a single trailing empty segment from a final newline is omitted. Lines are not trimmed and empty interior lines are still iterated unless the body skips them (e.g. `if line != "" { … }`). Documented in `docs/language.md`.
+- **Tests / QA:** Unit tests for string line splitting (`src/runtime/string-lines.test.ts`); E2E `e2e/tests/135_for_string_lines.sh`.
 - **Breaking — Language:** Inline one-line `config { k = v }` is removed — only the multiline `config {\n  … \n}` form parses (matches documented grammar). The formatter no longer emits compact inline `config`, which would be invalid input. Examples such as `examples/async.jh` were migrated.
 - **Breaking — Language:** Single-line `workflow name() { stmt }` braced form removed; workflow and rule bodies require one statement per line as in the grammar.
 - **Breaking — Language:** Semicolons no longer separate statements in workflow/rule bodies (`splitStatementsOnSemicolons` remains for `match` arms). Multiple statements on one line joined by `;` must be split across lines.
diff --git a/QUEUE.md b/QUEUE.md
index 72264987..64f890c3 100644
--- a/QUEUE.md
+++ b/QUEUE.md
@@ -4,47 +4,12 @@ Process rules:
 
 1. Tasks are executed top-to-bottom.
 2. The first `##` section is always the current task.
-3. When a task is completed, remove that section entirely.
-4. Every task must be standalone: no hidden assumptions, no "read prior task" dependency.
-5. This queue assumes **hard rewrite semantics**:
+3. Task that is ready for implementation is marked with `#dev-ready` at the end of the header.
+4. When a task is completed, remove that section entirely.
+5. Every task must be standalone: no hidden assumptions, no "read prior task" dependency.
+6. This queue assumes **hard rewrite semantics**:
    * breaking changes are allowed,
    * backward compatibility is **not** a design goal unless a task explicitly says otherwise.
-6. **Acceptance criteria are non-negotiable.** A task is not done until every acceptance bullet is verified by a test that fails when the contract is violated. "It works on my machine" or "the existing tests pass" is not acceptance.
-
-***
-
-## Performance — investigate and fix slow installation
-
-**Goal**
-`jaiph install` (and related dependency or bootstrap steps) feels unreasonably slow; find the dominant cost and improve it without weakening reproducibility (lockfile, shallow clone behavior, etc.).
-
-**Scope**
-
-* Profile or instrument the install path (git clone, lockfile I/O, post-install) and document the top 1–3 contributors to latency.
-* Implement targeted fixes (e.g. avoid redundant work, reduce subprocess churn, cache safely) and verify wall-clock improvement on a cold and warm run where applicable.
-
-**Acceptance criteria**
-
-* A short note in the commit or PR description states what was slow and what changed, with before/after rough timings on the same machine.
-* `jaiph install` behavior remains correct: same lockfile semantics and failure modes for bad URLs or missing refs.
-* `npm test` passes.
-
-***
-
-## Performance — investigate and fix slow workflow start (initial 2–4 s lag)
-
-**Goal**
-When starting workflows (e.g. `jaiph run` / first step), users observe a 2–4 second delay before useful work; reduce that lag or explain and eliminate unnecessary startup work (JIT, imports, process spawn, discovery).
-
-**Scope**
-
-* Reproduce the lag with a minimal `.jh` workflow; trace Node startup, module load, and runtime init (`NodeWorkflowRuntime` and friends).
-* Address fixable costs (e.g. defer heavy work, lazy imports, avoid redundant file scans) without changing user-visible workflow semantics.
-
-**Acceptance criteria**
-
-* Documented repro (command + minimal file) and what was measured (time to first event / first step).
-* Measurable reduction in the cold-start path on a representative case, or a clear justification if the lag is irreducible (e.g. external subprocess).
-* `npm test` passes.
+7. **Acceptance criteria are non-negotiable.** A task is not done until every acceptance bullet is verified by a test that fails when the contract is violated. "It works on my machine" or "the existing tests pass" is not acceptance.
 
 ***
diff --git a/README.md b/README.md
index baeb4b2c..82fb3d97 100644
--- a/README.md
+++ b/README.md
@@ -1,6 +1,8 @@
 # ![Jaiph](docs/logo.png)
 
-[jaiph.org](https://jaiph.org) · [Getting Started](docs/getting-started.md) ([jaiph.org/getting-started](https://jaiph.org/getting-started)) · [Setup](docs/setup.md) · [Libraries](docs/libraries.md) · [Language](docs/language.md) · [Grammar](docs/grammar.md) · [CLI](docs/cli.md) · [Configuration](docs/configuration.md) · [Testing](docs/testing.md) · [Hooks](docs/hooks.md) · [Inbox & Dispatch](docs/inbox.md) · [Sandboxing](docs/sandboxing.md) · [Runtime artifacts](docs/artifacts.md) · [Async Handles](docs/spec-async-handles.md) · [Architecture](docs/architecture.md) · [Contributing](docs/contributing.md)
+[jaiph.org](https://jaiph.org) · [Your first workflow](docs/first-workflow.md) · [Your first agent + sandboxed run](docs/first-agent-run.md) · [Install & switch versions](docs/setup.md) · [Agent Skill](https://raw.githubusercontent.com/jaiphlang/jaiph/refs/heads/main/docs/jaiph-skill.md) · [Architecture](docs/architecture.md) · [CLI](docs/cli.md) · [Contributing](docs/contributing.md)
+
+> **Docs note:** The Jaiph documentation site follows the [Diátaxis](https://diataxis.fr/) framework. Tutorials: [Your first workflow](docs/first-workflow.md), [Your first agent + sandboxed run](docs/first-agent-run.md). How-to: [Install & switch versions](docs/setup.md), [Run in a Docker sandbox](docs/sandbox-run.md), [Authenticate agent backends](docs/agent-auth.md), [Configure backend & model](docs/configure-backend.md), [Add a hook](docs/hooks.md), [Use & publish a library](docs/libraries.md), [Save artifacts](docs/artifacts.md), [Write & run tests](docs/testing.md). Reference: [CLI](docs/cli.md), [Configuration](docs/configuration.md), [Grammar](docs/grammar.md), [Language](docs/language.md), [Environment variables](docs/env-vars.md). Explanation: [Why Jaiph](docs/why-jaiph.md), [Architecture](docs/architecture.md), [Sandboxing](docs/sandboxing.md), [Inbox & Dispatch](docs/inbox.md), [Async Handles](docs/spec-async-handles.md). Contributor: [Contributing](docs/contributing.md), [Agent Skill](https://raw.githubusercontent.com/jaiphlang/jaiph/refs/heads/main/docs/jaiph-skill.md).
 
 ---
 
@@ -21,9 +23,9 @@
 - **Workflows** — Compose `prompt`, `run`, `ensure`, channel sends, conditionals, `run async` with implicit join, `catch`, and repair-and-retry `recover`.
 - **Rules and scripts** — Rules stay structured (no raw shell lines); **`script`** steps run bash or polyglot code as subprocesses.
 - **Agents** — Backends include Cursor, Claude, Codex (HTTP), or a custom `agent.command`.
-- **Testing** — `*.test.jh` files run in-process (`jaiph test`) with mocks and `expect_*` assertions ([Testing](docs/testing.md)).
-- **Safety and inspectability** — Docker-backed sandbox for **`jaiph run`** (env-controlled; see [Sandboxing](docs/sandboxing.md)); live **`__JAIPH_EVENT__`** on stderr and durable **`.jaiph/runs/`** artifacts ([Architecture](docs/architecture.md)).
-- **Tooling** — `jaiph compile`, `jaiph format`, `jaiph install` / `.jaiph/libs/`, and optional `hooks.json` ([CLI](docs/cli.md), [Hooks](docs/hooks.md)).
+- **Testing** — `*.test.jh` files run in-process (`jaiph test`) with mocks and `expect_*` assertions ([Write & run tests](docs/testing.md)).
+- **Safety and inspectability** — Docker-backed sandbox for **`jaiph run`** (env-controlled; see [Sandboxing](docs/sandboxing.md) and [Run in a Docker sandbox](docs/sandbox-run.md)); live **`__JAIPH_EVENT__`** on stderr and durable **`.jaiph/runs/`** artifacts ([Architecture](docs/architecture.md)).
+- **Tooling** — `jaiph compile`, `jaiph format`, `jaiph install` / `.jaiph/libs/` ([Use & publish a library](docs/libraries.md)), and optional `hooks.json` ([CLI](docs/cli.md), [Add a hook](docs/hooks.md)).
 
 ## Core components
 
@@ -31,7 +33,7 @@
 - **Parser** (`src/parser.ts`, `src/parse/*`) — `.jh` / `.test.jh` → AST.
 - **Validator** (`src/transpile/validate.ts`) — imports and symbol references at compile time.
 - **Transpiler** (`src/transpile/*`) — emits atomic `script` files under `scripts/` only (no workflow-level shell).
-- **Node workflow runtime** (`src/runtime/kernel/node-workflow-runtime.ts`, `graph.ts`) — interprets the AST; `buildRuntimeGraph()` is parse-only across imports.
+- **Node workflow runtime** (`src/runtime/kernel/node-workflow-runtime.ts`, `graph.ts`) — interprets the AST; `buildRuntimeGraph(graph)` consumes the `ModuleGraph` produced by `loadModuleGraph` (no filesystem reads).
 - **Node test runner** (`src/runtime/kernel/node-test-runner.ts`) — `*.test.jh` blocks with mocks.
 - **JS kernel** (`src/runtime/kernel/`) — prompts, managed scripts, `__JAIPH_EVENT__`, inbox, mocks.
 Diagrams, runtime contracts, on-disk artifact layout, and distribution: **[Architecture](docs/architecture.md)**. Test layers and E2E policy: **[Contributing](docs/contributing.md)**.
@@ -62,9 +64,9 @@ Or install from npm:
 npm install -g jaiph
 ```
 
-Verify: `jaiph --version`. Switch versions: `jaiph use nightly` or `jaiph use 0.9.4`.
+Verify: `jaiph --version`. Switch versions: `jaiph use nightly` or `jaiph use 0.10.0`.
 
-Initialize a project (optional): `jaiph init` writes `.jaiph/` with bootstrap workflow, gitignore entries for runs/tmp, and **`SKILL.md`** when the CLI resolves a skill file on disk (`JAIPH_SKILL_PATH`, install-relative `jaiph-skill.md`, or `docs/jaiph-skill.md` under cwd — see [Setup](docs/setup.md)). Canonical skill text for agents: `https://raw.githubusercontent.com/jaiphlang/jaiph/refs/heads/main/docs/jaiph-skill.md`.
+Initialize a project (optional): `jaiph init` writes `.jaiph/` with bootstrap workflow, gitignore entries for runs/tmp, and **`SKILL.md`**. The CLI resolves the skill body in this order — `JAIPH_SKILL_PATH`, install-relative `jaiph-skill.md`, `docs/jaiph-skill.md` under cwd, then an **embedded copy baked into the binary** as the final fallback — so `jaiph init` always writes `SKILL.md` (see [Install & switch versions](docs/setup.md)). Canonical skill text for agents: `https://raw.githubusercontent.com/jaiphlang/jaiph/refs/heads/main/docs/jaiph-skill.md`.
 
 ## Usage
 
@@ -73,7 +75,7 @@ Initialize a project (optional): `jaiph init` writes `.jaiph/` with bootstrap wo
 - Validate without executing: `jaiph compile …` (same `validateReferences` checks as before `jaiph run`; no `scripts/` emission — see [Architecture](docs/architecture.md)).
 - Format sources: `jaiph format …` / `jaiph format --check …`.
 
-Full flags and environment variables: [CLI reference](docs/cli.md). Doc map: [Getting Started](docs/getting-started.md).
+Full flags and environment variables: [CLI](docs/cli.md), [Environment variables](docs/env-vars.md). New here? Start with [Your first workflow](docs/first-workflow.md).
 
 ## Example
 
@@ -102,12 +104,12 @@ workflow default(task) {
 ./main.jh "add user authentication"
 ```
 
-For the full language reference, see [Grammar](docs/grammar.md). For install, workspace layout, libraries, CLI commands, configuration, testing, sandboxing, hooks, inbox dispatch, and on-disk run output, see [Getting Started](docs/getting-started.md) (map), [Setup](docs/setup.md), and [Runtime artifacts](docs/artifacts.md), or visit [jaiph.org](https://jaiph.org).
+For the full language reference, see [Grammar](docs/grammar.md) and [Language](docs/language.md). For install, libraries, sandboxing, hooks, testing, and artifacts, see the How-to quadrant: [Install & switch versions](docs/setup.md), [Use & publish a library](docs/libraries.md), [Run in a Docker sandbox](docs/sandbox-run.md), [Add a hook](docs/hooks.md), [Write & run tests](docs/testing.md), [Save artifacts](docs/artifacts.md). New to Jaiph? Start with the tutorials: [Your first workflow](docs/first-workflow.md) and [Your first agent + sandboxed run](docs/first-agent-run.md). Or visit [jaiph.org](https://jaiph.org).
 
 ## Start here
 
 - **AI agent** who wants to work in a predictable, structured way? Read the [Agent Skill](https://raw.githubusercontent.com/jaiphlang/jaiph/refs/heads/main/docs/jaiph-skill.md) — it teaches you how to author Jaiph workflows and makes your behavior verifiable and auditable.
-- **Human** who manages agents and wants reliable, repeatable automation? See the [Samples](https://github.com/jaiphlang/jaiph/tree/main/examples) and [Getting Started](docs/getting-started.md).
+- **Human** who manages agents and wants reliable, repeatable automation? See the [Samples](https://github.com/jaiphlang/jaiph/tree/main/examples) and [Your first workflow](docs/first-workflow.md).
 - **Contributor** who wants to improve Jaiph itself? See [Contributing](docs/contributing.md).
 
 ## Contributing
diff --git a/design/2026-05-15-parser-compiler-simplification.md b/design/2026-05-15-parser-compiler-simplification.md
new file mode 100644
index 00000000..f2d2d09d
--- /dev/null
+++ b/design/2026-05-15-parser-compiler-simplification.md
@@ -0,0 +1,347 @@
+# Parser & Compiler Simplification — design doc
+
+*Five refactors to compress `src/parse/` and `src/transpile/` by roughly a third, make the AST a clean sum type, and turn "add a new step or keyword" into a one-place change.*
+
+**Status:** design — ready for implementation
+**Date (UTC):** 2026-05-15
+
+---
+
+## Problem
+
+The parser and compiler work, and the golden-test corpus (`src/transpile/compiler-golden.test.ts`, `src/transpile/compiler-edge.acceptance.test.ts`) pins their behavior tightly. But the code has accumulated:
+
+- Parallel cascades of `startsWith` + regex dispatch (`src/parse/workflow-brace.ts`, 615 lines).
+- Seven independent copies of the same quote-aware scanner (`splitCatchStatements`, `splitStatementsOnSemicolons`, `matchSendOperator`, `hasUnquotedSendArrow`, `indexOfClosingDoubleQuote`, `stripQuotedArgContent`, the scanner inside `parseSendRhs`).
+- Three near-identical 100+ line catch/recover parsers (`parseEnsureStep`, `parseRunCatchStep`, `parseRunRecoverStep` in `src/parse/steps.ts`) plus a mini parser (`parseCatchStatement`) that re-implements `parseBlockStatement`.
+- An AST in which "managed call that yields a value" has **three different encodings** (`run_capture` const RHS; statement form; `managed:` sidecar on `return`/`log`/`logerr` with a placeholder `value: "__match__"` string).
+- A 1,441-line `validate.ts` with two near-identical step walkers (`validateRuleStep`, `validateStep`) that each manually repeat the 5-check sequence (`validateNoShellRedirection` → `validateNestedManagedCallArgs` → `validateRef` → `validateArity` → `validateBareIdentifierArgs`) at ~6 sites per side.
+- Three different traversal strategies for "the set of modules in this build": the validator recursively re-reads + re-parses imports via `ValidateContext` callbacks; `emitScriptsForModule` wraps the same callbacks with a `prep` cache; `buildScripts` walks the file system directly.
+
+None of this is broken. All of it makes the code expensive to change and easy to break in subtle ways (e.g. a fix to triple-quote-aware splitting has to be applied in 2–4 places, and divergence between them isn't always caught by the existing tests).
+
+The five refactors below address the structural issues, in the order I recommend implementing them.
+
+---
+
+## Refactor 1 — Real tokenizer instead of line-walking + regex cascades
+
+**Touches:** `src/parser.ts`, `src/parse/workflow-brace.ts` (615 lines), `src/parse/steps.ts` (757 lines), `src/parse/statement-split.ts` (304 lines), `src/parse/core.ts` (scanner helpers).
+
+### Current shape
+
+The parser walks `lines: string[]` and every routine returns `{ step, nextIdx }`. Statement dispatch is a long cascade of `startsWith` + regex in `parseBlockStatement` (`src/parse/workflow-brace.ts:102-615`). Order matters — `"run async "` must be tested before `"run "`, `"prompt "` before bare assignment, etc. Adding a new keyword means finding the right slot in the cascade.
+
+Quote-aware string scanning is re-implemented from scratch in at least seven places (grep `inDoubleQuote`, `inTripleQuote`, `braceDepth` across `src/parse/`). Each copy has slightly different rules for escaping, triple-quotes, and brace nesting.
+
+```ts
+// Today (src/parse/workflow-brace.ts):
+if (inner.startsWith("run async ")) { /* 40 lines */ }
+if (inner.startsWith("run ")) {       /* 50 lines */ }
+if (inner.startsWith("ensure ")) { ... }
+if (inner.startsWith("log "))    { ... }
+// ... 14 more branches
+```
+
+### Proposed shape
+
+A tokenizer that owns string/triple-quote/backtick/fence/comment/brace state, plus a recursive-descent parser that consumes a token stream and dispatches via table lookup.
+
+```ts
+// Proposed:
+const tokens = tokenize(source);        // single source of truth for scanning
+const ast    = parseModule(tokens);     // recursive descent
+
+const STATEMENT: Record<Keyword, StatementParser> = {
+  run:    parseRunStatement,
+  ensure: parseEnsureStatement,
+  log:    parseLogStatement,
+  // ...
+};
+```
+
+### Net effect
+
+- One canonical scanner instead of seven.
+- A new statement form becomes a one-file change (add a row to `STATEMENT`).
+- Expected reduction: **~1,500 lines** in `src/parse/`.
+
+### Constraints
+
+- Must pass the full existing golden test corpus byte-for-byte.
+- Staged behind a flag (run both parsers, diff ASTs in CI) during transition is acceptable.
+
+---
+
+## Refactor 2 — Unify `catch` / `recover` / inline-block parsing
+
+**Touches:** `src/parse/steps.ts` — `parseEnsureStep` (130 lines), `parseRunCatchStep` (110 lines), `parseRunRecoverStep` (110 lines), `parseCatchStatement` (280 lines).
+
+### Current shape
+
+Three near-identical 100+ line functions parse the same syntactic shape:
+
+```
+<host-step> <keyword> (binding) { body } | single-stmt
+```
+
+They differ in only two things: which host step they decorate (`ensure` vs `run`) and the literal keyword (`catch` vs `recover`).
+
+The body parser inside them, `parseCatchStatement` (`src/parse/steps.ts:89-389`), is itself a stripped-down copy of `parseBlockStatement`. The two diverge in subtle ways — e.g. `parseCatchStatement` handles return/fail/run/ensure/prompt/log via slightly different regexes than the main path.
+
+### Proposed shape
+
+```ts
+function parseAttachedBlock(
+  keyword: "catch" | "recover",
+  host: WorkflowStepDef,
+): { bindings: { failure: string }; body: WorkflowStepDef[] };
+
+// Body parsed by the SAME parseStatement used at the top level.
+```
+
+### Net effect
+
+- One body parser instead of two.
+- "Is this statement allowed inside a catch?" becomes a validator concern (Refactor 4), not something the parser enforces by what each mini-routine happens to recognize.
+- Expected reduction: **~400 lines**.
+
+---
+
+## Refactor 3 — One `Call` / `Expr` shape, not three "managed" encodings
+
+**Touches:** `src/types.ts` — `WorkflowStepDef` (14 variants), `ConstRhs` (6 kinds), `SendRhsDef` (5 kinds).
+
+### Current shape
+
+The same concept — "a managed call that yields a value" — is encoded three different ways depending on where it appears:
+
+```ts
+// As a statement:
+{ type: "run", workflow, args, ... }
+
+// As a const RHS:
+{ kind: "run_capture", ref, args, ... }
+
+// As a return / log / logerr value:
+{
+  type: "return",
+  value: "__match__",          // placeholder string for the formatter
+  managed: { kind: "match", match },
+}
+```
+
+The `return + managed` form is the worst offender. It stores placeholder strings (`"__match__"`, `"run inline_script"`, `"run foo(...)"`) so the formatter has something to print, while the real semantic payload lives in `managed`. Validator and emitter both have to know about the dual representation. Inline scripts add a fourth variant — `run_inline_script_capture` — that is yet another form of the same idea.
+
+### Proposed shape
+
+```ts
+type Expr =
+  | { kind: "literal";       raw: string; tripleQuoted?: boolean }
+  | { kind: "var";           name: string; field?: string }
+  | { kind: "call";          callee: Ref;   args: Arg[];   bareIdentifierArgs?: string[] }
+  | { kind: "ensure_call";   callee: Ref;   args: Arg[];   bareIdentifierArgs?: string[] }
+  | { kind: "inline_script"; lang?: string; body: string;  args?: string }
+  | { kind: "prompt";        body: Expr;    returns?: Schema }
+  | { kind: "match";         subject: Expr; arms: MatchArm[] };
+
+// Everywhere a value can appear, it is now an Expr:
+type ConstRhs    = Expr;
+type SendRhs     = Expr | ChannelArrow;
+type ReturnStep  = { type: "return"; value: Expr; loc: SourceLoc };
+type LogStep     = { type: "log";    message: Expr; loc: SourceLoc };
+```
+
+### Net effect
+
+- `WorkflowStepDef` drops from ~14 → ~7 variants.
+- Validator's per-step duplication of "is there a managed call here?" disappears — one `validateExpr` recursion handles it.
+- The placeholder-string + sidecar pattern goes away entirely.
+
+### Migration note
+
+This is a breaking AST change, but the on-disk surface syntax does not move. The hard-rewrite policy (per `QUEUE.md`) allows this. Golden tests must pass byte-for-byte against the emitted bash output; the AST shape they pin (if any) is internal and is allowed to change.
+
+---
+
+## Refactor 4 — Validator as a visitor table, not a 1,441-line switch
+
+**Touches:** `src/transpile/validate.ts` (1,441 lines, one function).
+
+### Current shape
+
+`validateReferences` contains two near-identical inner functions — `validateRuleStep` (~250 lines) and `validateStep` (~350 lines) — each a big switch over step types. They differ in three things:
+
+1. Which step types are allowed (`prompt` / `send` are rejected in rules).
+2. Which ref-expectation spec is used (`RULE_REF_EXPECT` vs `RUN_TARGET_REF_EXPECT`).
+3. Whether the scope is workflow-wide or rule-wide.
+
+Each step type's validation is written twice with subtle differences. The 5-check sequence (`validateNoShellRedirection` → `validateNestedManagedCallArgs` → `validateRef` → `validateArity` → `validateBareIdentifierArgs`) is repeated by hand at 6+ sites per side, which means at least 12 places to keep in sync.
+
+### Proposed shape
+
+```ts
+const VALIDATORS: Record<StepType, Validator> = {
+  ensure: validateCallStep("ensure"),
+  run:    validateCallStep("run"),
+  prompt: validatePrompt,
+  log:    validateMessageStep("log"),
+  send:   validateSend,
+  // ...
+};
+
+const SCOPE = {
+  workflow: { allow: ALL,                        refSpec: workflowRefs },
+  rule:     { allow: ALL.minus(["prompt","send"]), refSpec: ruleRefs },
+};
+
+walk(ast, (step, ctx) => {
+  if (!ctx.scope.allow.has(step.type)) reject(step);
+  VALIDATORS[step.type](step, ctx);
+});
+```
+
+### Net effect
+
+- Each check (redirection, nested-managed, ref, arity, bare-args) is written once.
+- "Is this step allowed here?" is a one-line set lookup, not three throw sites.
+- Expected reduction: **~500–700 lines**.
+
+---
+
+## Refactor 5 — Promote `CompilePrep` to a first-class `ModuleGraph`
+
+**Touches:** `src/transpile/compile-prep.ts`, `src/transpiler.ts`, `src/transpile/build.ts`, `src/transpile/validate.ts`.
+
+### Current shape
+
+The parser is intended to be pure (`source → AST`), but in practice the validator takes a `ValidateContext`:
+
+```ts
+interface ValidateContext {
+  resolveImportPath: (fromFile, importPath, ws?) => string;
+  existsSync:        (path) => boolean;
+  readFile:          (path) => string;
+  parse:             (content, filePath) => jaiphModule;
+  workspaceRoot?:    string;
+}
+```
+
+…so it can recursively read + re-parse imported modules. `emitScriptsForModule` then re-wraps those same callbacks with an optional `prep` cache. `buildScripts` walks the file system on its own. There are three different traversal strategies for "the set of modules in this build."
+
+`compile-prep` already proved the right model — pre-parse all reachable modules once, hand them to validator and emitter. It just isn't the only path.
+
+### Proposed shape
+
+```ts
+// Pipeline:
+const graph = loadModuleGraph(entry, workspaceRoot);  // discover + parse-all
+validate(graph);                                       // pure, in-memory
+emit(graph, outDir);                                   // pure, in-memory
+
+// parsejaiph(source, file): jaiphModule  — now I/O-pure.
+// validate, emit never touch disk.
+```
+
+### Net effect
+
+- Parser becomes I/O-pure (easier to fuzz, easier to test).
+- Validator drops its `ValidateContext` shape.
+- Build, validate, and emit all read from one place.
+- Same path serves single-file LSP edits (graph rooted at one file) and full compile (graph rooted at workspace root).
+- Expected reduction: **~300 lines**.
+
+---
+
+## Ordering rationale
+
+1. **Refactor 5 (ModuleGraph) first.** Mechanical, low-risk, unblocks the rest by making the parser pure. Existing acceptance tests pin behavior.
+2. **Refactor 3 (Expr collapse) next.** Doing this before tokenizing means the new parser only has to target one expression shape.
+3. **Refactor 4 (visitor-table validator).** With a simpler AST, this is straight refactoring against the golden corpus.
+4. **Refactor 2 (unify catch/recover).** Cheap win, drops ~400 lines.
+5. **Refactor 1 (tokenizer + RD parser) last.** Biggest change. Should sit on top of a cleaned-up AST and a pure pipeline so it can be staged behind a flag and run side-by-side with the old parser against the golden corpus.
+
+## Out of scope
+
+- **Parser generator.** The grammar is small and the line-oriented sensibility of the language (triple-quoted blocks, fence blocks, comments-on-their-own-line) maps cleanly to a hand-written tokenizer.
+- **Surface syntax changes.** None of these refactors are user-visible. The golden test corpus pins behavior.
+- **Runtime.** The bash emitter and `runtime/` stay put.
+
+---
+
+## Appendix — Secondary improvements (A–E)
+
+The five refactors above are the load-bearing changes. The five below are smaller in scope but each addresses a real structural issue that the top 5 do not fully solve on their own. Where a secondary item is coupled to a top-5 refactor, the ordering rationale below makes the dependency explicit.
+
+### A — Split source-fidelity data from the semantic AST (CST / trivia layer)
+
+**Touches:** `src/types.ts`, plus every parser/formatter/validator/emitter consumer.
+
+`WorkflowStepDef` and `jaiphModule` today carry roughly ten fields that exist *only* so the formatter can round-trip: `leadingComments`, `configLeadingComments`, `trailingTopLevelComments`, `configBodySequence`, `topLevelOrder`, `bareSource`, the `tripleQuoted` flags on `literal`/`return`/`log`/`fail`/`send`/`const`, `bodyKind`, `bodyIdentifier`. Every consumer that does *not* care about formatting (validator, emitter) has to either ignore them or thread them through unchanged.
+
+**Proposed:** introduce a parallel `Trivia` map (keyed by node id) or a separate CST layer that owns the source-fidelity data. The semantic AST stops carrying it; formatter reads from `Trivia` alongside the AST.
+
+**Why it is appendix-only:** it changes most of the AST consumers, but the change is mechanical once the boundary is drawn. Biggest payoff if scheduled **before** Refactor 3, so the `Expr` shape is decided after the source-fidelity fields have been pulled out and the semantic core is visible.
+
+### B — Diagnostics collector instead of fail-fast error reporting
+
+**Touches:** `src/parse/core.ts` (`fail`), `src/errors.ts` (`jaiphError`), every call site in `src/parse/` and `src/transpile/`.
+
+Today `fail()` and `jaiphError()` both throw on the first error. A user fixes one error, recompiles, fixes the next, recompiles, etc. This is also the reason for some defensive ordering inside the validator — it tries to surface the "most useful" error first because it knows it will only get to surface one.
+
+**Proposed:** introduce a `Diagnostics` collector. Parser and validator append errors instead of throwing; the compile run reports the full set at the end (sorted by file/line). A "fatal" tier still exists for cases where continuing would produce garbage.
+
+**Why it is appendix-only:** almost zero marginal cost if done as part of Refactor 4 (visitor-table validator), since the new visitor already needs a unified entry/exit per step. Doing it standalone is also fine but touches more files.
+
+### C — Single-pass workflow walk
+
+**Touches:** `src/transpile/validate.ts`.
+
+The validator walks each workflow's step tree at least three times before its main check loop runs: `collectKnownVars`, `collectPromptSchemas`, `validateImmutableBindings`. Each walks the same nested step structure (if/for_lines/catch/recover) with subtly different recursion rules. Bug-fixes to "what counts as a binding here" land in 2–3 walkers.
+
+**Proposed:** one visitor that accumulates `{knownVars, promptSchemas, bindings}` as it descends, and the main per-step validator runs after (or during) that single descent.
+
+**Why it is appendix-only:** falls out naturally inside Refactor 4. Doing it separately is a fine ~50-line refactor.
+
+### D — Collapse `bareIdentifierArgs` into a typed `Arg[]`
+
+**Touches:** `src/types.ts`, `src/parse/core.ts` (`parseCallRef`), validator and emitter.
+
+Today every call-bearing node carries both `args: string` (raw text) and `bareIdentifierArgs: string[]` (a re-parse of which arguments happened to be bare identifiers). The validator must remember to check `bareIdentifierArgs` exists at each call site. The emitter has to do its own re-parse of `args` because it doesn't trust either field alone.
+
+**Proposed:**
+
+```ts
+type Arg =
+  | { kind: "literal"; raw: string }
+  | { kind: "var";     name: string };
+
+// Calls carry args: Arg[]. No second field. No re-parsing downstream.
+```
+
+**Why it is appendix-only:** can be done inside Refactor 3 (it is part of the same "single AST shape per concept" story) or as a standalone task. Standalone is cleaner if Refactor 3 is otherwise too large.
+
+### E — Decouple the validator from the runtime
+
+**Touches:** `src/transpile/validate.ts` (the `import { tripleQuotedRawForRuntime } from "../runtime/orchestration-text"` at the top), `src/runtime/orchestration-text.ts`.
+
+The validator imports a runtime helper (`tripleQuotedRawForRuntime`) so it can compute "what the runtime will see" when reporting errors. That is a one-way dependency from compile-time on runtime semantics. The right direction is the opposite: the parser/validator decides the canonical string, and the runtime consumes that decision.
+
+**Proposed:** move the canonicalization into a parser-side helper (e.g. `src/parse/triple-quote.ts:canonicalizeTripleQuotedString`). The runtime imports *that* instead of the validator importing a runtime function.
+
+**Why it is appendix-only:** small surface (one helper, ~30 lines), but it removes a layering inversion that will keep biting if the runtime grows more such helpers.
+
+### Ordering with the top 5
+
+```
+1. Refactor 5  (ModuleGraph)
+2. A           (CST/trivia split)            ← before Refactor 3 to settle AST shape
+3. D           (typed Arg[])                 ← can fold into Refactor 3 if scoped slightly wider
+4. Refactor 3  (Expr collapse)
+5. C           (single-pass workflow walk)   ← prep for validator
+6. B           (Diagnostics collector)       ← prep for validator
+7. Refactor 4  (visitor-table validator)
+8. E           (decouple validator/runtime)
+9. Refactor 2  (unify catch/recover)
+10. Refactor 1 (tokenizer + RD parser)
+```
diff --git a/docs/_layouts/docs.html b/docs/_layouts/docs.html
index bb4f5fd2..51694220 100644
--- a/docs/_layouts/docs.html
+++ b/docs/_layouts/docs.html
@@ -43,23 +43,33 @@
         <div id="docs-nav-panel" class="docs-nav-panel" role="region" aria-labelledby="docs-nav-toggle" hidden>
             <ul class="docs-nav-list">
                 <li><a href="{{ '/' | relative_url }}">jaiph.org</a></li>
-                <li><a href="{{ '/getting-started' | relative_url }}"{% if page.permalink == '/getting-started' %} class="docs-nav-active" aria-current="page"{% endif %}>Getting started</a></li>
-                <li><a href="{{ '/setup' | relative_url }}"{% if page.permalink == '/setup' %} class="docs-nav-active" aria-current="page"{% endif %}>Setup</a></li>
-                <li><a href="{{ '/libraries' | relative_url }}"{% if page.permalink == '/libraries' %} class="docs-nav-active" aria-current="page"{% endif %}>Libraries</a></li>
-                <li><a href="{{ '/artifacts' | relative_url }}"{% if page.permalink == '/artifacts' %} class="docs-nav-active" aria-current="page"{% endif %}>Artifacts</a></li>
-                <li><a href="{{ '/language' | relative_url }}"{% if page.permalink == '/language' %} class="docs-nav-active" aria-current="page"{% endif %}>Language</a></li>
-                <li><a href="{{ '/grammar' | relative_url }}"{% if page.permalink == '/grammar' %} class="docs-nav-active" aria-current="page"{% endif %}>Grammar</a></li>
-                <li><a href="{{ '/cli' | relative_url }}"{% if page.permalink == '/cli' %} class="docs-nav-active" aria-current="page"{% endif %}>CLI</a></li>
-                <li><a href="{{ '/configuration' | relative_url }}"{% if page.permalink == '/configuration' %} class="docs-nav-active" aria-current="page"{% endif %}>Configuration</a></li>
-                <li><a href="{{ '/testing' | relative_url }}"{% if page.permalink == '/testing' %} class="docs-nav-active" aria-current="page"{% endif %}>Testing</a></li>
-                <li><a href="{{ '/spec-async-handles' | relative_url }}"{% if page.permalink == '/spec-async-handles' %} class="docs-nav-active" aria-current="page"{% endif %}>Async handles</a></li>
-                <li><a href="{{ '/inbox' | relative_url }}"{% if page.permalink == '/inbox' %} class="docs-nav-active" aria-current="page"{% endif %}>Inbox</a></li>
-                <li><a href="{{ '/hooks' | relative_url }}"{% if page.permalink == '/hooks' %} class="docs-nav-active" aria-current="page"{% endif %}>Hooks</a></li>
-                <li><a href="{{ '/sandboxing' | relative_url }}"{% if page.permalink == '/sandboxing' %} class="docs-nav-active" aria-current="page"{% endif %}>Sandboxing</a></li>
+                <li class="docs-nav-group">Tutorials</li>
+                <li><a href="{{ '/tutorials/first-workflow' | relative_url }}"{% if page.permalink == '/tutorials/first-workflow' %} class="docs-nav-active" aria-current="page"{% endif %}>Your first workflow</a></li>
+                <li><a href="{{ '/tutorials/first-agent-run' | relative_url }}"{% if page.permalink == '/tutorials/first-agent-run' %} class="docs-nav-active" aria-current="page"{% endif %}>Your first agent + sandboxed run</a></li>
+                <li class="docs-nav-group">How-to guides</li>
+                <li><a href="{{ '/how-to/install' | relative_url }}"{% if page.permalink == '/how-to/install' %} class="docs-nav-active" aria-current="page"{% endif %}>Install &amp; switch versions</a></li>
+                <li><a href="{{ '/how-to/sandbox-run' | relative_url }}"{% if page.permalink == '/how-to/sandbox-run' %} class="docs-nav-active" aria-current="page"{% endif %}>Run in a Docker sandbox</a></li>
+                <li><a href="{{ '/how-to/agent-auth' | relative_url }}"{% if page.permalink == '/how-to/agent-auth' %} class="docs-nav-active" aria-current="page"{% endif %}>Authenticate agent backends</a></li>
+                <li><a href="{{ '/how-to/configure-backend' | relative_url }}"{% if page.permalink == '/how-to/configure-backend' %} class="docs-nav-active" aria-current="page"{% endif %}>Configure backend &amp; model</a></li>
+                <li><a href="{{ '/how-to/hooks' | relative_url }}"{% if page.permalink == '/how-to/hooks' %} class="docs-nav-active" aria-current="page"{% endif %}>Add a hook</a></li>
+                <li><a href="{{ '/how-to/libraries' | relative_url }}"{% if page.permalink == '/how-to/libraries' %} class="docs-nav-active" aria-current="page"{% endif %}>Use &amp; publish a library</a></li>
+                <li><a href="{{ '/how-to/artifacts' | relative_url }}"{% if page.permalink == '/how-to/artifacts' %} class="docs-nav-active" aria-current="page"{% endif %}>Save artifacts</a></li>
+                <li><a href="{{ '/how-to/testing' | relative_url }}"{% if page.permalink == '/how-to/testing' %} class="docs-nav-active" aria-current="page"{% endif %}>Write &amp; run tests</a></li>
+                <li class="docs-nav-group">Reference</li>
+                <li><a href="{{ '/reference/cli' | relative_url }}"{% if page.permalink == '/reference/cli' %} class="docs-nav-active" aria-current="page"{% endif %}>CLI</a></li>
+                <li><a href="{{ '/reference/configuration' | relative_url }}"{% if page.permalink == '/reference/configuration' %} class="docs-nav-active" aria-current="page"{% endif %}>Configuration</a></li>
+                <li><a href="{{ '/reference/grammar' | relative_url }}"{% if page.permalink == '/reference/grammar' %} class="docs-nav-active" aria-current="page"{% endif %}>Grammar</a></li>
+                <li><a href="{{ '/reference/language' | relative_url }}"{% if page.permalink == '/reference/language' %} class="docs-nav-active" aria-current="page"{% endif %}>Language</a></li>
+                <li><a href="{{ '/reference/env-vars' | relative_url }}"{% if page.permalink == '/reference/env-vars' %} class="docs-nav-active" aria-current="page"{% endif %}>Environment variables</a></li>
+                <li class="docs-nav-group">Explanation</li>
                 <li><a href="{{ '/architecture' | relative_url }}"{% if page.permalink == '/architecture' %} class="docs-nav-active" aria-current="page"{% endif %}>Architecture</a></li>
+                <li><a href="{{ '/sandboxing' | relative_url }}"{% if page.permalink == '/sandboxing' %} class="docs-nav-active" aria-current="page"{% endif %}>Sandboxing</a></li>
+                <li><a href="{{ '/inbox' | relative_url }}"{% if page.permalink == '/inbox' %} class="docs-nav-active" aria-current="page"{% endif %}>Inbox &amp; Dispatch</a></li>
+                <li><a href="{{ '/spec-async-handles' | relative_url }}"{% if page.permalink == '/spec-async-handles' %} class="docs-nav-active" aria-current="page"{% endif %}>Async Handles</a></li>
+                <li><a href="{{ '/why-jaiph' | relative_url }}"{% if page.permalink == '/why-jaiph' %} class="docs-nav-active" aria-current="page"{% endif %}>Why Jaiph</a></li>
+                <li class="docs-nav-group">Contributing</li>
                 <li><a href="{{ '/contributing' | relative_url }}"{% if page.permalink == '/contributing' %} class="docs-nav-active" aria-current="page"{% endif %}>Contributing</a></li>
-                <li><a href="https://raw.githubusercontent.com/jaiphlang/jaiph/refs/heads/main/docs/jaiph-skill.md"
-                        target="_blank" rel="noopener noreferrer">Agent Skill</a></li>
+                <li><a href="{{ '/jaiph-skill' | relative_url }}"{% if page.permalink == '/jaiph-skill' %} class="docs-nav-active" aria-current="page"{% endif %}>Agent Skill</a></li>
             </ul>
         </div>
     </nav>
diff --git a/docs/agent-auth.md b/docs/agent-auth.md
new file mode 100644
index 00000000..166afece
--- /dev/null
+++ b/docs/agent-auth.md
@@ -0,0 +1,90 @@
+---
+title: Authenticate agent backends
+permalink: /how-to/agent-auth
+diataxis: how-to
+---
+
+# Authenticate agent backends
+
+This recipe sets the credentials each agent backend needs so the CLI's credential pre-flight passes and `prompt` steps reach the model.
+
+`jaiph run` runs a host-side **credential pre-flight** before it spawns the runner or the Docker container. The pre-flight is keyed to the backend(s) declared in the entry file. Missing credentials produce `E_AGENT_CREDENTIALS` (hard abort) or a `jaiph: warning:` (host-only, for `claude` and `cursor` — see the table below). Hard failures exit before any runner or container is launched. The behavior is implemented in `src/cli/run/preflight-credentials.ts`.
+
+## Prerequisites
+
+- The entry `.jh` file declares a backend (`agent.backend = "claude" | "cursor" | "codex"`) at module or workflow scope, or uses a `prompt` step that consumes the default backend.
+
+## Pick the backend's credential
+
+| Backend | Required credentials | Host run (no Docker) | Docker run (any mode incl. `inplace`) |
+|---|---|---|---|
+| `claude` | `ANTHROPIC_API_KEY` **or** `CLAUDE_CODE_OAUTH_TOKEN` | warn only (a stored Claude CLI login may still work) | hard error `E_AGENT_CREDENTIALS` |
+| `cursor` | `CURSOR_API_KEY` | warn only (a stored `cursor-agent login` may still work) | hard error `E_AGENT_CREDENTIALS` |
+| `codex`  | `OPENAI_API_KEY` | hard error `E_AGENT_CREDENTIALS` (no CLI-login fallback) | hard error `E_AGENT_CREDENTIALS` — `OPENAI_*` is **not** on the Docker env allowlist, so a host-only key is treated as missing |
+
+Under Docker sandboxing the host-side stored logins (Keychain entries, `~/.claude`, `cursor-agent login`) do **not** cross the container boundary. Only allowlisted host env vars are forwarded (`JAIPH_*`, `ANTHROPIC_*`, `CLAUDE_*`, `CURSOR_*`; see [Sandboxing](sandboxing.md#what-docker-protects-against)). Set credentials on the **host** so the allowlist can forward them into the container.
+
+## 1. Authenticate Claude
+
+Either set the API key directly:
+
+```bash
+export ANTHROPIC_API_KEY="sk-ant-..."
+```
+
+Or obtain a long-lived OAuth token through the Claude CLI:
+
+```bash
+claude setup-token
+export CLAUDE_CODE_OAUTH_TOKEN="..."
+```
+
+On host runs (no Docker), a stored `~/.claude` / macOS Keychain login from a previous interactive `claude` session also works — but in that case the pre-flight emits a warning rather than failing.
+
+## 2. Authenticate Cursor
+
+```bash
+export CURSOR_API_KEY="..."
+```
+
+For host runs only, an interactive `cursor-agent login` (stored on disk) also satisfies the runtime — but the pre-flight emits a warning unless the env var is set.
+
+## 3. Authenticate Codex (OpenAI)
+
+```bash
+export OPENAI_API_KEY="sk-..."
+```
+
+`OPENAI_API_KEY` is required on **both** host and Docker runs. The `codex` backend has no CLI-login fallback — there is no warning path.
+
+Under Docker, `OPENAI_*` is outside the forwarding allowlist, so preflight treats a host-only `OPENAI_API_KEY` as missing even when you export it. Codex workflows need `jaiph run --unsafe` (host execution) or a different backend inside the sandbox.
+
+To target an OpenAI-compatible endpoint instead of the default, set `JAIPH_CODEX_API_URL` to the chat-completions URL (`JAIPH_*` is forwarded under Docker).
+
+## 4. Run the pre-flight
+
+```bash
+jaiph run ./flow.jh
+```
+
+The pre-flight runs before the banner. Hard failures print a stderr message naming the backend, the model (when `agent.default_model` is set), the entry `.jh` file, the config scope that picked the backend (`module config`, `workflow <name>`, `JAIPH_AGENT_BACKEND env`, or `default`), and the concrete remedy. The error code is `E_AGENT_CREDENTIALS`. Host-only warnings for `claude` and `cursor` use the same header fields with a `jaiph: warning:` prefix.
+
+## Skip the pre-flight (escape hatch)
+
+`JAIPH_UNSAFE=true` (or `jaiph run --unsafe`) skips the pre-flight entirely — the host is in charge, a stored CLI login may work, and the runtime's per-backend guards remain as a backstop. The pre-flight is also skipped when the entry file neither declares an explicit backend nor uses any `prompt` step (nothing would credential against).
+
+## Verification
+
+When every required credential is present, preflight is silent — no stderr before the banner. On host runs, missing `claude` or `cursor` env vars emit `jaiph: warning:` lines and the run still proceeds (a stored CLI login may satisfy the runtime). A hard failure prints:
+
+```
+E_AGENT_CREDENTIALS: agent.backend "claude" selected by module config in /path/to/flow.jh — neither ANTHROPIC_API_KEY nor CLAUDE_CODE_OAUTH_TOKEN is set. Run `claude setup-token` and export CLAUDE_CODE_OAUTH_TOKEN, or set ANTHROPIC_API_KEY.
+```
+
+Under Docker the message includes the suffix `(Docker is on — set the env var on the host so it is forwarded into the container.)`.
+
+## Related
+
+- [Run a workflow in a Docker sandbox](/how-to/sandbox-run) — how host env vars cross the container boundary.
+- [Configure backend/model](/how-to/configure-backend) — picking which backend a workflow uses.
+- [Sandboxing — What Docker protects against](sandboxing.md#what-docker-protects-against) — env allowlist and what crosses the container boundary.
diff --git a/docs/architecture.md b/docs/architecture.md
index 55e9ff50..6dc87d33 100644
--- a/docs/architecture.md
+++ b/docs/architecture.md
@@ -1,8 +1,12 @@
 ---
 title: Architecture
 permalink: /architecture
+diataxis: explanation
 redirect_from:
   - /architecture.md
+  - /spec-async-isolated
+  - /target-design
+  - /reporting
 ---
 
 # Architecture
@@ -19,42 +23,62 @@ For **how to contribute** — branches, test layers, E2E assertion policy, and b
 
 Workflow authors write `.jh` / `.test.jh` modules. The toolchain turns those files into **validated** modules plus **extracted script files**, then the **same AST interpreter** runs workflows whether you use local `jaiph run`, Docker, or `jaiph test`.
 
-1. Parse source into AST (the CLI parses once up front for `jaiph run` metadata such as `runtime` config; `buildRuntimeGraph` and transpilation use the same parser on disk contents).
-2. **Compile-time** validation (`validateReferences`, invoked from **`emitScriptsForModule`** / **`buildScripts()`**) runs before script extraction, not inside `buildRuntimeGraph()` (the graph loader only parses modules and follows imports). The **`jaiph compile`** command walks the same import closure but runs **`validateReferences` only**: it parses each reachable module on disk and **does not** emit **`scripts/`** (no **`buildScriptFiles`** / **`buildScripts`**), **does not** invoke **`buildRuntimeGraph()`**, and never spawns the workflow runner (`src/cli/commands/compile.ts`). For a **directory** argument it discovers `*.jh` via `walkjhFiles`, which **skips** `*.test.jh`; to validate a test module, pass that file explicitly. Imported modules in the closure are still validated recursively either way.
-3. **CLI** (`dist/src/cli.js` via npm, or a **Bun-compiled** `dist/jaiph` binary) prepares script executables (scripts-only), then spawns a **detached child** that loads **`node-workflow-runner.js`**. That child calls `buildRuntimeGraph()` and runs **`NodeWorkflowRuntime`**. The child’s interpreter is **`process.execPath`** of the CLI process (Node when you run `node dist/src/cli.js`, the standalone Bun binary when you run `dist/jaiph`). Script steps execute as managed subprocesses; prompt, inbox I/O, and event/summary emission are handled by the kernel under `src/runtime/kernel/`.
+1. Parse source into AST. Every CLI path walks the entry plus its transitive `.jh` import closure **once** through **`loadModuleGraph`** (`src/transpile/module-graph.ts`) and reuses that **`ModuleGraph`** for the banner (`metadataToConfig`), validation (**`validateModule`** inside **`emitScriptsForModuleFromGraph`**, invoked by **`buildScriptsFromGraph`**), script-body extraction, and — across the parent → child process boundary on the default local `jaiph run` — for **`buildRuntimeGraph(graph)`** in the spawned runner (see [Local module graph](#local-module-graph) and the sequence diagram below). `parsejaiph(source, filePath)` is I/O-pure; validation and script emit operate entirely on the in-memory graph and never re-read `.jh` files. The only fs entry point that reads `.jh` sources is `loadModuleGraph`.
+2. **Compile-time** validation runs before script extraction. The validator consumes the in-memory graph; imported ASTs are looked up by absolute path and never re-read from disk. Three validation entry points share the same per-module walk via **`validateModuleInto`**: **`validateModule(ast, graph)`** is the per-module throwing form (used by **`emitScriptsForModuleFromGraph`** / **`buildScriptsFromGraph()`** so the existing single-error path stays intact), **`validateReferences(graph)`** validates every reachable module then throws the first sorted error, and **`collectDiagnostics(graph)`** returns a populated `Diagnostics` collector (`src/diagnostics.ts`) with **every** recoverable error from every reachable module. The **`jaiph compile`** command walks the same import closure but routes through `collectDiagnostics`: it builds a graph per entry, collects diagnostics, prints them all (sorted by file/line/col, in `path:line:col CODE message` form on stderr — or as a single JSON array on stdout with `--json`), and exits non-zero if any diagnostic was collected. It **does not** emit **`scripts/`**, **does not** invoke **`buildRuntimeGraph()`**, and never spawns the workflow runner (`src/cli/commands/compile.ts`). For a **directory** argument it discovers `*.jh` via `walkjhFiles`, which **skips** `*.test.jh`; to validate a test module, pass that file explicitly. Imported modules in the closure are still validated recursively either way.
+3. **CLI** (`dist/src/cli.js` via npm, or a **Bun-compiled** `dist/jaiph` binary) prepares script executables (scripts-only), then spawns a **detached child** through the internal **`__workflow-runner`** argv marker (**`spawnJaiphWorkflowProcess`** in `src/runtime/kernel/workflow-launch.ts`). The child entrypoint is **`runWorkflowRunner`** (`src/runtime/kernel/node-workflow-runner.ts`), which loads or deserializes the module graph, calls **`buildRuntimeGraph()`**, then runs **`NodeWorkflowRuntime`**. Under Node the spawn is **`process.execPath`** + **`dist/src/cli.js`** + **`__workflow-runner`**; under the Bun standalone binary, **`process.execPath`** is the **`jaiph`** binary itself with the same marker. Script steps execute as managed subprocesses; prompt, inbox I/O, and event/summary emission are handled by the kernel under `src/runtime/kernel/`.
 4. Stream live events to the CLI and persist durable run artifacts.
 
-Interactive **`jaiph run`** parses **`__JAIPH_EVENT__`** lines from the runner’s stderr, renders the progress tree, and runs hooks. **`jaiph run --raw`** skips that shell: the child uses inherited stdio so events still land on stderr unchanged — used when embedding Jaiph or when the host wraps a container (see [CLI — `jaiph run`](cli.md#jaiph-run) and [Sandboxing — Docker container isolation](sandboxing.md#docker-container-isolation)).
+Interactive **`jaiph run`** parses **`__JAIPH_EVENT__`** lines from the runner’s stderr, renders the progress tree, and runs hooks. **`jaiph run --raw`** skips that shell: the child uses inherited stdio so events still land on stderr unchanged — used when embedding Jaiph or when the host wraps a container (see [CLI — `jaiph run`](cli.md#jaiph-run) and [Sandboxing](sandboxing.md)).
 
-All orchestration — local `jaiph run`, `jaiph test`, and **Docker `jaiph run`** — uses the **Node workflow runtime** (AST interpreter). Docker containers run the same `node-workflow-runner` process with the compiled JS source tree and scripts mounted read-only.
+All orchestration — local `jaiph run`, `jaiph test`, and **Docker `jaiph run`** — uses the **Node workflow runtime** (AST interpreter). Docker containers run the same **`jaiph run --raw`** / **`__workflow-runner`** dispatch with the compiled JS source tree and scripts mounted read-only.
 
 ## Core components
 
 - **CLI (`src/cli`, invoked via compiled `src/cli.ts` → `dist/src/cli.js`)**
   - Entry point (`run`, `test`, `compile`, `init`, `install`, `use`, `format`). Paths ending in `.jh` / `.test.jh` are also accepted as implicit commands (see `src/cli/index.ts`).
-  - **Workflow launch** is owned in TypeScript (`src/runtime/kernel/workflow-launch.ts` + `src/cli/run/lifecycle.ts`): spawns **`node-workflow-runner.js`** with `process.execPath`, which calls `buildRuntimeGraph()` then `NodeWorkflowRuntime`. The **`jaiph run`** path always launches the **`default`** workflow via argv wired in `workflow-launch.ts` (`node-workflow-runner` calls `runDefault`). `setupRunSignalHandlers` accepts an optional `onSignalCleanup` callback for Docker sandbox teardown on SIGINT/SIGTERM.
+  - **Workflow launch** is owned in TypeScript (`src/runtime/kernel/workflow-launch.ts` + `src/cli/run/lifecycle.ts`): spawns the runner via **`process.execPath`** and the **`__workflow-runner`** argv marker. **`runWorkflowRunner`** (`src/runtime/kernel/node-workflow-runner.ts`) handles that argv, loads or reads the module graph, calls **`buildRuntimeGraph()`**, then **`NodeWorkflowRuntime.runDefault()`**. The **`default`** workflow name is wired in **`buildRunModuleLaunch`** (`workflow-launch.ts`). `setupRunSignalHandlers` accepts an optional `onSignalCleanup` callback for Docker sandbox teardown on SIGINT/SIGTERM.
   - Parses runtime events and renders progress (except `--raw`); dispatches hooks.
 
 - **Parser (`src/parser.ts`, `src/parse/*`)**
-  - Converts `.jh`/`.test.jh` into `jaiphModule` AST.
-  - Reusable primitives: `parseFencedBlock()` (`src/parse/fence.ts`) handles triple-backtick fenced bodies with optional lang tokens for scripts and inline scripts. `parseTripleQuoteBlock()` (`src/parse/triple-quote.ts`) handles `"""..."""` blocks for prompts, `const`, `log`, `logerr`, `fail`, `return`, and `send` — all positions where multiline strings appear.
+  - Converts `.jh`/`.test.jh` into a **semantic AST** (`jaiphModule`) plus a parallel **`Trivia`** store of source-fidelity data. `parsejaiphWithTrivia(source, filePath)` returns `{ ast, trivia }`; the legacy `parsejaiph(source, filePath)` is a thin wrapper that returns only the `ast` for consumers that don't need round-trip data. Both entry points are I/O-pure.
+  - Reusable primitives: `parseFencedBlock()` (`src/parse/fence.ts`) handles triple-backtick fenced bodies with optional lang tokens for scripts and inline scripts. `parseTripleQuoteBlock()` (`src/parse/triple-quote.ts`) handles `"""..."""` blocks for prompts, `const`, `log`, `logerr`, `fail`, `return`, and `send` — all positions where multiline strings appear. `canonicalizeTripleQuotedString()` (same file) reproduces the dedent + escape decoding that match-arm bodies still need (they carry an unprocessed `tripleQuoteBodyToRaw`-shaped string plus a `tripleQuotedBody` flag rather than being dedented at parse time); both the validator and the runtime call it, so "what the validator inspects" and "what the runtime executes" are bit-for-bit identical.
+  - **Unified `run` / `ensure` host parsing.** `run ref(...)`, `run async ref(...)`, and `ensure ref(...)`, optionally followed by `catch (binding) { ... }` (any host) or `recover(binding) { ... }` (`run` only), are parsed by a single helper `parseRunOrEnsure` in `src/parse/workflow-brace.ts`. The attached `catch` / `recover` clause — bindings, body shape (multi-line `{ … }`, inline `{ stmt[; stmt]* }`, or single-statement) — is parsed by **one** helper `parseAttachedBlock(filePath, lines, idx, …, keyword, textAfterKeyword, trivia)` in `src/parse/steps.ts`. There is no separate mini parser for catch/recover bodies: `parseAttachedBlock` delegates each body statement to the **same** `parseBlockStatement` (`src/parse/workflow-brace.ts`) that handles top-level statements, so every statement form accepted in a workflow / rule body is accepted identically inside a `catch` / `recover` body. "Is this statement allowed inside a catch/recover body?" is a validator concern (the `RULE_SCOPE` / `WORKFLOW_SCOPE` distinction in `validate-step.ts`), not enforced by which mini-parser branches happened to fire. `src/parse/steps.ts` is bounded at **≤200 lines** by `src/parse/parse-attached-block.test.ts`, which also asserts no function named `parse(Run)?(Catch|Recover|EnsureStep)` reappears.
+  - **Keyword dispatch table.** Inside `parseBlockStatement` (`src/parse/workflow-brace.ts`), every workflow / rule body line that does not begin with `#` is routed by a single `STATEMENT: Record<string, BlockHandler>` table keyed by the leading identifier — there is no longer a `startsWith` cascade where `"run async "` must be tested before `"run "` and `"prompt "` must be tested before a bare assignment. The dispatcher tokenizes the first identifier on the trimmed line, looks it up once, and invokes the matching handler (`tryParseIf` / `tryParseFor` / `tryParseConst` / `tryParseFail` / `tryParseWait` / `tryParseEnsure` / `tryParseRun` / `tryParsePrompt` / `tryParseLog` / `tryParseLogerr` / `tryParseReturn` / `tryParseStandaloneMatch`), which either returns a `{ step, nextIdx }` result, returns `null` to fall through, or calls `fail(...)` to abort. Two non-keyword fallbacks fire after the table lookup in order: `trySend` (matches `channel <- rhs` via `matchSendOperator`) then `shellFallthrough` (everything else becomes a shell `exec` step). Assignment-shape error guards (`name = prompt …`, `name = run …` without `const`, plus the `forRule` rejection of `prompt`) run once before dispatch in `applyAssignmentGuards(c)`. The per-line context (`filePath`, `lines`, `idx`, `innerRaw`, `inner`, `innerNo`, `trivia`, `forRule`, `opts`) is threaded through handlers as a single `BlockCtx` record. **Adding a new top-level keyword is a two-file change:** one row in `STATEMENT` (`workflow-brace.ts`) plus one entry in the `JAIPH_KEYWORDS` reserved set (`core.ts`) — pinned by `src/parse/parse-synthetic-keyword.test.ts`, which patches `STATEMENT` at runtime with a synthetic `zzznoop` handler, asserts dispatch fires, asserts the same input falls through to the shell handler when the row is removed, and greps both source files to confirm each symbol lives in exactly one place. Every existing parse-error message, line, and column is preserved bit-for-bit: `src/parse/parse-error-snapshot.test.ts` walks every `=== name` block in `test-fixtures/compiler-txtar/parse-errors.txt`, captures `{ file, line, col, code, message }` for each, and diffs against the snapshot stored at `test-fixtures/compiler-txtar/parse-errors-snapshot.json` (refreshable with `UPDATE_SNAPSHOTS=1` only after confirming the change is intentional). The wider tokenizer rewrite — the ad-hoc `inDoubleQuote` / `inTripleQuote` / `braceDepth` scanners replicated across `src/parse/`, the line-walking `{ step, nextIdx }` contract, and the per-handler regex bodies — is **not** part of this refactor and remains future work.
 
 - **AST / Types (`src/types.ts`)**
-  - Shared compile-time schema (`jaiphModule`, step defs, test defs, hook payload types).
+  - Shared compile-time schema (`jaiphModule`, step defs, test defs, hook payload types). The semantic AST carries **only** what the validator, emitter, transpiler, and runtime need; surface-form data that exists purely to round-trip the formatter (leading comments on imports / channels / `const` / `test` blocks, top-level emit order, `config` body sequence, `"""..."""` flags on `literal` / `return` / `log` / `logerr` / `fail` / `send` / `const`, the `bareSource` of `return <ident>`, and prompt / script `bodyKind` discriminators) lives in **`Trivia`** instead — see [Trivia (CST layer)](#trivia-cst-layer).
+  - **One `Expr` for every value position.** Anywhere a value can appear — `const name = …`, `return …`, `send channel <- …`, `log` / `logerr` / `fail` arguments, and the body of an `exec` statement — the AST stores a single tagged union: `Expr = literal | call | ensure_call | inline_script | prompt | match | shell | bare_ref`. There is **no longer** a separate `ConstRhs` union, `SendRhsDef` union, or `managed:` sidecar on `return` / `log` / `logerr` (the placeholder strings `"__match__"` / `"run inline_script"` / `"__JAIPH_MANAGED__"` are gone too — a meta-test in `src/types-shape.test.ts` fails if any reappear under `src/`). The eight `Expr` kinds: `literal` (verbatim source text — quoted string, `$var` / `${var}` form, or post-dedent triple-quoted body), `call` (managed workflow/script call; `async: true` for `run async ref(...)` capture position), `ensure_call` (managed rule call), `inline_script` (`` `body`(args) `` or fenced), `prompt` (carries the JSON-quoted body and optional flat `returns` schema), `match` (a `match <subject> { ... }` evaluated for its value), `shell` (raw shell fragment used as a managed substitution on the send RHS), and `bare_ref` (bare symbol on a send RHS — always rejected by the validator, preserved so the error message can name the symbol).
+  - **Eight `WorkflowStepDef` variants** (down from fourteen): `exec` (side-effecting managed call statement — was `run` / `ensure` / `run_inline_script` / `prompt` / standalone `match` / inline `shell`; the discriminator now lives inside `body.kind`, with `captureName` / `catch` / `recover` as step-level attributes); `const`, `return`, `send` (bind, propagate, or emit an `Expr`); `say` (was `log` / `logerr` / `fail` — `level: "fail"` aborts the workflow with the message, otherwise the message is written to the corresponding stream); `if` / `for_lines` (control flow, unchanged shape); `trivia` (formatter-only `comment` / `blank_line` slots — skipped by the runtime and validator). A type-level exhaustive `switch` in `src/types-shape.test.ts` pins both the step count at **8** and the `Expr` kind count at **8**.
+  - **Call arguments are a typed sum.** Every call-bearing `Expr` (`call`, `ensure_call`, `inline_script`) carries `args?: Arg[]` where `Arg = { kind: "literal"; raw: string } | { kind: "var"; name: string }`. The parser classifies each argument once (a bare in-scope-style identifier becomes `var`; everything else — quoted strings, `${…}` interpolations, nested `run …` / `ensure …` calls, inline-script bodies — is stored verbatim as `literal`). There is no separate `args: string` text payload or shadow `bareIdentifierArgs: string[]` field, and no downstream consumer re-parses call arguments: the validator walks the typed list to enforce arity, reject nested unmanaged calls inside literals, and resolve `var` refs against in-scope bindings; the emitter renders by mapping each `Arg` to its source form; the runtime turns `Arg[]` back into a runtime string via `argsToRuntimeString` (`var` → `${name}`, `literal` → raw) so the existing handle-resolution / interpolation path is unchanged.
 
-- **Validator (`src/transpile/validate.ts`)**
+- **Trivia / CST layer (`src/parse/trivia.ts`)**
+  {: #trivia-cst-layer}
+  - `Trivia` is a parallel store keyed by AST-node identity (per-node via `WeakMap`) and a small `ModuleTrivia` record for module-level data. The parser builds it alongside the AST; **only the formatter reads it**. Validator, emitter, transpiler, and runtime never import from `src/parse/trivia.ts` — a grep test (`src/parse/trivia-grep.test.ts`) pins this invariant by rejecting any reference to `Trivia` / `createTrivia` / `NodeTrivia` / `ModuleTrivia` from validator and emitter source files.
+  - A separate type-shape test (`src/parse/trivia-ast-shape.test.ts`) asserts at compile time that none of the formatter-only fields reappear on `jaiphModule`, `ImportDef`, `ScriptImportDef`, `ChannelDef`, `TestBlockDef`, `WorkflowMetadata`, `ScriptDef`, or any `WorkflowStepDef` / `Expr` variant. (`ConstRhs` / `SendRhsDef` no longer exist — their fields live inside `Expr` — and `src/types-shape.test.ts` fails if those symbols reappear as exports of `src/types.ts`.)
+
+- **Validator (`src/transpile/validate.ts` + `src/transpile/validate-step.ts`)**
   - Resolves imports and symbol references; emits deterministic compile-time errors. Import resolution (`resolveImportPath` in `transpile/resolve.ts`) checks relative paths first, then falls back to project-scoped libraries under `<workspace>/.jaiph/libs/` — the workspace root is threaded through all compilation call sites. Export visibility is enforced by `validateRef` in `validate-ref-resolution.ts`: if an imported module declares any `export`, only exported names are reachable through the import alias.
+  - **Two-file split.** `validate.ts` owns the **outer** layer: import / channel-route / test-block checks plus `walkStepTree` (the single descent that builds `{ knownVars, promptSchemas, flat }` for each workflow / rule). `validate-step.ts` owns the **per-step** visitor: one row per `WorkflowStepDef.type` in a `VALIDATORS: Record<StepType, StepValidator>` table, a single `validateExpr` dispatcher over the 8 `Expr.kind` values, and the call-shape / channel / string-content helpers. `validate.ts` is bounded at **≤700 lines** (currently ~450) by a CI-style test in `src/transpile/validate-visitor.test.ts`; new validators belong in `validate-step.ts`.
+  - **Visitor table + scope.** Per-step validation has one entry point — `validateStep(step, ctx)` in `validate-step.ts`. It looks the step's `type` up in `VALIDATORS` (the dispatch table), then consults `ctx.scope.allowSteps` (a `Set<StepType>`) once to decide whether this step is permitted in the current scope. Two scopes exist: `WORKFLOW_SCOPE` (allows every step variant including `send` and `prompt`) and `RULE_SCOPE` (rejects `send` outright; rejects `prompt` and `run async` from inside `exec` bodies). The scope also carries `runRefExpect` (`RUN_TARGET_REF_EXPECT` for workflows, `RUN_IN_RULE_REF_EXPECT` for rules) and `withPromptSchemas` (workflows collect prompt-returning bindings; rules skip schema collection). Adding a new step type requires exactly one row in `VALIDATORS` and, if the rule/workflow split needs to differ, an entry in `Scope.allowSteps` — an `AC4` test in `validate-visitor.test.ts` injects a synthetic step type and asserts it produces exactly one diagnostic with the documented `internal: no validator for step type "…"` message until the row is added.
+  - **Single managed-call-shape helper.** Every `call` / `ensure_call` site runs the same five checks against the typed `Arg[]` directly — shell-redirection rejection (only `literal` args are scanned), nested-unmanaged-call rejection inside `literal` raws, ref resolution (with the scope's `runRefExpect` for `call`, `RULE_REF_EXPECT` for `ensure_call`), arity (`args.length` vs declared params), and `var`-arg resolution against in-scope bindings via `validateArgVarRefs`. The sequence lives once in `validateCallable(expr, ctx)`; both `run` and `ensure` validators invoke it with a different ref expectation / target kind. There is no longer a separate `validateBareIdentifierArgs` helper, no per-site repetition of the five-step sequence, and no place re-parses an `args: string` payload by splitting on commas or rescanning quotes.
+  - **Diagnostics collector (recoverable errors).** The validator no longer fails fast on the first user-level error. Every recoverable check appends to a `Diagnostics` collector (`src/diagnostics.ts`) via `diag.error(file, line, col, code, msg)`, which records a `JaiphDiagnostic` and short-circuits the current validation unit through a `BailoutError`. Each top-level unit (per-import block, per-rule walk, per-rule step, per-workflow walk, per-workflow step, per-test-block step, per-channel route) is wrapped in `diag.capture(fn)`, which absorbs the bailout (and any thrown `jaiphError` from leaf helpers like `validate-ref-resolution.ts` / `validate-string.ts` / `validate-prompt-schema.ts` / `shell-jaiph-guard.ts`) so the next sibling unit still runs. `collectDiagnostics(graph)` walks every module and returns the populated collector; the legacy **`validateReferences(graph)`** is now a thin wrapper that throws the first sorted diagnostic via **`jaiphError`** so graph-level callers and existing per-error tests keep working; **`emitScriptsForModuleFromGraph`** still calls **`validateModule(ast, graph)`** per module before emit. `Diagnostics.sorted()` returns errors ordered by `(file, line, col)`; `formatLines()` renders the standard `path:line:col CODE message` shape. A grep test (`src/transpile/diagnostics-collector.test.ts`) pins the migration: `validate.ts` + `validate-step.ts` hold **zero** `throw jaiphError(` sites, and the remaining `throw jaiphError(` call sites under `src/` are confined to a documented allowlist — fatal aborts in the parser (`src/parse/core.ts`), the loader (`src/transpile/module-graph.ts`), and the test-file shape check (`src/cli/commands/test.ts`); the legacy bridge in `src/diagnostics.ts`; and the four leaf validation helpers above, each of which has every caller wrapped in `diag.capture(...)`.
+  - The validator drives off `WorkflowStepDef.type` (8 variants) and `Expr.kind` (8 variants). For every value-bearing step (`const` / `return` / `send` / `say`) and for the body of every `exec` step, a single `validateExpr(expr, ...)` dispatcher handles the value: it routes `call` / `ensure_call` / `inline_script` to call-site validation (`validateCallable`), walks `match` arms, schema-checks `prompt`, and runs the substitution scanner on `literal` raws. There is no dual code path for "managed sidecar vs literal value" — that branch is gone.
+  - **No compile-time → runtime imports.** Nothing under `src/transpile/` may `import … from "…/runtime/…"`. Compile-time code must not depend on runtime semantics: when the validator needs the same canonical form the runtime will see (the dedented, escape-decoded view of a triple-quoted match-arm body), both sides import a parser-side helper (`canonicalizeTripleQuotedString` in `src/parse/triple-quote.ts`) rather than reaching across the layer. A grep test (`src/transpile/no-runtime-imports.test.ts`) scans every non-test `*.ts` under `src/transpile/` and fails if any `from "…/runtime/…"` import appears; a separate corpus test (`src/parse/canonicalize-triple-quoted.test.ts`) parses every `.jh` under `test-fixtures/` and `examples/`, collects every triple-quoted match-arm body, and asserts `canonicalizeTripleQuotedString` matches the pre-move `tripleQuotedRawForRuntime` output bit-for-bit.
+  - **Single workflow walk.** Each workflow / rule has its step tree descended exactly once by `walkStepTree` (in `validate.ts`), which simultaneously accumulates `knownVars` (env decls + params + every nested `const` / capture / `for_lines` iterator), `promptSchemas` (top-level prompt-returning bindings, gated by `options.withPromptSchemas` so rules skip schema collection), enforces immutable-binding / `script`-collision rules inline (mutating a shared `bindings` map and threading a fresh inner map under each `for_lines` so loop iterators only shadow inside the body), and emits a flat `FlatStepEntry[]` of every step in tree order with the enclosing `catch` / `recover` failure binding attached. The main per-step validator loop iterates that flat list non-recursively and calls `validateStep` once per entry, so `walkStepTree`'s internal `descend` is the **only** recursive helper in `validate.ts` that takes a `WorkflowStepDef[]`. A pair of grep / AST tests (`src/transpile/validate-single-walk.test.ts`) pins both invariants: the prior helpers (`collectKnownVars`, `collectPromptSchemas`, `validateImmutableBindings`) cannot reappear by name, and at most one recursive `WorkflowStepDef[]` walker may live in `validate.ts`.
 
 - **Transpiler (`src/transpiler.ts`, `src/transpile/*`)**
-  - **`emitScriptsForModule`** parses, runs **`validateReferences`**, and **`buildScriptFiles`** — the only compile path for `jaiph run` / `jaiph test` — **persists only atomic `script` files** under `scripts/`. **`buildScripts()`** can also take a **directory** of non-test `*.jh` modules (`src/transpile/build.ts` uses `walkjhFiles`); the **`jaiph run`** and **`jaiph test`** commands always pass a **single entry file** (`.jh` or `*.test.jh`). Inline scripts (`` run `body`(args) ``) are also emitted as `scripts/__inline_<hash>` with deterministic hash-based names (`inlineScriptName` in `src/inline-script-name.ts`). There is no workflow-level bash emission.
+  - **`emitScriptsForModuleFromGraph`** validates one module against the graph and runs **`buildScriptFiles`** — the only compile path for `jaiph run` / `jaiph test` — **persists only atomic `script` files** under `scripts/`. **`buildScripts(input, outDir, ws?)`** is the path-based wrapper used by tests and the directory walk; it loads a `ModuleGraph` and delegates. **`buildScriptsFromGraph(graph, outDir)`** is the graph-based entry point used by `jaiph run` / `jaiph test`, which already loaded the graph. Inline scripts (`` run `body`(args) ``) are also emitted as `scripts/__inline_<hash>` with deterministic hash-based names (`inlineScriptName` in `src/inline-script-name.ts`). There is no workflow-level bash emission.
+  - The pipeline contract is **`loadModuleGraph` → `buildScriptsFromGraph(graph, outDir)`**, which runs **`validateModule`** + **`buildScriptFiles`** per reachable module via **`emitScriptsForModuleFromGraph`**. `parsejaiph` is I/O-pure; validation and script emit never re-read `.jh` sources during graph work. Each reachable module is parsed exactly once per `jaiph run` (see [Local module graph](#local-module-graph)).
 
 - **Node Workflow Runtime (`src/runtime/kernel/node-workflow-runtime.ts`)**
   - `NodeWorkflowRuntime` interprets the AST directly: walks workflow steps, manages scope/variables, delegates prompt and script execution to kernel helpers, handles channels/inbox/dispatch, owns the frame stack and heartbeat, and writes run artifacts.
+  - One private `evaluateExpr(scope, expr, …)` dispatcher handles every value position — `const` / `return` / `send` / `say` step handlers and the body of every `exec` step delegate to it. It switches on `Expr.kind` to run the managed call (`call` / `ensure_call` / `inline_script`) or `prompt`, walks a `match` expression, or interpolates a `literal` value through `interpolateWithCaptures`. There is no fan-out across "managed sidecar vs literal value" because that branch is gone from the AST.
+  - **Prompt transport-failure retry.** `runPromptStep` wraps each `executePrompt` invocation in a retry loop driven by the schedule resolved through `src/runtime/kernel/prompt-retry.ts` (default `15s → 1m → 10m → 30m → 2h`, six total attempts; configurable via `JAIPH_PROMPT_RETRY` / `JAIPH_PROMPT_RETRY_DELAYS`). Only the transport path (non-zero exit from the backend) is retried; invalid JSON and schema-validation failures return `{ ok: false }` on the first attempt. Each attempt emits its own `PROMPT_START` / `PROMPT_END` and `STEP_START` / `STEP_END`; each failure (and the final termination) logs a `LOGERR` through `RuntimeEventEmitter.emitLog`. The backoff sleep is injectable (`sleep` constructor option) and interruptible via `runtime.abort()` / an internal `AbortController` so SIGINT and in-process aborts halt the loop without further backend calls. Retry composes **below** `recover` / `catch` — backoff is exhausted before the failure reaches the recover loop. See [Configuration — Prompt retry on transport failure](configuration.md#prompt-retry-on-transport-failure).
   - Three sibling modules under `src/runtime/kernel/` carry concerns that used to live inline in the runtime file. Dependency direction is one-way (orchestrator → helpers/emitter/mock); no circular imports back.
     - **`runtime-arg-parser.ts`** — stateless interpolation and call-argument parsing (`interpolate`, `parseInlineCaptureCall`, `commaArgsToInterpolated`, `parseArgsRaw`, `parseInlineScriptAt`, `parseManagedArgAt`, `parseArgTokens`, `stripOuterQuotes`, `parsePromptSchema`, `sanitizeName`, `nowIso`) plus shared constants and the `ParsedArgToken` / `PromptSchemaField` types. Direct unit tests live in `runtime-arg-parser.test.ts`.
-    - **`runtime-event-emitter.ts`** — `RuntimeEventEmitter` owns **`__JAIPH_EVENT__`** writes on stderr (step/log traffic when not suppressed), **`run_summary.jsonl`** appends for the wider timeline (including workflow/prompt records that are summary-first), plus step/prompt sequence counters. Constructed with `{ runId, runDir, env, getFrameStack, getAsyncIndices, suppressLiveEvents? }`; the runtime delegates structured emission to it. The optional `suppressLiveEvents` flag (forwarded from `NodeWorkflowRuntime`'s `suppressLiveEvents` option) skips the live stderr **`__JAIPH_EVENT__`** lines while **`appendRunSummaryLine`** keeps updating **`run_summary.jsonl`** — used by in-process callers like the test runner that share stderr with `node --test` reporter output. The CLI's spawned `node-workflow-runner` child does not set it, so production runs stream events to stderr as before.
+    - **`runtime-event-emitter.ts`** — `RuntimeEventEmitter` owns **`__JAIPH_EVENT__`** writes on stderr (step/log traffic when not suppressed), **`run_summary.jsonl`** appends for the wider timeline (including workflow/prompt records that are summary-first), plus step/prompt sequence counters. Constructed with `{ runId, runDir, env, getFrameStack, getAsyncIndices, suppressLiveEvents? }`; the runtime delegates structured emission to it. The optional `suppressLiveEvents` flag (forwarded from `NodeWorkflowRuntime`'s `suppressLiveEvents` option) skips the live stderr **`__JAIPH_EVENT__`** lines while **`appendRunSummaryLine`** keeps updating **`run_summary.jsonl`** — used by in-process callers like the test runner that share stderr with `node --test` reporter output. The CLI's spawned **`__workflow-runner`** child does not set it, so production runs stream events to stderr as before.
     - **`runtime-mock.ts`** — `executeMockBodyDef` and `executeMockShellBody` for `*.test.jh` workflow/rule/script mocks. Shell-kind mocks run `bash -c`; steps-kind mocks dispatch back into the runtime via an `executeStepsBack` callback so the body runs against the full step interpreter.
-  - `buildRuntimeGraph()` (`graph.ts`) loads reachable modules with **`parsejaiph` only** (import closure); it does **not** run `validateReferences`. Cross-module refs are resolved from that graph at runtime. For **`script import`** declarations, `buildRuntimeGraph()` injects synthetic `ScriptDef` stubs (`graph.ts`) so reference resolution matches the validated compile path without re-reading external script bodies at graph-build time.
+  - `buildRuntimeGraph()` (`graph.ts`) accepts either an entry file path (legacy) or an already-loaded `ModuleGraph` and returns the runtime-ready view by injecting `ScriptDef` stubs for **`import script`** declarations so reference resolution matches the validated compile path without re-reading external script bodies. Cross-module refs are resolved from that graph at runtime. `RuntimeGraph` is a type alias for `ModuleGraph` — there is one canonical "all reachable modules" representation. The stub-injection helper (`attachScriptImportStubs`) is idempotent.
 
 - **Node Test Runner (`src/runtime/kernel/node-test-runner.ts`)**
   - Executes `*.test.jh` test blocks using `NodeWorkflowRuntime` with mock support (mock prompts, mock workflow/rule/script bodies). Pure Node harness — no Bash test transpilation.
@@ -63,11 +87,28 @@ All orchestration — local `jaiph run`, `jaiph test`, and **Docker `jaiph run`*
   - Prompt execution (`prompt.ts`), streaming parse (`stream-parser.ts`), schema (`schema.ts`), **`mock.ts`** (sequential prompt responses / mock-arm dispatch from test env JSON), **`runtime-mock.ts`** (mock workflow/rule/script **bodies** for `*.test.jh`), **`emit.ts`** (durable **`run_summary.jsonl`** helpers — `appendRunSummaryLine`, `formatUtcTimestamp` — consumed by `RuntimeEventEmitter`), **`workflow-launch.ts`** (spawn contract). **`RuntimeEventEmitter`** (`runtime-event-emitter.ts`) owns live **`__JAIPH_EVENT__`** lines on stderr and coordinates summary writes plus step/prompt sequence counters. Script subprocesses are launched directly from `NodeWorkflowRuntime`.
 
 - **Formatter (`src/format/emit.ts`)**
-  - `jaiph format` rewrites `.jh` / `.test.jh` files into canonical style. Pure AST→text emitter; no side-effects beyond file writes.
+  - `jaiph format` rewrites `.jh` / `.test.jh` files into canonical style. `emitModule(ast, trivia, opts?)` reads the semantic AST together with the parallel **`Trivia`** store ([Trivia (CST layer)](#trivia-cst-layer)) to round-trip leading comments, top-level order, `config` body sequence, `"""..."""` and `bareSource` forms, the original quotedness of top-level `const` values (`EnvDeclDef.wasQuoted` — `true` for `"…"` / `"""…"""` sources, `undefined` for bare tokens — so a quoted value is never silently rewritten as bare based on whether it contains a space), and prompt / script body discriminators. Step emission switches on `WorkflowStepDef.type` (8 variants) and an `emitExpr` helper switches on `Expr.kind` (8 kinds) — there are no dual code paths for "managed sidecar vs literal value" because that branch was removed from the AST. Call arguments render straight off the typed `Arg[]` — `var` → bare name, `literal` → raw — so the formatter no longer re-parses any args string or consults a `bareIdentifierArgs` shadow field. Pure data→text emitter; no side-effects beyond file writes. Round-trip is bit-for-bit on every fixture under `examples/` and `test-fixtures/golden-ast/fixtures/` — pinned by `src/format/roundtrip.test.ts`, which asserts `parse → format → parse → format` converges in one step on every fixture.
 
 - **Docker runtime helper (`src/runtime/docker.ts`)**
-  - Parses mount specs, resolves Docker config (image, network, timeout), and builds the `docker run` invocation when the CLI enables **Docker sandboxing** for `jaiph run` (environment-driven; there is no `jaiph run --docker` flag — see [Sandboxing](sandboxing.md)). The container runs the same `node-workflow-runner` entry as local execution. The default image is the official `ghcr.io/jaiphlang/jaiph-runtime` GHCR image; every selected image must already contain `jaiph` (no auto-install or derived-image build at runtime). Image preparation (`prepareImage`) runs before the CLI banner: it checks whether the image is local, pulls with `--quiet` if needed (short status lines on stderr instead of Docker’s default pull UI), and verifies that `jaiph` exists in the image. `spawnDockerProcess` does not pull or verify — it receives a pre-resolved image. The spawn call uses `stdio: ["ignore", "pipe", "pipe"]` — stdin is ignored so the Docker CLI does not block on stdin EOF, which would stall event streaming and hang the host CLI after the container exits.
-  - **Workspace immutability:** Docker runs cannot modify the host workspace. The host checkout is mounted read-only; `/jaiph/workspace` is a sandbox-local copy-on-write overlay discarded on exit. The only host-writable path is `/jaiph/run` (run artifacts). Workflows that need to capture workspace changes should write files (for example a `git diff` into a temp path) and publish them with `artifacts.save()`. See [Sandboxing](sandboxing.md) for the full contract and [Libraries — `jaiphlang/artifacts`](libraries.md#jaiphlangartifacts--publishing-files-out-of-the-sandbox).
+  - Parses mount specs, resolves Docker config (image, network, timeout), and builds the `docker run` invocation when the CLI enables **Docker sandboxing** for `jaiph run` (environment-driven; there is no `jaiph run --docker` flag — see [Sandboxing](sandboxing.md)). The container runs the same **`jaiph run --raw`** / **`__workflow-runner`** entry as local execution. The default image is the official `ghcr.io/jaiphlang/jaiph-runtime` GHCR image; every selected image must already contain `jaiph` (no auto-install or derived-image build at runtime). Image preparation (`prepareImage`) runs before the CLI banner: it checks whether the image is local, pulls with `--quiet` if needed (short status lines on stderr instead of Docker’s default pull UI), and verifies that `jaiph` exists in the image. `spawnDockerProcess` does not pull or verify — it receives a pre-resolved image. The spawn call uses `stdio: ["ignore", "pipe", "pipe"]` — stdin is ignored so the Docker CLI does not block on stdin EOF, which would stall event streaming and hang the host CLI after the container exits.
+  - **Workspace immutability:** By default Docker runs cannot modify the host workspace. The host checkout is mounted read-only (overlay) or as a disposable clone (copy); `/jaiph/workspace` is sandbox-local and discarded on exit. The only host-writable path is `/jaiph/run` (run artifacts). Workflows that need to capture workspace changes should write files (for example a `git diff` into a temp path) and publish them with `artifacts.save()`. The explicit opt-in **inplace** mode (truthy **`JAIPH_INPLACE`** — `1` or `true`, or `jaiph run --inplace`) breaks this contract on purpose — the host workspace itself is bind-mounted read-write so the run's edits persist live on the host, with the rest of the sandbox (caps, env allowlist, mount set) unchanged. See [Sandboxing](sandboxing.md) for the full contract and [Save artifacts](artifacts.md).
+
+## Local module graph
+{: #local-module-graph}
+
+The toolchain has one canonical representation — **`ModuleGraph`** — for "all `.jh` modules reachable from an entry point, parsed once." The same graph is used by the validator, the script emitter, and the runtime; on the default local `jaiph run` path it also crosses the parent CLI → child runner boundary so each reachable `.jh` is parsed exactly **once** per run.
+
+- **`loadModuleGraph(entryFile, workspaceRoot?)`** (`src/transpile/module-graph.ts`) walks the entry plus its transitive `import` edges through `resolveImportPath` and returns `{ entryFile, workspaceRoot?, modules: Map<absPath, { filePath, ast, imports: Map<alias, absPath> }> }`. **`<lib>/<path>`** imports (for example `jaiphlang/queue`) resolve through the workspace library fallback under `.jaiph/libs/` when a relative path does not exist. This is the **only** routine that reads `.jh` sources from disk; `parsejaiph(source, filePath)` itself is I/O-pure.
+- **`src/cli/commands/run.ts`** calls `loadModuleGraph` once after path normalization. The entry AST is reused for **`metadataToConfig(mod.metadata)`** (banner / `runtime` config). The same graph is passed to **`buildScriptsFromGraph(graph, outDir)`**, which calls **`emitScriptsForModuleFromGraph`** per reachable module; each call runs **`validateModule(ast, graph)`** against the in-memory ASTs.
+- **Process boundary.** The CLI serializes the graph with **`writeModuleGraph`** to **`<outDir>/.jaiph-module-graph.json`** (deterministic JSON: entries sorted by absolute path; ASTs included verbatim). It points the spawned **`__workflow-runner`** child at the file through the internal env var **`JAIPH_MODULE_GRAPH_FILE`**. The runner reads it back with **`readModuleGraph`** and passes the result to **`buildRuntimeGraph(graph)`**, which produces the runtime view (with **`import script`** stub injection) without touching disk. Cross-module workflow / rule / script resolution matches the on-disk load path.
+- **Scope of the env-var hand-off.** `JAIPH_MODULE_GRAPH_FILE` is set **only** when the host CLI spawns the local **`__workflow-runner`** child with Docker sandboxing disabled (`dockerConfigForBanner.enabled === false`). It is **not** set on these paths, which load the graph from disk inside the runner instead:
+  - **`jaiph run --raw`** — `runWorkflowRaw` (`src/cli/commands/run.ts`) calls `buildScripts` directly without writing the graph file; the runner uses inherited stdio and falls back to `loadModuleGraph` from the source file.
+  - **Docker `jaiph run`** — the host writes the graph file under `outDir`, but skips the env var because the inner container command is `jaiph run --raw …` and the host bind-mount layout does not plumb the cache file inside the container.
+  - **`jaiph test`** — `runSingleTestFile` builds the graph in `src/cli/commands/test.ts` and threads it through `runTestFile(graph, ...)` directly (no env var needed; same process).
+
+  When the env var is absent the runner falls back to the disk-walk parse path, preserving prior behavior.
+
+User-visible contracts (banner, hooks, run artifacts, `run_summary.jsonl`, `return_value.txt`, exit codes, `__JAIPH_EVENT__` streaming) are unchanged.
 
 ## Runtime vs CLI responsibilities
 
@@ -119,20 +160,21 @@ Channels are validated at compile time (`validateReferences` / send RHS rules) a
 
 ## Test runner integration (`*.test.jh` in the kernel)
 
-**How** `jaiph test` wires into the same stack as `jaiph run`: `*.test.jh` files are parsed in the CLI; `runTestFile()` drives blocks in-process. **`buildRuntimeGraph(testFile)`** is called **once per `runTestFile` invocation** and the resulting graph is reused across all blocks and `test_run_workflow` steps (the import closure is constant for a given test file within a single process run). Each `test_run_workflow` step resolves mocks against that cached graph, then constructs `NodeWorkflowRuntime` with `mockBodies` / mock prompt env, passing **`suppressLiveEvents: true`** so **`RuntimeEventEmitter`** skips writing **`__JAIPH_EVENT__`** lines to **stderr** while still appending **`run_summary.jsonl`** for that run. Without this flag, every workflow event would print to the test process's stderr and swamp `node --test` reporter output. Mock prompts, workflows, rules, and scripts are supported through the runtime's mock infrastructure.
+**How** `jaiph test` wires into the same stack as `jaiph run`: `runSingleTestFile` (`src/cli/commands/test.ts`) calls `loadModuleGraph(testFileAbs, workspaceRoot)` once, then threads the resulting `ModuleGraph` through `buildScriptsFromGraph(graph, tmpDir)` and `runTestFile(graph, …)`. `runTestFile` calls `buildRuntimeGraph(graph)` once per file and the runtime view is reused across all blocks and `test_run_workflow` steps (the import closure is constant for a given test file within a single process run). Each `test_run_workflow` step resolves mocks against that runtime view, then constructs `NodeWorkflowRuntime` with `mockBodies` / mock prompt env, passing **`suppressLiveEvents: true`** so **`RuntimeEventEmitter`** skips writing **`__JAIPH_EVENT__`** lines to **stderr** while still appending **`run_summary.jsonl`** for that run. Without this flag, every workflow event would print to the test process's stderr and swamp `node --test` reporter output. Mock prompts, workflows, rules, and scripts are supported through the runtime's mock infrastructure.
 
-Before that, the CLI prepares script executables via **`buildScripts(testFileAbs, tmpDir, workspaceRoot)`** — the same **`buildScripts`** helper as `jaiph run`, with the **test file as the entrypoint**. That walks the test module and its **import closure** (transitive `import` edges), runs **`validateReferences`** / **`emitScriptsForModule`** per reachable file, and writes `scripts/` so imported workflows have paths under `JAIPH_SCRIPTS`. Unrelated `*.jh` files elsewhere in the repo are not compiled unless imported.
+The `buildScriptsFromGraph` call writes `scripts/` so imported workflows have paths under `JAIPH_SCRIPTS`. Unrelated `*.jh` files elsewhere in the repo are not compiled unless imported.
 
 Authoring rules, fixtures, and mock syntax for `*.test.jh` are documented in [Testing](testing.md), not here.
 
 ## CLI progress reporting pipeline
 
-The progress UI combines a **static** step tree derived from the workflow AST (`src/cli/run/progress.ts`) with **live** updates from the runtime event stream. Event wiring: `src/cli/run/events.ts` and `src/cli/run/stderr-handler.ts` parse `__JAIPH_EVENT__` lines; `src/cli/run/emitter.ts` bridges into the renderer. Line-oriented formatting (`formatStartLine`, `formatHeartbeatLine`, `formatCompletedLine`) lives primarily in `src/cli/run/display.ts`, which shares some display helpers with `progress.ts`. Async branch numbering (subscript ₁₂₃… prefixes) is driven by `async_indices` on step and log events — the runtime propagates a chain of 1-based branch indices through `AsyncLocalStorage`, and the stderr handler renders them at the appropriate indent level. `const` steps whose value is a `match_expr` are walked for nested `run`/`ensure` arms; matched targets appear as child items in the step tree (e.g. `▸ script safe_name` under the `const` row). This pipeline does not apply to **`jaiph run --raw`**.
+The progress UI combines a **static** step tree derived from the workflow AST (`src/cli/run/progress.ts`) with **live** updates from the runtime event stream. Event wiring: `src/cli/run/events.ts` and `src/cli/run/stderr-handler.ts` parse `__JAIPH_EVENT__` lines; `src/cli/run/emitter.ts` bridges into the renderer. Line-oriented formatting (`formatStartLine`, `formatHeartbeatLine`, `formatCompletedLine`) lives primarily in `src/cli/run/display.ts`, which shares some display helpers with `progress.ts`. Async branch numbering (subscript ₁₂₃… prefixes) is driven by `async_indices` on step and log events — the runtime propagates a chain of 1-based branch indices through `AsyncLocalStorage`, and the stderr handler renders them at the appropriate indent level. `const` steps whose `Expr` value is `kind: "match"` are walked for nested `run` / `ensure` arms; matched targets appear as child items in the step tree (for example `▸ workflow my_flow` or `▸ rule my_rule` under the `const` row). This pipeline does not apply to **`jaiph run --raw`**.
 
 ## Distribution: Node vs Bun standalone
 
-- **Development / npm:** `npm run build` runs `tsc`, copies **`src/runtime/`** to **`dist/src/runtime/`** (kernel, `docker.ts`, etc.), then copies **`runtime/overlay-run.sh`** from the repo root into **`dist/src/runtime/overlay-run.sh`**. The published `jaiph` bin is **`node dist/src/cli.js`**.
-- **Standalone:** `npm run build:standalone` runs the same build, copies **`dist/src/runtime`** to **`dist/runtime`** beside the binary, then `bun build --compile ./src/cli.ts --outfile dist/jaiph`. Workflow launch still spawns `node-workflow-runner.js` using **`process.execPath`**, so the standalone artifact is **self-contained** (no separate Node install) when end users run that binary. **Bash** (or whatever shebang your `script` steps use) is still required on the host for script subprocesses. Ship **`dist/jaiph`** with **`dist/runtime`** alongside it so kernel paths resolve (same layout as `npm run build:standalone`; table in [Contributing](contributing.md)).
+- **Development / npm:** `npm run build` runs `npm run embed-assets` (regenerates **`src/runtime/embedded-assets.ts`** from `runtime/overlay-run.sh` and `docs/jaiph-skill.md`, and **`src/version.ts`** from `package.json`'s `version` field), then `tsc`, copies **`src/runtime/`** to **`dist/src/runtime/`** (kernel, `docker.ts`, etc.), and copies **`runtime/overlay-run.sh`** from the repo root into **`dist/src/runtime/overlay-run.sh`**. The published `jaiph` bin is **`node dist/src/cli.js`**.
+- **Standalone:** `npm run build:standalone` runs the same build, copies **`dist/src/runtime`** to **`dist/runtime`** beside the binary, then `bun build --compile ./src/cli.ts --outfile dist/jaiph`. Workflow launch self-spawns via **`process.execPath`** using the internal **`__workflow-runner`** argv marker (`src/runtime/kernel/workflow-launch.ts` + `src/cli/index.ts`): the node build invokes `node dist/src/cli.js __workflow-runner …`; the bun-compiled binary invokes itself, `jaiph __workflow-runner …`. The reserved marker is excluded from `--help`/usage and the file-shorthand path. `overlay-run.sh` and `docs/jaiph-skill.md` are also embedded base64 inside the executable via **`src/runtime/embedded-assets.ts`**, so the standalone artifact is **fully self-contained** — no sibling `runtime/` or `docs/` files required. The displayed `jaiph --version` string is sourced from the generated **`src/version.ts`** (codegen'd from `package.json` by `embed-assets`), so the literal is statically baked into both the `tsc` and the `bun build --compile` outputs without a runtime read of `package.json`. **Bash** (or whatever shebang your `script` steps use) is still required on the host for script subprocesses. Ship **`dist/jaiph`** alone, or with **`dist/runtime`** alongside it for parity with the npm layout (table in [Contributing](contributing.md)).
+- **Release artifacts:** `.github/workflows/release.yml` cross-compiles the standalone binary for **darwin/linux × arm64/x64** on **`v*`** tag pushes and on pushes to the **`nightly`** branch, generates a `SHA256SUMS` covering the four binaries, runs a `--version` sanity gate on the linux-x64 output, and uploads the five assets to the matching GitHub Release (stable tag or rolling **`nightly`** prerelease). Asset filenames are fixed by the installer contract — see [Contributing — Release asset naming contract](contributing.md#release-asset-naming-contract).
 
 ## Mermaid architecture diagram
 
@@ -140,26 +182,27 @@ The progress UI combines a **static** step tree derived from the workflow AST (`
 flowchart TD
     U[User / CI] --> CLI[CLI: Node or Bun jaiph]
 
-    subgraph Transpile["Per-module: emitScriptsForModule()"]
-        PARSE[parsejaiph]
-        VAL[validateReferences]
+    subgraph Transpile["Per-module: emitScriptsForModuleFromGraph()"]
+        VAL[validateModule]
         EMIT[Emit atomic script files under scripts/]
-        PARSE --> VAL
         VAL -->|compile errors| ERR[Deterministic compile errors]
         VAL --> EMIT
     end
 
-    CLI -->|jaiph run| BS1[buildScripts]
+    CLI -->|jaiph run| LMG1[loadModuleGraph entry + closure]
+    LMG1 --> BS1[buildScriptsFromGraph]
     BS1 --> Transpile
 
-    CLI -->|jaiph test| BS2[buildScripts(entry .test.jh)]
+    CLI -->|jaiph test| LMG2[loadModuleGraph(entry .test.jh)]
+    LMG2 --> BS2[buildScriptsFromGraph]
     BS2 --> Transpile
-    BS2 --> TR[Node Test Runner in-process]
+    LMG2 --> TR[Node Test Runner in-process]
 
-    Transpile -->|jaiph run local| RW[Node workflow runner child]
-    Transpile -->|jaiph run Docker| DC[Container runs node-workflow-runner]
+    Transpile -->|jaiph run local| RW[__workflow-runner child]
+    Transpile -->|jaiph run Docker| DC[Container: jaiph run --raw]
+    LMG1 -. JAIPH_MODULE_GRAPH_FILE (local non-Docker only) .-> RW
 
-    RW --> G[buildRuntimeGraph parse-only + imports]
+    RW --> G[buildRuntimeGraph from graph]
     G --> GRAPH[RuntimeGraph]
     RW --> RT[NodeWorkflowRuntime]
     RT --> GRAPH
@@ -193,29 +236,41 @@ Interactive **`jaiph run`** (no **`--raw`**): banner, progress tree, hooks, and
 sequenceDiagram
     participant User
     participant CLI as CLI jaiph run
-    participant Prep as buildScripts
-    participant TF as emitScriptsForModule per module
-    participant Runner as node-workflow-runner
-    participant Graph as buildRuntimeGraph
+    participant Load as loadModuleGraph
+    participant Prep as buildScriptsFromGraph
+    participant TF as emitScriptsForModuleFromGraph per module
+    participant Runner as __workflow-runner child
+    participant Graph as buildRuntimeGraph(graph)
     participant Runtime as NodeWorkflowRuntime
     participant Kernel as JS kernel
     participant Report as Artifacts (.jaiph/runs)
 
     User->>CLI: jaiph run main.jh args...
-    Note over CLI: parse once for metadata config only
-    CLI->>Prep: buildScripts(input)
-    Prep->>TF: loop: parse + validateReferences + emit
+    CLI->>Load: loadModuleGraph(entry, workspace)
+    Load-->>CLI: ModuleGraph (modules map)
+    Note over CLI: reuse entry AST for metadataToConfig / banner
+    CLI->>Prep: buildScriptsFromGraph(graph, outDir)
+    Prep->>TF: loop: validateModule + emit (in-memory AST)
     TF-->>Prep: scripts/ atomic only
     Prep-->>CLI: scriptsDir + env JAIPH_SCRIPTS
-    alt local
-        CLI->>Runner: spawn detached node-workflow-runner
+    alt local (non-Docker)
+        CLI->>CLI: writeModuleGraph(<outDir>/.jaiph-module-graph.json)
+        Note over CLI: set JAIPH_MODULE_GRAPH_FILE on child env
+        CLI->>Runner: spawn detached __workflow-runner child
     else Docker
         CLI->>CLI: prepareImage (pull --quiet + verify jaiph)
         Note over CLI: runs before banner so pull doesn't interleave
-        CLI->>Runner: spawn container running node-workflow-runner
+        CLI->>Runner: spawn container running jaiph run --raw
         Note over CLI: CLI parses events on stderr only
     end
-    Runner->>Graph: buildRuntimeGraph(sourceAbs) parse-only
+    alt JAIPH_MODULE_GRAPH_FILE set (local non-Docker)
+        Runner->>Runner: readModuleGraph(file)
+        Runner->>Graph: buildRuntimeGraph(graph)
+        Note over Graph: no .jh re-reads
+    else absent (Docker / --raw / test runner)
+        Runner->>Runner: loadModuleGraph(sourceAbs, workspace)
+        Runner->>Graph: buildRuntimeGraph(graph)
+    end
     Graph-->>Runner: RuntimeGraph
     Runner->>Runtime: runDefault(run args)
     Runtime->>Kernel: prompt / managed scripts / emit / inbox
@@ -226,7 +281,7 @@ sequenceDiagram
     CLI-->>User: PASS/FAIL
 ```
 
-**Docker:** the inner container command is **`jaiph run --raw …`** (see [Sandboxing](sandboxing.md#docker-container-isolation)): no banner or progress UI inside the container; **`__JAIPH_EVENT__`** lines still appear on stderr for the host CLI to parse.
+**Docker:** the inner container command is **`jaiph run --raw …`** (see [Sandboxing](sandboxing.md)): no banner or progress UI inside the container; **`__JAIPH_EVENT__`** lines still appear on stderr for the host CLI to parse.
 
 ## Sequence diagram: `jaiph test` flow
 
@@ -234,20 +289,20 @@ sequenceDiagram
 sequenceDiagram
     participant User
     participant CLI as CLI jaiph test
-    participant Parser as parsejaiph
-    participant Prep as buildScripts(test file)
+    participant Load as loadModuleGraph
+    participant Prep as buildScriptsFromGraph
     participant TestRunner as runTestFile / runTestBlock
-    participant Graph as buildRuntimeGraph
+    participant Graph as buildRuntimeGraph(graph)
     participant Runtime as NodeWorkflowRuntime
     participant Report as Artifacts
 
     User->>CLI: jaiph test flow.test.jh
-    CLI->>Parser: parse test file
-    Parser-->>CLI: jaiphModule + tests[] blocks
-    CLI->>Prep: buildScripts(test path, tmp) import closure
+    CLI->>Load: loadModuleGraph(test file, workspace)
+    Load-->>CLI: ModuleGraph (entry + import closure)
+    CLI->>Prep: buildScriptsFromGraph(graph, tmp)
     Prep-->>CLI: scriptsDir
-    CLI->>TestRunner: runTestFile(test path workspace scriptsDir blocks)
-    TestRunner->>Graph: buildRuntimeGraph(test file) once per file
+    CLI->>TestRunner: runTestFile(graph, workspace, scriptsDir, blocks)
+    TestRunner->>Graph: buildRuntimeGraph(graph) once per file
     Graph-->>TestRunner: RuntimeGraph cached
     loop each test block
         TestRunner->>TestRunner: mocks / shell steps / expectations
@@ -264,9 +319,9 @@ sequenceDiagram
 
 ## Summary
 
-- `.jh` / `*.test.jh` share parser/AST; **compile-time** validation runs in **`emitScriptsForModule`** during **`buildScripts`**. **`buildRuntimeGraph`** loads modules with **parse-only** imports.
-- **`jaiph compile`** walks import closures with **`validateReferences` only**, and exits — no **`scripts/`** emission (**no **`buildScriptFiles`** / **`buildScripts`**), no **`buildRuntimeGraph()`**, no runner spawn. Directory discovery omits **`*.test.jh`** unless you pass a test file explicitly.
-- **Node-only runtime:** all execution — local `jaiph run`, Docker `jaiph run`, and `jaiph test` — goes through `NodeWorkflowRuntime`. Docker containers run `node-workflow-runner` with the compiled JS tree and scripts mounted, using the same semantics as local execution.
+- `.jh` / `*.test.jh` share parser/AST. The pipeline is **`loadModuleGraph` → `buildScriptsFromGraph(graph, outDir)`** (per-module **`validateModule`** + **`buildScriptFiles`** via **`emitScriptsForModuleFromGraph`**); `parsejaiph` is I/O-pure and graph-based validation / emit operate entirely in-memory. **`buildRuntimeGraph`** consumes the same `ModuleGraph` (loaded in the runner from disk or — on the default local **`jaiph run`** path — deserialized from the parent CLI's graph file via **`JAIPH_MODULE_GRAPH_FILE`**; see [Local module graph](#local-module-graph)).
+- **`jaiph compile`** walks import closures through **`collectDiagnostics(graph)`** (the multi-error sibling of **`validateReferences`**), prints the full diagnostic set sorted by `(file, line, col)`, and exits non-zero on any non-empty set — no **`scripts/`** emission (no **`buildScriptFiles`** / **`buildScripts`**), no **`buildRuntimeGraph()`**, no runner spawn. Directory discovery omits **`*.test.jh`** unless you pass a test file explicitly.
+- **Node-only runtime:** all execution — local `jaiph run`, Docker `jaiph run`, and `jaiph test` — goes through `NodeWorkflowRuntime`. Docker containers run **`jaiph run --raw`** / **`__workflow-runner`** with the compiled JS tree and scripts mounted, using the same semantics as local execution.
 - **CLI** owns launch, observation, hooks (except **`jaiph run --raw`**), and runtime preparation (`buildScripts`). **`jaiph run --raw`** still emits **`__JAIPH_EVENT__`** on stderr from the runtime; the CLI does not attach the interactive progress/hooks pipeline. **`jaiph test`** passes **`suppressLiveEvents: true`** into **`NodeWorkflowRuntime`** so **`RuntimeEventEmitter`** skips writing those live stderr lines while **`run_summary.jsonl`** still records workflow traffic where the emitter appends it.
 - Workflow execution runs in **`NodeWorkflowRuntime`**, with **script steps** as managed subprocesses.
 - No workflow-level `.sh` files or `jaiph_stdlib.sh` are produced or required.
diff --git a/docs/artifacts.md b/docs/artifacts.md
index 397bff1a..70952d01 100644
--- a/docs/artifacts.md
+++ b/docs/artifacts.md
@@ -1,51 +1,89 @@
 ---
-title: Runtime artifacts
-permalink: /artifacts
+title: Save artifacts
+permalink: /how-to/artifacts
+diataxis: how-to
 redirect_from:
+  - /artifacts
   - /artifacts.md
 ---
 
-# Runtime artifacts
+# Save artifacts
 
-Long-running orchestration tools usually split **telemetry you watch while something runs** from **evidence you keep after it stops**. The first answers “what is happening now?”; the second answers “what happened, in enough detail to debug or audit later?” Jaiph does the same.
+This recipe publishes files from a workflow into the run's `artifacts/` directory under the run logs root (`.jaiph/runs/` by default). That is the supported export path when Docker sandboxing is on — in the default overlay and copy modes, workspace edits are discarded at container exit, but anything copied into `artifacts/` remains on the host.
 
-For Jaiph, **live** observation is the `__JAIPH_EVENT__` JSON line protocol on the workflow runner’s **stderr** (what the interactive CLI and [Hooks](hooks.md) consume). **Durable** observation is a directory tree on disk: step captures, an append-only summary timeline, optional inbox copies, and a writable `artifacts/` folder for anything workflows publish explicitly.
+The runtime always creates an `artifacts/` directory under the run log directory and exposes its absolute path as `JAIPH_ARTIFACTS_DIR`. The `jaiphlang/artifacts` library is the canonical way to copy files into that directory; you can also write there directly from a `script` step.
 
-When you run a workflow, or `jaiph test` executes workflows inside test blocks, **`NodeWorkflowRuntime`** materializes that durable tree. **`jaiph run`** defaults to `<workspace>/.jaiph/runs/`; override with `run.logs_dir` or **`JAIPH_RUNS_DIR`** (see [Configuration — Run keys](configuration.md#run-keys)). The test runner uses its own ephemeral runs root under **`JAIPH_RUNS_DIR`** so normal workspace runs are not overwritten — see [Configuration — Testing with `jaiph test`](configuration.md#testing-with-jaiph-test). The layout below matches what the runtime creates in the constructor (see [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout)). In Docker mode, paths inside recorded events may use container prefixes (`/jaiph/run/…`); the CLI maps them to host paths when reporting failures — see [Sandboxing — Path remapping](sandboxing.md#path-remapping).
+## Prerequisites
 
-## Run directory layout
+- A workspace with `.jaiph/libs/jaiphlang/` installed (`jaiph install jaiphlang`) if you want to use the library — see [Use & publish a library](/how-to/libraries).
+- The file(s) you want to save exist by the time the `artifacts.save(...)` step runs.
 
-The runtime uses a UTC-dated hierarchy. Each run gets its own folder: UTC date, then UTC time plus a **basename** used only for naming (not a path): **`JAIPH_SOURCE_FILE`** when set in the environment (the CLI and `node-workflow-runner` set this to the entry file basename), otherwise `basename(graph.entryFile)` from the parsed graph.
+## 1. Import the library
 
+```jh
+import "jaiphlang/artifacts" as artifacts
 ```
-.jaiph/runs/
-  <YYYY-MM-DD>/                       # UTC date (see NodeWorkflowRuntime)
-    <HH-MM-SS>-<source-basename>/       # UTC time + basename (see above)
-      000001-module__step.out          # stdout capture per step (6-digit seq prefix)
-      000001-module__step.err          # stderr capture (may be empty)
-      artifacts/                       # user-published files (`jaiphlang/artifacts`); `JAIPH_ARTIFACTS_DIR`
-      inbox/                           # audit copies of routed channel payloads (optional)
-      heartbeat                        # liveness: epoch ms, refreshed about every 10s
-      return_value.txt                 # `runDefault` only: status 0 and `returnValue` defined (may be "")
-      run_summary.jsonl                # durable event timeline (JSON Lines)
+
+## 2. Save a single file
+
+```jh
+workflow default() {
+  # ... produce ./build/output.bin somehow ...
+  const dest = run artifacts.save("./build/output.bin")
+  log "saved to ${dest}"
+}
 ```
 
-Sequence numbers in those filenames are **monotonic and unique** per run. `RuntimeEventEmitter` owns a single in-memory counter (`allocStepSeq`) that advances whenever a step allocates paired capture files: **`executeManagedStep`** (nested **`workflow`** / **`rule`**, **`script`** references, inline scripts, and **`shell`** lines run via `sh -c`) plus **`prompt`** steps (which call `allocStepSeq` inside `emitPromptStepStart`). Ordinary **`log`**, **`logerr`**, **`fail`**, **`send`**, and most **`const`** bindings do **not** open new numbered `.out`/`.err` pairs — they still emit **`LOG`/`LOGERR`** or **`INBOX_ENQUEUE`** records (and related lines) into **`run_summary.jsonl`** where applicable. There is **no** `.seq` file in the run directory. For the live vs durable split, see [Architecture — Contracts](architecture.md#contracts): `__JAIPH_EVENT__` on stderr is the streaming path; `run_summary.jsonl` is the durable timeline.
+`save` copies the source path into `${JAIPH_ARTIFACTS_DIR}/...` preserving the relative layout (the leading `./` is stripped). Absolute source paths are copied using `basename` only. The workflow value is the absolute destination path.
 
-## What each artifact is for
+## 3. Save several files at once
 
-- **`*.out` / `*.err`** — Paired capture files for steps that record subprocess or prompt I/O. The runtime creates both paths at **`STEP_START`**. For **managed** steps (extracted scripts, nested workflows/rules, single-line `shell`, and similar), stdout/stderr are **streamed** into the files during execution, then **rewritten** with the final aggregated strings at step end — so a long-running step’s `.out` can be tailed while it runs (see [CLI — Run artifacts and live output](cli.md#run-artifacts-and-live-output)). **Prompt** steps stream the model transcript into `.out`; `.err` is only overwritten when stderr from the backend is non-empty (otherwise the placeholder file stays zero-length). **Errors and CLI progress** still use the live `__JAIPH_EVENT__` stream on stderr; these files are the on-disk record.
+`save` accepts a **newline-separated** list of paths. Blank or whitespace-only lines are ignored:
+
+```jh
+workflow default() {
+  const paths = """
+  a.txt
+  b/nested.txt
+  """
+  const dests = run artifacts.save(paths)
+  log "${dests}"
+}
+```
 
-- **`run_summary.jsonl`** — Append-only JSON Lines timeline: workflow boundaries, step start/end, `LOG` / `LOGERR`, prompt lifecycle, inbox events, and the same step payload fields as the live stream. It is **truncated to empty at runtime startup**, then each event appends a line via `appendRunSummaryLine` as execution proceeds. The in-process test runner can set `suppressLiveEvents`, which **stops** `__JAIPH_EVENT__` lines from going to stderr while **`run_summary.jsonl` keeps updating** (see [Architecture — Core components](architecture.md#core-components), `RuntimeEventEmitter`).
+The returned value is the newline-separated list of absolute destination paths, in the same order.
 
-- **`inbox/`** — When channels are used, a **`send`** may persist a copy of the payload here (`NNN-<channel>.txt`) for audit. The runtime walks ancestor workflow contexts and writes a file **only when it finds a matching route for that channel** on the stack (same condition as “routed” dispatch — see [Inbox & Dispatch](inbox.md)); unrouted sends enqueue without creating `inbox/` files. Delivery stays in-memory; this directory is not a mailbox API.
+## 4. (Alternative) Write directly from a script step
+
+If you need full control of layout or names, write to `$JAIPH_ARTIFACTS_DIR` from a `script` step:
+
+```jh
+script save_report = ```
+  mkdir -p "$JAIPH_ARTIFACTS_DIR/reports"
+  cp ./report.html "$JAIPH_ARTIFACTS_DIR/reports/"
+```
 
-- **`heartbeat`** — Best-effort file containing a wall-clock millisecond timestamp, rewritten on a timer (~10s). Liveness for external watchdogs; not required for normal CLI use.
+workflow default() {
+  run save_report()
+}
+```
+
+The runtime also sets `JAIPH_RUN_DIR`, `JAIPH_RUN_SUMMARY_FILE`, and `JAIPH_RUN_ID` on script steps if you need those paths.
+
+## Verification
+
+After the run, list the artifacts directory:
+
+```bash
+ls <runs_root>/<YYYY-MM-DD>/<HH-MM-SS>-<source>/artifacts/
+```
 
-- **`return_value.txt`** — Written only from **`runDefault`** (the normal **`jaiph run`** entry path) when the top-level workflow finishes with **exit status 0** and the aggregated result has **`returnValue !== undefined`** (empty string is allowed and produces a zero-byte file; **`undefined`** means the file is omitted — typically “fell off the end” of the workflow without a **`return`**). **`runNamedWorkflow`** (`test_run_workflow`, nested named runs, etc.) returns the value to the caller but does **not** write this file.
+Replace `<runs_root>` with `.jaiph/runs` when `JAIPH_RUNS_DIR` is unset, or with your configured runs directory otherwise. Date and time segments are UTC; `<source>` is the entry-file basename (or `JAIPH_SOURCE_FILE` when set). You should see the files your workflow saved. Under Docker sandboxing the host path is the same — the run mount at `/jaiph/run` inside the container is bound to the host runs root, so artifacts land on the host even though the run executed inside the container.
 
-- **`artifacts/`** — Created in the constructor together with the empty **`run_summary.jsonl`** (truncated file). The runtime sets **`JAIPH_ARTIFACTS_DIR`**, **`JAIPH_RUN_DIR`**, **`JAIPH_RUN_SUMMARY_FILE`**, and **`JAIPH_RUN_ID`**: if **`JAIPH_RUN_ID`** is already set in the incoming environment it is preserved; otherwise a new UUID is generated. User workflows usually publish into **`artifacts/`** through **`jaiphlang/artifacts`** (`artifacts.save`). In Docker mode it sits under the **host-writable** run mount (`/jaiph/run/...` inside the container), not the read-only workspace overlay. See [Libraries — `jaiphlang/artifacts`](libraries.md#jaiphlangartifacts--publishing-files-out-of-the-sandbox) and [Sandboxing](sandboxing.md).
+`artifacts.save(...)` exits with a failure when the input list is empty after trimming, when any listed path is missing or not a regular file, or when `JAIPH_ARTIFACTS_DIR` is unset — wrap the call in `recover` / `catch` if you want the workflow to tolerate that.
 
-## Keeping runs out of git
+## Related
 
-Run `jaiph init` to add `.jaiph/.gitignore` entries for `runs` and `tmp` under `.jaiph/`. You can mirror those paths in a root `.gitignore` if you prefer.
+- [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout) — the full run directory tree, including where `artifacts/` sits.
+- [Use & publish a library](/how-to/libraries) — installing `jaiphlang/artifacts` and writing your own libraries.
+- [Sandboxing — The three sandbox modes](sandboxing.md#the-three-sandbox-modes) — overlay and copy discard workspace edits; artifacts persist on the host in every mode.
diff --git a/docs/cli.md b/docs/cli.md
index b956872f..2bc3fd07 100644
--- a/docs/cli.md
+++ b/docs/cli.md
@@ -1,474 +1,298 @@
 ---
-title: CLI Reference
-permalink: /cli
+title: CLI
+permalink: /reference/cli
+diataxis: reference
 redirect_from:
+  - /cli
   - /cli.md
 ---
 
-# Jaiph CLI Reference
+# CLI
 
-Jaiph is a workflow system: authors write `.jh` modules, and a **TypeScript CLI** prepares scripts, launches a **Node workflow runtime**, and surfaces progress while the **JavaScript kernel** executes the AST in process (no separate workflow shell). The CLI is what you install as the `jaiph` binary — it is the boundary between your terminal or CI and the interpreter.
+This page is the authoritative inventory of the `jaiph` CLI: every subcommand, every flag, every exit-relevant behaviour. It does not explain how to choose between commands — see [Why Jaiph](why-jaiph.md) for context and the how-to pages for recipes.
 
-At a high level, the CLI does four things: **compile** script bodies from your module graph (`buildScripts`), **spawn** the detached workflow runner (`node-workflow-runner`) for `jaiph run`, **observe** `__JAIPH_EVENT__` lines on stderr to render progress and drive hooks (unless `--raw`), and **leave** durable artifacts under `.jaiph/runs`. `jaiph test` reuses the same compilation step and runtime kernel but executes test blocks in-process with mocks — see [Architecture](architecture.md) for the full pipeline.
+The published `jaiph` bin is `node dist/src/cli.js` (npm) or the standalone `dist/jaiph` (Bun-compiled). Both dispatch through `src/cli/index.ts`.
 
-This page lists **commands**, important **flags**, and **environment variables**. It focuses on how the tool behaves, not on the language itself. For semantics and the overall language model, see [Language](language.md). For concrete syntax rules (imports, orchestration strings, managed calls, …), see [Grammar](grammar.md). For repository layout, pipelines, and contracts (`__JAIPH_EVENT__`, artifacts, Docker vs local), see [Architecture](architecture.md).
+## Invocation forms
 
-**Commands:** `run`, `test`, `compile`, `format`, `init`, `install`, `use`.
+| Form | Effect |
+|---|---|
+| `jaiph` | Print the overview and exit `0`. |
+| `jaiph --help` / `-h` | Print the overview and exit `0`. |
+| `jaiph --version` / `-v` | Print the CLI version and exit `0`. |
+| `jaiph <subcommand> [-h \| --help]` | Print the subcommand's usage (flags + one example) and exit `0`. Recognised anywhere in the arg list before `--` (except `compile`: help flags must precede path arguments). |
+| `jaiph <path>` | File shorthand. Paths ending in `*.test.jh` route to `jaiph test`; other `*.jh` paths route to `jaiph run`. Non-existent paths fall through to normal command parsing. |
+| `jaiph <unknown>` | Print `Unknown command: <name>`, repeat the overview, exit `1`. |
 
-**Global options:** `-h` / `--help` and `-v` / `--version` are recognized only as the **first token after `jaiph`** (e.g. `jaiph --help`). They are not treated as global flags after a subcommand or a file path (`jaiph run --help` is **not** usage — use `jaiph --help`, or **`jaiph compile -h`** / **`jaiph compile --help`** for compile-specific usage — the `compile` command parses `-h` / `--help` after the subcommand). Running **`jaiph`** with no arguments prints the same overview and exits **0**.
+The reserved internal marker `__workflow-runner` is excluded from `--help`/usage and from the file-shorthand path; it is used by `process.execPath` self-spawn (see [Architecture — Distribution: Node vs Bun standalone](architecture.md#distribution-node-vs-bun-standalone)).
 
-Any other unknown first token prints `Unknown command: …`, repeats the overview, and exits **1**.
+## Subcommand summary
 
-## File shorthand
-
-If the **first argument after `jaiph`** is an **existing path** (resolved relative to the current working directory), Jaiph routes it automatically based on the extension. Files ending in **`*.test.jh`** are run as tests (same as `jaiph test <file>`). Other paths ending in **`.jh`** are run as workflows (same as `jaiph run <file>`). The `*.test.jh` check happens first, so test modules are never mistaken for workflows. Paths that do not exist fall through to normal command parsing (e.g. you cannot rely on shorthand for a not-yet-created file).
-
-Additional positional tokens after a **workflow** shorthand are forwarded to **`workflow default`**, matching `jaiph run`. Tokens after a **test** shorthand are accepted but **ignored** (same as `jaiph test <file>` with extra arguments).
-
-```bash
-# Workflow shorthand
-jaiph ./flows/review.jh "review this diff"
-# equivalent to: jaiph run ./flows/review.jh "review this diff"
-
-# Test shorthand
-jaiph ./e2e/say_hello.test.jh
-# equivalent to: jaiph test ./e2e/say_hello.test.jh
-```
+| Subcommand | Purpose |
+|---|---|
+| `run` | Compile, launch, and observe one workflow run (with optional Docker sandboxing). |
+| `test` | Execute `*.test.jh` blocks in-process with mocks. |
+| `compile` | Multi-error validation pass — no `scripts/` emission, no runtime spawn. |
+| `format` | Rewrite `.jh` / `.test.jh` files into canonical style. |
+| `init` | Initialize `.jaiph/` directory layout in a workspace. |
+| `install` | Install project-scoped libraries from the registry or git URLs. |
+| `use` | Reinstall `jaiph` globally with a selected version or channel. |
 
 ## `jaiph run`
 {: #jaiph-run}
 
-Parse, validate, and run a Jaiph workflow file. Requires a `workflow default` entrypoint.
-
-```bash
-jaiph run [--target <dir>] [--raw] <file.jh> [--] [args...]
-```
-
-Any path ending in `.jh` is accepted (including `*.test.jh`, since the extension is still `.jh`). For files that only contain test blocks, use `jaiph test` instead.
-
-**Sandboxing:** whether the workflow runs in a **Docker container** or **directly on the host** is decided from environment variables and the workflow’s `runtime` metadata — there is no `jaiph run --docker` flag. Defaults and mounts are documented in [Sandboxing](sandboxing.md).
-
-**Flags:**
-
-- **`--target <dir>`** — keep emitted script files and run metadata under `<dir>` instead of a temp directory (useful for debugging).
-- **`--raw`** — skip the banner, live progress tree, hooks, and CLI failure footer. The workflow runner child uses **inherited stdio** so `__JAIPH_EVENT__` JSON lines go to **stderr** unchanged. When **Docker sandboxing** is used, the **host** runs interactive `jaiph run` and the **container** runs `jaiph run --raw …` so the host can parse events from the container’s stderr ([Architecture](architecture.md), [Sandboxing](sandboxing.md)). **Important:** if you invoke `jaiph run --raw` yourself on the host, the CLI takes a separate code path that **never starts Docker** — workflow execution runs locally in that process even when `JAIPH_DOCKER_ENABLED=true`. Use `--raw` for embedding or piping; use interactive `jaiph run` (no `--raw`) when you want the CLI to apply sandbox env rules. There is no PASS/FAIL line, **`return_value.txt` is not printed to stdout**, and the process exit code alone reflects success or failure. See [Sandboxing — Runtime behavior](sandboxing.md#runtime-behavior).
-- **`--`** — end of Jaiph flags; remaining args are passed to `workflow default` (e.g. `jaiph run file.jh -- --verbose`).
-
-**Examples:**
-
-```bash
-jaiph run ./.jaiph/bootstrap.jh
-jaiph run ./flows/review.jh "review this diff"
-```
+Compile and execute a workflow's `default` entrypoint.
 
-### Argument passing
-
-Positional arguments are available inside `script` bodies as standard bash `$1`, `$2`, `"$@"`. In Jaiph orchestration strings (`log`, `prompt`, `fail`, `return`, `send`, `run`/`ensure` args), use **named parameters** (e.g. `workflow default(task)` → `${task}`) — only `${identifier}` forms are supported (no shell parameter expansion). The same rule applies to `prompt` text and to `const` RHS strings where orchestration applies.
-
-Rules receive forwarded arguments through `ensure`:
-
-```jaiph
-script check_branch = `test "$(git branch --show-current)" = "$1"`
-
-rule current_branch(expected) {
-  run check_branch("${expected}")
-}
-
-workflow default() {
-  ensure current_branch("main")
-}
+```text
+jaiph run [--target <dir>] [--raw] [--workspace <dir>] [--inplace] [--unsafe] [--yes|-y] <file.jh> [--] [args...]
 ```
 
-**Rule** bodies are **managed steps only** — no raw shell lines; use `run` to a `script` for shell execution. **Workflow** bodies may include **inline shell** lines that do not parse as a Jaiph step (the compiler still validates them); for anything non-trivial, prefer a top-level `script` and `run`. In bash-bearing contexts (mainly `script` bodies, and restricted `const` / send RHS forms), `$(...)` and the first command word are validated: they must not invoke Jaiph rules, workflows, or scripts, contain inbox send (`<-`), or use `run` / `ensure` as shell commands (`E_VALIDATE`). See [Grammar — Language concepts](grammar.md#language-concepts) and [Grammar — Managed calls vs command substitution](grammar.md#managed-calls-vs-command-substitution).
-
-For `const` in those bodies, a reference plus arguments on the RHS must be written as `const name = run ref([args...])` (or `ensure` for rule capture), not as `const name = ref([args...])` — the latter is `E_PARSE` with text that explains the fix.
-
-### Shebang execution
+Sandbox selection is environment-driven; there is no `--docker` flag. The boolean sandbox flags (`--inplace`, `--unsafe`, `--yes`) are CLI front-ends that mutate the launched runtime env for one run only — see [Configuration — Precedence](configuration.md#precedence) and [Environment variables](env-vars.md).
 
-If a `.jh` file is executable and has `#!/usr/bin/env jaiph`, you can run it directly:
+### Flags
 
-```bash
-./.jaiph/bootstrap.jh "task details"
-./flows/review.jh "review this diff"
-```
-
-### Compile-time and process model
+| Flag | Argument | Effect |
+|---|---|---|
+| `--target` | `<dir>` | Keep emitted script files and run metadata under `<dir>` instead of a temp directory. |
+| `--raw` | — | Skip the banner, live progress tree, hooks, and PASS/FAIL footer. The runner child inherits stdio; `__JAIPH_EVENT__` JSON lines go to stderr unchanged. Host `--raw` never launches Docker even when `JAIPH_DOCKER_ENABLED=true`. |
+| `--workspace` | `<dir>` | Override the workspace root used for library resolution and the Docker workspace mount. A missing value, missing path, or non-directory aborts with a specific message. There is no `JAIPH_WORKSPACE` env equivalent input — that name is reserved for the in-container remap output. |
+| `--inplace` | — | Front-end for `JAIPH_INPLACE=1`. |
+| `--unsafe` | — | Front-end for `JAIPH_UNSAFE=true`. Cannot be combined with `--inplace` (`E_FLAG_CONFLICT`). |
+| `-y`, `--yes` | — | Front-end for `JAIPH_INPLACE_YES=1`. Required to use `--inplace` non-interactively. |
+| `--` | — | End of Jaiph flags; remaining tokens are forwarded to `workflow default`. |
 
-The CLI runs `buildScripts()`, which walks the entry file and its import closure. Each reachable module is parsed and `validateReferences` runs before script files are written. Unrelated `.jh` files on disk are not read.
+### Pre-flight
 
-After validation, the CLI spawns the Node workflow runner as a detached child. The runner loads the graph with `buildRuntimeGraph()` (parse-only imports; no `validateReferences` here) and executes `NodeWorkflowRuntime`. Prompt steps, script subprocesses, inbox dispatch, and event emission are handled in the runtime kernel — workflows and rules are interpreted in-process; only `script` steps spawn a managed shell. The CLI listens on stderr for `__JAIPH_EVENT__` JSON lines, the single event channel for all execution modes. Stdout carries only plain script output, forwarded to the terminal as-is.
+After module-graph load and Docker-mode resolution, before the runner / container is spawned, the host CLI runs a credential pre-flight (`src/cli/run/preflight-credentials.ts`). Missing credentials produce either `E_AGENT_CREDENTIALS` (hard error) or a warning depending on backend and Docker mode — see [Authenticate agent backends](/how-to/agent-auth) and [Configuration — Credential pre-flight](configuration.md#credential-pre-flight). `jaiph run --raw` does not run the pre-flight.
 
-### Run progress and tree output
+### Progress markers
 
-During `jaiph run`, the CLI renders a live tree of steps. Each step appears as a line with a marker, the step kind (`workflow`, `prompt`, `script`, `rule`), and the step name:
+| Marker | Meaning |
+|---|---|
+| `▸` | Step started. |
+| `✓` | Step completed successfully (with elapsed time). |
+| `✗` | Step failed (with elapsed time). |
+| `ℹ` | `log` message (dim/gray, no marker timing). |
+| `!` | `logerr` message (red; rendered on stdout with the progress tree). |
+| `·` | Continuation marker (heartbeat lines in non-TTY mode). |
+| ` ₁`, ` ₂`, … | Subscript prefix for `run async` branch numbering. |
 
-- **`▸`** — step started
-- **`✓`** / **`✗`** — step completed (pass/fail), with elapsed time (e.g. `✓ workflow scanner (0s)`, `✗ rule ci_passes (11s)`)
-- **`ℹ`** — `log` message (dim/gray, inline at the correct depth; no marker, spinner, or timing)
-- **`!`** — `logerr` message (red, writes to stderr)
+PASS line: `✓ PASS workflow default (0.2s)`. TTY runs append a transient `▸ RUNNING workflow <name> (X.Xs)` line that is replaced by the PASS/FAIL line on exit. `--raw` and non-TTY modes skip both. Disable color globally with `NO_COLOR=1`.
 
-The root PASS/FAIL summary uses the format `✓ PASS workflow default (0.2s)`. Completion lines include the step kind and name so each line is self-identifying even when multiple steps run concurrently.
+Non-TTY heartbeat cadence is controlled by `JAIPH_NON_TTY_HEARTBEAT_FIRST_SEC` (default `60`) and `JAIPH_NON_TTY_HEARTBEAT_INTERVAL_MS` (default `30000`, floor `250`).
 
-**`log` / `logerr` and backslash escapes:** The displayed text follows `echo -e` semantics — a literal `\n` or `\t` in the message becomes a newline or tab. `LOG` / `LOGERR` JSON on stderr (and the `message` field in `run_summary.jsonl`) carries the unexpanded shell string.
+### Step display
 
-**TTY mode:** one extra line at the bottom shows the running workflow and elapsed time: `▸ RUNNING workflow <name> (X.Xs)` — updated in place every second. When the run completes, it is replaced by the final PASS/FAIL line.
+Step lines include the kind (`workflow`, `prompt`, `script`, `rule`) and name. Parameterised invocations append `key="value"` pairs in parentheses (positional params use `1=…` / `2=…`); whitespace is collapsed; values are truncated to 32 characters. Prompt step lines additionally show the backend name (or custom command basename) and the first 24 characters of the prompt body in quotes (full line capped at 96 characters).
 
-**Successful exit:** when the default workflow exits **0**, the CLI prints `✓ PASS workflow default (...)` plus elapsed time (see above). If the workflow **returns** a value, the runtime writes `return_value.txt` under the run directory; the CLI prints that value on stdout **after** the PASS line, separated by a blank line (host paths are unchanged; Docker runs remap container paths when reading the file). See [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout).
+### Return values
 
-**Non-TTY mode** (CI, pipes, log capture): no RUNNING line and no in-place updates. Step start (▸) and completion (✓/✗) lines still print as they occur. Long-running steps additionally print **heartbeat** lines to avoid looking like a hang:
+When `workflow default` returns a value (success only), the runtime writes `return_value.txt` under the run directory. Interactive `jaiph run` prints that value on stdout after the PASS line, separated by a blank line. `jaiph run --raw` never prints it to stdout; the file alone is the contract.
 
-- Format: `· <kind> <name> (running <N>s)` — entire line dim/gray (plain text with `NO_COLOR`).
-- Cadence: first heartbeat after `JAIPH_NON_TTY_HEARTBEAT_FIRST_SEC` seconds (default **60**), then every `JAIPH_NON_TTY_HEARTBEAT_INTERVAL_MS` milliseconds (default **30000**; minimum **250**). Short steps emit no heartbeats.
-- Nested steps: heartbeats describe the innermost (deepest active) step.
+### Run artifacts
 
-**Event stream:** on stderr, the runtime emits `__JAIPH_EVENT__` lines (JSON). The CLI parses them to drive the tree, hooks, and failure summaries. Other stderr text is forwarded to the terminal. If a payload is not valid JSON, the CLI treats it as plain stderr.
+Each run directory is `<JAIPH_RUNS_DIR>/<YYYY-MM-DD>/<HH-MM-SS>-<source>/`, UTC. `<source>` is `JAIPH_SOURCE_FILE` if set, otherwise the entry-file basename. Layout pinned in [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout).
 
-**Parameterized invocations** show argument values inline in gray after the step name:
+Step `.out` files are written incrementally; consumers may `tail -f` them. `.out` / `.err` pairs are allocated at `STEP_START` with monotonic per-run sequence numbers (`%06d-<safe_name>.out|.err`).
 
-- All parameters use `key="value"` format in parentheses. Internal refs (`::impl`) and empty values are omitted.
-- Positional parameters display as `1="value"`, `2="value"`. Named parameters display as `name="value"`.
-- Whitespace in values is collapsed to a single space. Values are truncated to 32 characters (with `...`).
-- Prompt steps show the backend name (or custom command basename) and a preview (first 24 characters of prompt text) in quotes: `prompt cursor "summarize the..."` or `prompt my-agent.sh "summarize the..."`, followed by parameters (capped at 96 characters total).
+### Failure footer
 
-Example lines:
+Interactive `jaiph run` only (`--raw` omits this block). On non-zero exit, the CLI emits a stderr footer with `Logs:`, `Summary:`, `out:` / `err:` paths, and an `Output of failed step:` excerpt. The fields are resolved from the last `STEP_END` object with non-zero `status` in `run_summary.jsonl`; `out_content` / `err_content` are preferred over `out_file` / `err_file`. In Docker mode, container-internal `/jaiph/run/*` paths are remapped to host paths.
 
-- `▸ workflow docs_page (1="docs/cli.md", 2="strict")`
-- `· prompt cursor (running 60s)`
-- `·   ▸ prompt cursor "${role} does ${task}" (role="engineer", task="Fix bugs")`
-- `·   ▸ script fib (1="3")`
-- `·   ▸ rule check_arg (1="Alice")`
+### Hook events
 
-If no parameters are passed, the line is unchanged (e.g. `▸ workflow default`). Disable color with `NO_COLOR=1`.
+Hooks load from `~/.jaiph/hooks.json` (global) and `<project>/.jaiph/hooks.json` (project-local; project overrides global per event). Hooks run on the **host** CLI process even in Docker mode. See [Add a hook](/how-to/hooks).
 
-**Async branch numbering.** When a workflow contains multiple `run async` steps, each branch is prefixed with a **subscript number** (₁₂₃…) at the async call site's indentation level. Numbers use Unicode subscript digits (U+2080–U+2089) and are assigned in **dispatch order** within the parent workflow (first `run async` = ₁, second = ₂, etc.). The subscript number is always rendered with a leading space (` ₁`, ` ₂`, ` ₁₂`) and in dim/grey (same style as `·` continuation markers); in non-TTY or `NO_COLOR` mode it is emitted without ANSI codes. Non-async lines (root workflow, final PASS/FAIL) have no prefix.
+## `jaiph test`
 
-If a nested workflow also uses `run async`, those branches get their own numbering scope at the nested indent level:
+Execute `*.test.jh` blocks using the same `NodeWorkflowRuntime` as `jaiph run`, in-process, with mock support.
 
 ```text
-workflow default
- ₁▸ workflow parallel_suite
- ₂▸ workflow lint_check
- ₁·  ₁▸ workflow test_unit
- ₁·  ₂▸ workflow test_integration
- ₁·  ₁✓ workflow test_unit (2s)
- ₁·  ₂✓ workflow test_integration (5s)
- ₁✓ workflow parallel_suite (5s)
- ₂✓ workflow lint_check (1s)
-
-✓ PASS workflow default (5s)
+jaiph test                            # discover all *.test.jh under the workspace root
+jaiph test <dir>                      # discover all *.test.jh recursively under <dir>
+jaiph test <file.test.jh>             # run a single test file
 ```
 
-All async branches render as siblings at the same indentation level. Inner steps within each branch appear one level deeper. The runtime isolates each async branch's frame stack, so `depth` on events is relative to the branch's own call depth. The `async_indices` array on events carries the chain of 1-based branch indices (one per nested `run async` level) so the display layer can map lines to branches.
+| Invocation | Workspace root detection |
+|---|---|
+| `jaiph test` | Walk up from `process.cwd()` until `.jaiph` or `.git`; falls back to `process.cwd()`. |
+| `jaiph test <dir>` | Walk up from the resolved `<dir>`. |
+| `jaiph test <file>` | Walk up from the test file's directory. |
 
-**Prompt transcript replay.** The progress renderer shows only ▸ / ✓ lines for a `prompt` step — not a nested subtree. After the step completes (on terminal stdout, non-test runs), the runtime replays the step's `.out` artifact if stdout was not already streamed live. Replay is skipped when stdout is a pipe or when the prompt already streamed via tee. `jaiph test` does not use this replay path.
+Zero matches with no arguments (or with a directory containing no `*.test.jh` files) writes `jaiph test: no *.test.jh files found (nothing to do)` to stderr and exits `0`. An explicit file path that does not exist or is not `*.test.jh` exits `1`. Plain workflow files (`*.jh` without `.test`) are not supported as test entries. Extra positional tokens after the path are accepted but ignored.
 
-To surface the agent answer inline in the tree, use `log` explicitly:
+Assertions: `expect_contain`, `expect_equal`, `expect_not_contain` — see [Write & run tests](/how-to/testing).
 
-```jaiph
-const response = prompt "Summarize the report"
-log response
-```
-
-### Failed run summary (stderr)
-
-On non-zero exit, the CLI may print a footer with the path to `run_summary.jsonl`, `out:` / `err:` artifact paths, and `Output of failed step:` plus a trimmed excerpt. These are resolved from the **last** `STEP_END` object in the summary with `status` != 0, using `out_content` / `err_content` when present and otherwise the `out_file` / `err_file` fields (last matches terminal failure after `catch`/`ensure` retries and stray earlier failures). If no failed `STEP_END` is found, the CLI falls back to a run-directory artifact heuristic.
-
-In Docker mode, artifact paths recorded by the container use container-internal prefixes (`/jaiph/run/…`). The CLI remaps these to host paths and discovers the run directory from the bind-mounted runs directory by matching the `JAIPH_RUN_ID` in each `run_summary.jsonl` when the container meta file is inaccessible. This run-id-based lookup is safe under concurrent `jaiph run` invocations sharing the same runs directory. The failure summary therefore displays identically to local (no-sandbox) runs — same structure, same host-resolvable paths, same "Output of failed step" excerpt. See [Sandboxing — Path remapping](sandboxing.md#path-remapping).
-
-### Run artifacts and live output
-
-Each run directory is `<JAIPH_RUNS_DIR>/<YYYY-MM-DD>/<HH-MM-SS>-<source>/`, where date and time are UTC and `<source>` is `JAIPH_SOURCE_FILE` if set, otherwise the entry file basename. Steps that allocate captures open **paired** `NNNNNN-<safe_name>.out` and `.err` files at **`STEP_START`** (see [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout) and [Runtime artifacts — What each artifact is for](artifacts.md#what-each-artifact-is-for)).
-
-Step **stdout** artifacts are written **incrementally during execution**, so you can tail a running step's output in real time:
+## `jaiph compile`
+{: #jaiph-compile}
 
-```bash
-# In one terminal — run a long workflow
-jaiph run ./flows/deploy.jh
+Parse modules and run `collectDiagnostics(graph)` — the same per-module validator as `jaiph run`, but collecting every recoverable error instead of stopping at the first — **without** writing `scripts/`, **without** calling `buildRuntimeGraph()`, and **without** spawning the workflow runner.
 
-# In another terminal — watch a step's output as it executes
-tail -f .jaiph/runs/2026-03-22/14-30-00-deploy.jh/000003-deploy__run_migrations.out
+```text
+jaiph compile [--json] [--workspace <dir>] <file.jh | directory> ...
 ```
 
-Which steps get numbered `.out`/`.err` pairs, how prompts differ from managed scripts, and when empty files are removed are spelled out in [Runtime artifacts](artifacts.md); the durable timeline either way is **`run_summary.jsonl`**.
-
-### Run summary (`run_summary.jsonl`) {#run-summary-jsonl}
-
-Each run directory also contains `run_summary.jsonl`: one JSON object per line, appended in execution order. It is the canonical append-only record of runtime events (lifecycle, logs, inbox flow, and step boundaries). Tooling can tail the file by byte offset and process new lines idempotently. For a single run, lines follow execution order; inbox routes always drain **sequentially**, so inbox lifecycle events stay aligned with dispatch order. Summary lines are still appended atomically under a lock shared with other concurrent writers on the same run directory (for example `run async` branches appending step events).
-
-**Versioning.** Every object includes `event_version` (currently `1`). New fields may be added; consumers should tolerate unknown keys.
-
-**Common fields.** All lines include `type`, `ts` (UTC timestamp), `run_id`, and `event_version`. Step-related types also carry `id`, `parent_id`, `seq`, and `depth` (matching the `__JAIPH_EVENT__` stream on stderr).
-
-**Correlation rules:**
-
-- **`run_id`:** same across all lines in a given run's file.
-- **Workflow boundaries:** for each workflow name, `WORKFLOW_START` count equals `WORKFLOW_END` count.
-- **Steps:** `STEP_START` and `STEP_END` share the same `id`. Use `parent_id`, `seq`, and `depth` to rebuild the tree.
-- **Inbox:** one `INBOX_ENQUEUE` per `send` with a unique `inbox_seq` (zero-padded, e.g. `001`). Each routed target gets one `INBOX_DISPATCH_START` and one `INBOX_DISPATCH_COMPLETE` sharing the same `inbox_seq`, `channel`, `target`, and `sender`.
-- **Ordering:** lines are valid JSONL (one object per line, atomic append). Inbox dispatch is sequential; `ts` order matches dispatch order for inbox lifecycle events on a single run.
-
-**Event taxonomy (schema `event_version` 1):**
-
-| Field | `WORKFLOW_START` | `WORKFLOW_END` | `STEP_START` | `STEP_END` | `LOG` | `LOGERR` | `INBOX_ENQUEUE` | `INBOX_DISPATCH_START` | `INBOX_DISPATCH_COMPLETE` |
-|-------|------------------|----------------|--------------|------------|-------|----------|-----------------|------------------------|---------------------------|
-| `type` | required | required | required | required | required | required | required | required | required |
-| `ts` | required | required | required | required | required | required | required | required | required |
-| `run_id` | required | required | required | required | required | required | required | required | required |
-| `event_version` | required (`1`) | required (`1`) | required (`1`) | required (`1`) | required (`1`) | required (`1`) | required (`1`) | required (`1`) | required (`1`) |
-| `workflow` | required (name) | required (name) | — | — | — | — | — | — | — |
-| `source` | required (basename or empty) | required (basename or empty) | — | — | — | — | — | — | — |
-| `func`, `kind`, `name` | — | — | required | required | — | — | — | — | — |
-| `status`, `elapsed_ms` (step) | — | — | null on start | required numbers when ended | — | — | — | — | — |
-| `out_file`, `err_file` | — | — | required strings | required strings | — | — | — | — | — |
-| `id`, `parent_id`, `seq`, `depth` | — | — | required | required | — | — | — | — | — |
-| `params` | — | — | optional JSON array | optional JSON array | — | — | — | — | — |
-| `dispatched`, `channel`, `sender` | — | — | optional (inbox dispatch) | optional (inbox dispatch) | — | — | — | — | — |
-| `out_content`, `err_content` | — | — | — | optional on `STEP_END` | — | — | — | — | — |
-| `async_indices` | — | — | optional `number[]` | optional `number[]` | optional `number[]` | optional `number[]` | — | — | — |
-| `message`, `depth` | — | — | — | — | required | required | — | — | — |
-| `inbox_seq`, `channel`, `sender` | — | — | — | — | — | — | required | required | required |
-| `payload_preview`, `payload_ref` | — | — | — | — | — | — | required | — | — |
-| `target` | — | — | — | — | — | — | — | required | required |
-| `status`, `elapsed_ms` (dispatch) | — | — | — | — | — | — | — | — | required (exit code and ms) |
-
-`PROMPT_START` / `PROMPT_END` (not in the table): include `backend`, optional `model`, optional `model_reason`, optional `status`, optional `preview`, `depth`, and optional `step_id` / `step_name` tying the prompt to the enclosing step frame. `model` is the resolved model name (or `null` when the backend auto-selects). `model_reason` is one of `explicit`, `flags`, or `backend-default` — see [Configuration — Model resolution](configuration.md#model-resolution).
-
-**Event semantics:**
-
-- **`WORKFLOW_START` / `WORKFLOW_END`:** mark entry and exit of a workflow body. `workflow` is the declared name; `source` is the `.jh` basename.
-- **`STEP_START` / `STEP_END`:** mirror stderr step events. `STEP_END` may include `out_content` / `err_content` (embedded artifact text, size-capped).
-- **`LOG` / `LOGERR`:** emitted by `log` / `logerr` keywords. `depth` is the step-stack depth. `message` is the shell string before `echo -e` expansion.
-- **`INBOX_ENQUEUE`:** recorded when a message is queued. `payload_preview` is UTF-8-safe JSON (up to 4096 bytes; truncated with `...`). `payload_ref` is `null` when the full body fits, otherwise a run-relative path.
-- **`INBOX_DISPATCH_START` / `INBOX_DISPATCH_COMPLETE`:** wrap one invocation of a route target. `status` is exit code; `elapsed_ms` is wall time.
-
-Together with step `.out` / `.err` files, `run_summary.jsonl` is enough to reconstruct the step tree, log timelines, inbox flow, and workflow boundaries.
-
-### Hooks
-
-You can run custom commands at workflow/step lifecycle events via hooks. Config lives in `~/.jaiph/hooks.json` (global) and `<project>/.jaiph/hooks.json` (project-local); project-local overrides global per event. See [Hooks](hooks.md) for schema, events, payload, and examples.
-
-## `jaiph test`
-
-Run tests from `*.test.jh` files that contain `test "..." { ... }` blocks. Test files can import workflows and use `mock prompt` to simulate agent responses without calling the real backend.
+At least one path is required. `-h` / `--help` must appear before the first path (they are not scanned after a path token, unlike other subcommands).
 
-The test runner uses the same Node workflow runtime as `jaiph run`. For each test file, the CLI runs **`buildScripts`** with that file as the **entrypoint** (the test module plus its **import closure** only — not every `*.jh` in the repo), so imported workflow modules get emitted scripts under `JAIPH_SCRIPTS`. It then builds the runtime graph **once** per file and reuses it across all blocks and `test_run_workflow` steps. Each block runs through the AST interpreter with mock support and assertion evaluation (`expect_contain`, `expect_equal`, `expect_not_contain`).
+| Argument shape | Behaviour |
+|---|---|
+| File path (`*.jh` or `*.test.jh`) | Expanded to the transitive import closure. Each module in the union is parsed and validated once. |
+| Directory path | Tree scanned for `*.jh` files; `*.test.jh` is **skipped** (use an explicit file path to validate a test module). Each non-test `*.jh` is treated as an entrypoint and its closure merged into the validation set. |
 
-**Usage:**
+| Flag | Effect |
+|---|---|
+| `--json` | On success, print `[]` to stdout. On failure, print one JSON array of `{ file, line, col, code, message }` diagnostics to stdout and exit `1`. |
+| `--workspace <dir>` | Override library resolution root for all reached modules. Without it, the workspace is auto-detected per path. |
 
-- `jaiph test` — discover and run all `*.test.jh` under the workspace root. The workspace root is found by walking up from the **current working directory** until a directory with `.jaiph` or `.git` is found; if neither exists, the current directory is used (same `detectWorkspaceRoot` algorithm as `jaiph run` / `jaiph install`).
-- `jaiph test <dir>` — run all `*.test.jh` files recursively under the given directory. Workspace root for script compilation is detected by walking up from **that directory** (resolved), not necessarily from your shell cwd.
-- `jaiph test <file.test.jh>` — run a single test file; workspace root is detected from the test file’s directory.
+Within each entry's import closure, diagnostics are sorted by `(file, line, col)`; when multiple entry points are supplied, those batches are appended in discovery order (not re-sorted globally). Without `--json`, the same set is written to stderr as `path:line:col CODE message` lines. Any non-empty diagnostic set exits `1`. Parser/loader failures abort the affected entry's closure with a single diagnostic for that entry; siblings continue.
 
-With no arguments, or with a directory that contains no test files, the command exits with status **1** and prints an error.
-
-Passing a plain workflow file (e.g. `say_hello.jh`) is not supported; the test file imports the workflow and declares mocks. Extra arguments after the path are accepted but ignored. See [Testing](testing.md) for test block syntax and assertions.
+## `jaiph format`
 
-**Examples:**
+Reformat `.jh` / `.test.jh` files into canonical style.
 
-```bash
-jaiph test
-jaiph test ./e2e
-jaiph test e2e/workflow_greeting.test.jh
-jaiph test e2e/say_hello.test.jh
+```text
+jaiph format [--check] [--indent <n>] <path.jh ...>
 ```
 
-## `jaiph compile`
+Paths must end with `.jh`. Formatting is idempotent. Comments and shebangs are preserved. Triple-quoted bodies, prompt blocks, and fenced script blocks emit verbatim — inner lines are not re-indented relative to the surrounding scope.
 
-Parse modules and run **`validateReferences`** (the same compile-time checks as before `jaiph run`) **without** writing `scripts/`, **without** calling **`buildRuntimeGraph`**, and **without** spawning the workflow runner. Use this for CI gates, pre-commit hooks, or editor diagnostics.
+| Flag | Argument | Default | Effect |
+|---|---|---|---|
+| `--indent` | `<n>` | `2` | Spaces per indent level. |
+| `--check` | — | — | Verify without writing. Exit `0` when files match canonical form, `1` when any file would change. |
 
-```bash
-jaiph compile [--json] [--workspace <dir>] <file.jh | directory> ...
-```
+Top-level ordering: the formatter hoists `import`, `config`, and `channel` declarations to the top (in that order, preserving relative source order within each group). Other top-level definitions (`const`, `rule`, `script`, `workflow`, `test`) keep their relative source order. Comments before a hoisted construct move with it; comments before non-hoisted definitions stay in place.
 
-At least one path is required. **`jaiph compile -h`** or **`jaiph compile --help`** prints command-specific usage and exits **0**.
+Top-level `const` quoting: the source delimiter is preserved per binding. Quoted values stay quoted; bare tokens stay bare; `"""…"""` values emit verbatim. The formatter does not toggle between styles based on value content.
 
-**File arguments** — Each `*.jh` file is expanded to its **transitive import closure**; every module in the union is parsed and validated once.
+Blank-line preservation: a single blank line between steps inside a workflow or rule body is preserved. Multiple consecutive blank lines collapse to one. Trailing blank lines before `}` are removed.
 
-**Directory arguments** — The tree is scanned for `*.jh` files whose basename is **not** `*.test.jh` (same rule as `walkjhFiles` in the transpiler: files like `foo.test.jh` are skipped). Each non-test `*.jh` under the tree is treated as an entrypoint and its closure merged into the same validation set. To validate a test module’s graph explicitly, pass that **`*.test.jh` file** as a path (directories never pick up `*.test.jh` as roots).
+## `jaiph init`
 
-**Flags:**
+```text
+jaiph init [workspace-path]
+```
 
-- **`--json`** — On success, print `[]` to stdout. On failure, print one JSON **array** of objects `{ "file", "line", "col", "code", "message" }` to stdout and exit **1** (non-JSON errors use a synthetic `E_COMPILE` object when the message is not in `file:line:col CODE …` form).
-- **`--workspace <dir>`** — Override the workspace root used for **library import resolution** (`<workspace>/.jaiph/libs/`, etc.) for **all** modules reached from the given paths. When omitted, the workspace is **auto-detected** from each path’s location (`detectWorkspaceRoot` — same algorithm as `jaiph run`, starting from the file’s directory or from a directory argument).
+Creates the following under the target workspace:
 
-## `jaiph format`
+| File | Content |
+|---|---|
+| `.jaiph/.gitignore` | Two-line file listing `runs` and `tmp`. If the file exists and does not match, the command exits non-zero. |
+| `.jaiph/bootstrap.jh` | Canonical bootstrap workflow; made executable. The body is a triple-quoted multiline `prompt` that asks the agent to scaffold workflows. |
+| `.jaiph/SKILL.md` | Copy of the skill markdown shipped with this `jaiph` build (see [`JAIPH_SKILL_PATH`](env-vars.md)). |
 
-Reformat Jaiph source files to a canonical style. Paths must end with **`.jh`**, which includes **`*.test.jh`** test modules. The formatter parses each file into an AST and re-emits it with consistent whitespace and indentation. Formatting is idempotent — running it twice produces the same output. Comments and shebangs are preserved. Multiline string bodies (`"""…"""`), prompt blocks, and fenced script blocks are emitted verbatim — inner lines are not re-indented relative to the surrounding scope, so repeated formatting never shifts embedded content deeper.
+SKILL.md resolution order: `JAIPH_SKILL_PATH` (if set and the path exists) → install-relative paths (`jaiph-skill.md` next to the package tree, then `docs/jaiph-skill.md` next to the package) → `docs/jaiph-skill.md` under the current working directory → the embedded copy baked into the binary. There is no "skip and warn" path; the file is always written.
 
-**Blank-line preservation:** A single blank line between steps inside a workflow or rule body is preserved — use it for visual grouping of related calls. Multiple consecutive blank lines are collapsed to one; trailing blank lines before `}` are removed. This applies to all block-level steps (calls, `log`, `const`, `if`, etc.).
+## `jaiph install`
 
-**Top-level ordering:** The formatter hoists `import`, `config`, and `channel` declarations to the top of the file (in that order, preserving source order within each group). All other top-level definitions — `const`, `rule`, `script`, `workflow`, and `test` blocks — keep their original relative order from the source file. Comments immediately before an `import`, `config`, or `channel` move with that construct when hoisted; comments before non-hoisted definitions stay in place.
+Install project-scoped libraries into `.jaiph/libs/<name>/` under the workspace root. The workspace root is detected from `process.cwd()` (`detectWorkspaceRoot` — walks up until `.jaiph` or `.git`, with temp-directory guards).
 
-```bash
-jaiph format [--check] [--indent <n>] <path.jh ...>
+```text
+jaiph install [--force] [<name[@version]> | <repo-url[@version]> ...]
+jaiph install [--force]                  # restore from lockfile
 ```
 
-One or more file paths are required (each path must end with `.jh`, e.g. `flow.jh` or `e2e/flow.test.jh`). Paths that do not end with `.jh` are rejected. If a file cannot be parsed, the command exits immediately with status 1 and a parse error on stderr.
+| Flag | Effect |
+|---|---|
+| `--force` | Delete and re-clone existing libraries. Accepted anywhere in the argument list. |
 
-**Flags:**
+### Argument classification
 
-- **`--indent <n>`** — spaces per indent level (default: `2`).
-- **`--check`** — verify formatting without writing. Exits 0 when all files are already formatted; exits 1 when any file needs changes, printing the file name to stderr. No files are modified in check mode.
+| Argument shape | Resolution |
+|---|---|
+| Bare registry name matching `^[A-Za-z0-9_-]+(@[A-Za-z0-9._+/-]+)?$` (no `/`, no `:`) | Looked up in the registry index. Examples: `jaiphlang`, `mylib@v1.2`. |
+| Anything else | Parsed as a git URL with optional trailing `@<version>`. Examples: `https://github.com/you/queue-lib.git`, `git@github.com:org/repo.git@main`. |
 
-**Examples:**
+### Post-clone hygiene
 
-```bash
-# Rewrite files in place
-jaiph format flow.jh utils.jh
+Each successful clone runs three checks before the lib counts as installed:
 
-# Check formatting in CI (non-zero exit on drift); ensure globs expand to real paths
-jaiph format --check src/**/*.jh
+- **`.jh` module check** — at least one `*.jh` file must exist under the clone (recursive, `.git` skipped). Failure removes the directory and aborts with `lib "<name>" contains no .jh modules — not a jaiph library?`. No lock entry written.
+- **Commit capture** — `git rev-parse HEAD` is recorded as the 40-char `commit` on the lock entry.
+- **`.git` strip** — `<libDir>/.git` is removed recursively.
 
-# Use 4-space indentation
-jaiph format --indent 4 flow.jh
-```
+### Restore-from-lockfile mode
 
-## `jaiph init`
+`jaiph install` with no positional args reads `.jaiph/libs.lock` and clones each entry. The registry is never contacted. If a lock entry carries a `commit`, the cloned HEAD must match it; on mismatch the directory is removed and the run fails with the locked vs cloned SHAs and the remedy. Lock entries without `commit` (older lockfiles) restore without the check.
 
-Initialize Jaiph files in a workspace directory.
+### Parallel clones
 
-```bash
-jaiph init [workspace-path]
-```
+Missing libraries are cloned with bounded concurrency (default **4 in flight**). The warm-skip pass runs before any clone. Independent clone failures still propagate; failed libraries are not added to the lockfile.
 
-Creates:
+### Registry
 
-- `.jaiph/.gitignore` — lists `runs` and `tmp`. If the file already exists and does not match this exact list, `jaiph init` exits with a non-zero status.
-- `.jaiph/bootstrap.jh` — canonical bootstrap workflow; made executable. The template uses a triple-quoted multiline prompt body (`prompt """ ... """`) so the generated file parses and compiles as valid Jaiph. It asks the agent to scaffold workflows under `.jaiph/` and ends by logging a summary (`WHAT CHANGED` + `WHY`). Docker sandboxing uses the default `ghcr.io/jaiphlang/jaiph-runtime` image unless you set `runtime.docker_image` or `JAIPH_DOCKER_IMAGE`.
-- `.jaiph/SKILL.md` — copied when the CLI can resolve a skill markdown file: if **`JAIPH_SKILL_PATH`** is set **and** that path exists, it wins; otherwise the CLI tries install-relative paths (`jaiph-skill.md` beside the packaged tree, then `docs/jaiph-skill.md` beside the package), then **`docs/jaiph-skill.md` under the current working directory**. If none of these exist, `SKILL.md` is not written and a note is printed.
+| Aspect | Value |
+|---|---|
+| Source | `JAIPH_REGISTRY` (default `https://jaiph.org/registry`). |
+| Loading | Loaded once per invocation when at least one positional argument is a bare name. URL-form installs and restore-from-lock never read the registry. |
+| Disk paths | Values without a `://` scheme, or starting with `file://`, are read from disk. Everything else is fetched via global `fetch`. |
+| Index format | `{ "libs": { "<name>": { "url": "<git-url>", "description": "<string>" } } }`. Each key must match `^[A-Za-z0-9_-]+$`. Unknown per-entry keys are accepted and ignored. |
+| Lookup errors | `lib "<name>" not found in registry <source>`, `failed to read registry <source>: <cause>`, `failed to fetch registry <source>: HTTP <status>`, `failed to parse registry <source>: <cause>`, `failed to parse registry <source>: invalid name "<name>"`. |
 
-## `jaiph install`
+### Lockfile
 
-Install project-scoped libraries. Libraries are git repos cloned into `.jaiph/libs/<name>/` under the **workspace root**. The workspace is determined from the **current working directory** (`detectWorkspaceRoot(process.cwd())` — walk upward until `.jaiph` or `.git`, with the same temp-directory guards as `jaiph run`). A lockfile (`.jaiph/libs.lock`) under that root tracks installed libraries for reproducible setups.
-
-```bash
-jaiph install [--force] <repo-url[@version]> ...
-jaiph install [--force]
-```
-
-**With arguments** — clone each repo into `.jaiph/libs/<name>/` (shallow: `--depth 1`) and upsert the entry in `.jaiph/libs.lock`. The library name is derived from the URL: last path segment, stripped of `.git` suffix (e.g. `github.com/you/queue-lib.git` → `queue-lib`). Version pinning is usually written as **`https://…/name.git@<tag-or-branch>`**; other URL shapes with a trailing **`@ref`** are also accepted when the parser can split URL and version unambiguously.
-
-**Without arguments** — restore all libraries from `.jaiph/libs.lock`. Useful after cloning a project or in CI. If the lockfile exists but lists **no** libraries, the command prints `No libs in lockfile.` and exits **0**.
-
-If `.jaiph/libs/<name>/` already exists, the library is skipped. Use **`--force`** (anywhere in the argument list) to delete and re-clone.
-
-**Lockfile format** (`.jaiph/libs.lock`):
+`.jaiph/libs.lock` shape:
 
 ```json
 {
   "libs": [
-    { "name": "queue-lib", "url": "https://github.com/you/queue-lib.git", "version": "v1.0" }
+    {
+      "name": "jaiphlang",
+      "url": "https://github.com/jaiphlang/jaiphlang.git",
+      "commit": "1a2b3c4d5e6f7890abcdef1234567890abcdef12"
+    },
+    {
+      "name": "queue-lib",
+      "url": "https://github.com/you/queue-lib.git",
+      "version": "v1.0",
+      "commit": "fedcba9876543210fedcba9876543210fedcba98"
+    }
   ]
 }
 ```
 
-**Examples:**
-
-```bash
-# Install a library
-jaiph install https://github.com/you/queue-lib.git
-
-# Install at a specific version
-jaiph install https://github.com/you/queue-lib.git@v1.0
-
-# Re-clone an existing library
-jaiph install --force https://github.com/you/queue-lib.git
-
-# Restore all libraries from lockfile
-jaiph install
-```
-
-After installation, import library modules using the `<lib-name>/<path>` convention:
-
-```jaiph
-import "queue-lib/queue" as queue
-```
-
-See [Grammar — Imports and Exports](grammar.md#imports-and-exports) for resolution rules.
+The lock entry stores the resolved clone URL so restore works without the registry. `commit` is written automatically after each successful clone.
 
 ## `jaiph use`
 
-Reinstall Jaiph globally with the selected channel or version.
+Reinstall `jaiph` globally with the selected channel or version.
 
-```bash
+```text
 jaiph use <version|nightly>
 ```
 
-- `nightly` — installs from the `nightly` ref.
-- `<version>` — installs tag `v<version>`.
-
-**Examples:**
-
-```bash
-jaiph use nightly
-jaiph use 0.9.4
-```
-
-## File extension
+| Argument | Effect |
+|---|---|
+| `nightly` | Reinstalls from the rolling `nightly` prerelease. |
+| `<version>` (e.g. `0.10.0`) | Reinstalls the release binary for tag `v<version>`. |
 
-**`.jh`** is the file extension for Jaiph source files. Use it for entrypoints, imports, and all CLI commands (`run`, `test`). Import resolution appends `.jh` when the path omits the extension.
+Implementation: re-invokes `JAIPH_INSTALL_COMMAND` (default `curl -fsSL https://jaiph.org/install | bash`) with `JAIPH_REPO_REF` set to `nightly` or `v<version>`. The installer downloads the matching per-platform binary plus `SHA256SUMS`, verifies the checksum, and replaces `~/.local/bin/jaiph` (or `JAIPH_BIN_DIR`).
 
 ## Environment variables
 
-### Runtime and config overrides
-
-These variables apply to `jaiph run` and workflow execution. Variables marked **internal** are set automatically — do not set them manually.
-
-**Internal variables:**
-
-- `JAIPH_META_FILE` — path to the run metadata file (under the CLI’s build output directory for that invocation). Set on the **detached workflow child** only; the parent strips any inherited value so leftover exports do not collide. The runner writes `run_dir=` / `summary_file=` lines for the host to read after exit.
-- `JAIPH_SOURCE_ABS` — absolute path to the entry `.jh` file; set by the CLI for **`jaiph run`** before spawn. Required by the runner (local and Docker).
-- `JAIPH_SCRIPTS` — directory containing emitted **`script`** files for this run; set after **`buildScripts()`**. Any **`JAIPH_SCRIPTS`** exported in the parent shell is cleared before launch so nested toolchains do not point at the wrong tree.
-- `JAIPH_RUN_DIR`, `JAIPH_RUN_ID`, `JAIPH_RUN_SUMMARY_FILE` — for a normal (**non-raw**) **`jaiph run`**, the host generates **`JAIPH_RUN_ID`** once per invocation (UUID), passes it through to the detached child (and into Docker when sandboxed), and Docker failure-path discovery can match summaries by this id. The runtime uses **`JAIPH_RUN_ID`** as the stable run identifier; if it is absent, the runtime may assign its own UUID. **`JAIPH_RUN_DIR`** and **`JAIPH_RUN_SUMMARY_FILE`** are set inside the runner once the UTC run directory exists.
-- `JAIPH_SOURCE_FILE` — set automatically by the CLI to the entry file **basename**. Used to name run directories (see [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout)).
-
-**Workspace and run paths:**
-
-- `JAIPH_WORKSPACE` — workspace root, set by the CLI. Detected by walking up from the entry `.jh` file's directory until `.jaiph` or `.git` is found. Guards in `detectWorkspaceRoot` skip misleading markers under shared system temp directories (`/tmp`, `/var/tmp`, macOS `/var/folders/.../T/...`) and nested `.jaiph/tmp` trees. In Docker sandbox mode the runtime remaps it inside the container (see [Sandboxing](sandboxing.md)).
-- `JAIPH_RUNS_DIR` — root directory for run logs. If unset in the environment, the CLI merges the entry module **`config`** field **`run.logs_dir`** (when present) into the spawned process environment; otherwise the default layout is `.jaiph/runs` under the workspace. Exporting **`JAIPH_RUNS_DIR` yourself locks that choice: in-file **`run.logs_dir`** cannot override an environment-provided value.
-
-**Agent and prompt configuration:**
+See [Environment variables](env-vars.md) for the complete inventory. The variables most relevant to CLI behaviour:
 
-- `JAIPH_AGENT_BACKEND` — prompt backend: `cursor` (default), `claude`, or `codex`. Overrides in-file `agent.backend`. When set to `claude`, the Anthropic Claude CLI must be on PATH. When set to `codex`, `OPENAI_API_KEY` must be set. See [Configuration](configuration.md).
-- `JAIPH_AGENT_MODEL` — default model for `prompt` steps (overrides in-file `agent.default_model`).
-- `JAIPH_AGENT_COMMAND` — command for the Cursor backend (e.g. `cursor-agent`; overrides in-file `agent.command`).
-- `JAIPH_AGENT_TRUSTED_WORKSPACE` — trusted workspace directory for Cursor backend `--trust`. Defaults to project root.
-- `JAIPH_AGENT_CURSOR_FLAGS` — extra flags for Cursor backend (string, split on whitespace).
-- `JAIPH_AGENT_CLAUDE_FLAGS` — extra flags for Claude backend (string, split on whitespace).
-- `OPENAI_API_KEY` — API key for the codex backend. Required when `agent.backend` is `"codex"`.
-- `JAIPH_CODEX_API_URL` — endpoint URL for the codex backend (default: `https://api.openai.com/v1/chat/completions`). Use this to point at a compatible proxy or self-hosted endpoint.
+- `JAIPH_DOCKER_ENABLED`, `JAIPH_UNSAFE`, `JAIPH_INPLACE`, `JAIPH_INPLACE_YES` — sandbox enablement and mode.
+- `JAIPH_DOCKER_IMAGE`, `JAIPH_DOCKER_NETWORK`, `JAIPH_DOCKER_TIMEOUT` — Docker mode parameters.
+- `JAIPH_NON_TTY_HEARTBEAT_FIRST_SEC`, `JAIPH_NON_TTY_HEARTBEAT_INTERVAL_MS` — non-TTY progress cadence.
+- `JAIPH_RUNS_DIR`, `JAIPH_WORKSPACE`, `JAIPH_SOURCE_FILE` — run-layout inputs.
+- `JAIPH_INSTALL_COMMAND`, `JAIPH_REGISTRY`, `JAIPH_SKILL_PATH` — install / init inputs.
+- `NO_COLOR` — disable ANSI colour output.
 
-**Execution behavior:**
+## Live and durable contracts
 
-- `JAIPH_DEBUG` — set to `true` for debug tracing.
-- `JAIPH_RECURSION_DEPTH_LIMIT` — maximum recursion depth for workflows and rules (default: **256**). Exceeding this limit produces a runtime error.
-- `NO_COLOR` — disables colored output.
+- **Live contract** (runtime → CLI): `__JAIPH_EVENT__` JSON lines on **stderr** only. Hooks and the interactive progress tree consume this stream. Stdout carries plain script output forwarded as-is.
+- **Durable contract**: `.jaiph/runs/...` + `run_summary.jsonl` + `.out` / `.err` step artifacts + optional `return_value.txt`. See [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout).
 
-**Non-TTY heartbeat:**
+`run_summary.jsonl` event types: `WORKFLOW_START`, `WORKFLOW_END`, `STEP_START`, `STEP_END`, `LOG`, `LOGERR`, `INBOX_ENQUEUE`, `INBOX_DISPATCH_START`, `INBOX_DISPATCH_COMPLETE`, `PROMPT_START`, `PROMPT_END`. Every object carries `type`, `ts` (UTC), `run_id`, and `event_version` (currently `1`). Step events also carry `id`, `parent_id`, `seq`, `depth`. See [Architecture — Contracts](architecture.md#contracts).
 
-- `JAIPH_NON_TTY_HEARTBEAT_FIRST_SEC` — seconds before the first heartbeat (default: `60`).
-- `JAIPH_NON_TTY_HEARTBEAT_INTERVAL_MS` — minimum milliseconds between subsequent heartbeats (default: `30000`; minimum `250`).
-
-**Docker sandbox** (`jaiph run` only — see [Sandboxing](sandboxing.md)):
-
-- **`JAIPH_UNSAFE`** — set to `true` to **disable** Docker when `JAIPH_DOCKER_ENABLED` is **unset** (run on the host). This is the supported “no container” escape hatch.
-- **`JAIPH_DOCKER_ENABLED`** — when set, must be exactly `true` to force Docker on, or any other value to force Docker **off**. When **unset**, Docker follows the unsafe rule above (on by default unless `JAIPH_UNSAFE=true`). `CI=true` does **not** change this default.
-- **`JAIPH_DOCKER_IMAGE`** — Docker image (overrides in-file `runtime.docker_image`). The image must already contain a `jaiph` binary; otherwise the run fails with `E_DOCKER_NO_JAIPH`. Defaults to the official GHCR runtime image (`ghcr.io/jaiphlang/jaiph-runtime:<version>`).
-- **`JAIPH_DOCKER_NETWORK`** — Docker network mode (overrides in-file `runtime.docker_network`).
-- **`JAIPH_DOCKER_TIMEOUT`** — execution timeout in seconds (overrides in-file `runtime.docker_timeout_seconds`).
-
-In-file `runtime.docker_enabled` is **not** supported (parse error); use the variables above instead.
-
-For overlay vs copy workspace mode, mounts, and stderr wiring, see [Sandboxing](sandboxing.md).
-
-### Install and `jaiph use`
+## File extension
 
-- `JAIPH_REPO_URL` — Git repo URL or local path for install script.
-- `JAIPH_REPO_REF` — ref used when installing; `jaiph use <version>` sets this to `v<version>` or `nightly` for nightly.
-- `JAIPH_BIN_DIR` — target bin directory (default: `$HOME/.local/bin`).
-- `JAIPH_LIB_DIR` — target lib directory (default: `$JAIPH_BIN_DIR/.jaiph`).
-- `JAIPH_INSTALL_COMMAND` — command run by `jaiph use` to reinstall (default: `curl -fsSL https://jaiph.org/install | bash`).
+`.jh` is the file extension for Jaiph source. Import resolution appends `.jh` when the path omits the extension. `*.test.jh` is the test-module convention recognised by `jaiph test` and file shorthand.
 
-### `jaiph init`
+## Related
 
-- `JAIPH_SKILL_PATH` — path to the skill markdown copied to `.jaiph/SKILL.md` when running `jaiph init`. The file **must exist** at this path; otherwise the variable is ignored and the CLI falls back to the same install-relative and `docs/jaiph-skill.md` (cwd) search described under [`jaiph init`](#jaiph-init).
+- [Configuration](configuration.md) — config keys, precedence, scoping.
+- [Grammar](grammar.md) — syntax and validation catalog.
+- [Language](language.md) — step semantics and step-output contract.
+- [Environment variables](env-vars.md) — every variable Jaiph reads.
diff --git a/docs/configuration.md b/docs/configuration.md
index e433b8f7..d1ba8de1 100644
--- a/docs/configuration.md
+++ b/docs/configuration.md
@@ -1,360 +1,276 @@
 ---
 title: Configuration
-permalink: /configuration
+permalink: /reference/configuration
+diataxis: reference
 redirect_from:
+  - /configuration
   - /configuration.md
 ---
 
 # Configuration
 
-When you need the same workflow sources to behave differently on different machines, you separate **what the graph does** (rules, `prompt` / `script` / `run`, channels) from **operational knobs**: which LLM backend to use, where to write run logs and debug output, and how the CLI chooses host vs. Docker. Jaiph keeps the language stable and pushes those choices into **configuration** — in-file `config` blocks, environment variables, and defaults in the tool. Inbox dispatch order is defined by the language (sequential drain of route targets — see [Inbox & Dispatch](inbox.md)); it is not a configuration toggle.
+This page is the authoritative inventory of Jaiph configuration keys: every key, its value type, default, environment-variable equivalent, and precedence. For environment-variable details (defaults, scopes, sandbox forwarding) see [Environment variables](env-vars.md). For the CLI flags that front-end the same knobs see [CLI](cli.md).
 
-All execution is interpreted by the Node workflow runtime (`NodeWorkflowRuntime`): the AST, managed scripts, prompts, channels, inbox, and `.jaiph/runs` artifacts (see [Architecture](architecture.md)). Configuration only adjusts that stack; it does not change the workflow language or the compile graph.
+Configuration sources, in priority order:
 
-`jaiph compile` parses each module in the import closure (same grammar as `emitScriptsForModule`), so **unknown `config` keys and wrong value types** surface as the same parse diagnostics as before `jaiph run`. With a **directory** argument it treats every non-test **`*.jh`** file in that directory as its own entrypoint (see `walkjhFiles` — `*.test.jh` is skipped unless you pass a test file explicitly) and validates each entry’s transitive imports. **`validateReferences` only** — no `scripts/` emission, no `buildRuntimeGraph()`, no runner spawn (see [Architecture](architecture.md#summary)). Runtime graph loading is parse-only; **compile-time** reference validation runs in the transpile path, not in `buildRuntimeGraph()`.
+1. **Environment variables** — locked once observed by the host CLI; see [Locked variables](#locked-variables).
+2. **Workflow-level `config { … }`** — applies for the duration of that workflow.
+3. **Module-level `config { … }`** — applies to all workflows in that file unless overridden.
+4. **Built-in defaults** — lowest priority.
 
-**Source of truth:** When this document and the implementation disagree, treat the source code as authoritative.
+Docker enablement uses a separate, env-only resolution; see [Docker enablement](#docker-enablement).
 
-## Three ways to configure
+## Config block syntax
 
-Jaiph provides three configuration mechanisms. When the same key is set in more than one place, the highest-priority source wins:
-
-1. **Environment variables** — highest priority. Includes `JAIPH_AGENT_*`, `JAIPH_RUNS_DIR`, `JAIPH_DEBUG`, `JAIPH_DOCKER_ENABLED`, other `JAIPH_DOCKER_*`, and `JAIPH_UNSAFE` (for Docker on/off, see [Sandboxing — Enabling Docker](sandboxing.md#enabling-docker)). Docker **enablement** is only controlled here — there is no `runtime.*` in-file key for that (removed; using it is a parse error with a migration message).
-2. **In-file `config { ... }` blocks** — at module scope and optionally inside a `workflow` body.
-3. **Built-in defaults** — lowest priority, used when nothing else sets a value.
-
-For **agent and run keys**, the full precedence chain is:
-
-> **environment > workflow-level config > module-level config > defaults**
-
-`run.recover_limit` is an exception: only **module-level** values affect `run … recover` (see [Run keys](#run-keys)).
-
-For **`runtime.*` (image, network, timeout)**, the host CLI merges them when it **may spawn Docker** (`resolveDockerConfig` in `src/runtime/docker.ts`) — not inside `NodeWorkflowRuntime`. Precedence is **`JAIPH_DOCKER_*` environment > module-level `runtime.*` > defaults** (Docker on/off remains env-only, see above and [Precedence in detail](#precedence-in-detail)). A **host** invocation of **`jaiph run --raw`** skips that driver entirely and always runs the workflow runner **locally** (no container); **`runtime.*` is unused on that path**. Sandboxed workflows still run `jaiph run --raw …` **inside** the container. `runtime.*` cannot appear in workflow-level `config` blocks.
-
-## In-file config blocks
-
-### Module-level config
-
-Each `*.jh` file may have **at most one** module-level `config { ... }` block. It is optional. Settings apply to all workflows in **that** file, unless a workflow has its own block.
-
-**`jaiph run`:** the CLI reads **only the entry file’s** module `config` when it builds the initial process environment via `resolveRuntimeEnv` (before spawning the workflow runner or Docker). Imported modules’ module-level `config` is not merged into that first env snapshot — but the runtime still applies per-module and workflow `config` from the [import graph](architecture.md#summary) when you enter a workflow, run a nested `run` in the same module, or `ensure` a rule (see [Scoping across nested calls](#scoping-across-nested-calls)). **Cross-module** `run` and **same-module** `ensure` are special cases, explained there.
-
-```jh
-config {
-  agent.default_model = "gpt-4"
-  agent.backend = "claude"
-  agent.claude_flags = "--model sonnet-4"
-  run.logs_dir = ".jaiph/runs"
-  run.debug = false
-}
-
-script noop = `true`
-
-rule some_rule() {
-  run noop()
-}
-
-workflow default() {
-  ensure some_rule()
-}
-```
-
-**Syntax rules:**
-
-- The opening line is `config` and `{` with only optional whitespace between them (and nothing else on that line before `{`).
-- One module-level config block per file. A duplicate causes `E_PARSE`: `duplicate config block (only one allowed per file)`.
-- May appear at any position among top-level constructs; convention is near the top.
-- Unknown keys cause `E_PARSE` and list the allowed keys. Wrong value types also cause `E_PARSE`.
-
-### Workflow-level config
-
-A `config { ... }` block inside a `workflow { ... }` body overrides module-level **agent** and **run** keys for that workflow only. This is useful when different workflows in the same file need different models or backends.
-
-```jh
-config {
-  agent.backend = "cursor"
-  agent.default_model = "gpt-3.5"
-}
-
-script noop = `true`
-
-rule some_rule() {
-  run noop()
-}
-
-workflow fast_check() {
-  config {
-    agent.backend = "claude"
-    agent.default_model = "gpt-4"
-  }
-  ensure some_rule()
-}
-
-workflow default() {
-  # Uses module-level config (cursor / gpt-3.5).
-  ensure some_rule()
-}
-```
-
-**Rules:**
-
-- At most one per workflow; it must be the first non-comment construct in the body. A duplicate is `E_PARSE`: `duplicate config block inside workflow (only one allowed per workflow)`.
-- Only **`agent.*` and `run.*` keys** are allowed. Any `runtime.*` or `module.*` key is `E_PARSE`.
-- Workflow-level values apply to all steps in that workflow, including `ensure`d rules and scripts called from it, for **`agent.*`** and **`run.logs_dir`** / **`run.debug`** (merged when the workflow or cross-module `ensure` runs). **`run.recover_limit` is different:** the retry limit for `run … recover` comes only from the **module-level** `config` of the **`.jh` file that owns the current scope** when the step runs; a workflow-level `run.recover_limit` assignment is valid syntax but does **not** change recover behavior today.
-- When the workflow finishes, the previous environment is restored.
-
-**Sibling isolation:** Each workflow gets its own clone of the parent environment. Sibling workflows never see each other's config — even when they execute sequentially. If workflow `alpha` sets `agent.backend = "claude"` and workflow `beta` only sets `agent.default_model = "beta-model"`, `beta` still sees the module-level backend (e.g. `"cursor"`), not `alpha`'s.
+| Aspect | Rule |
+|---|---|
+| Module-level | At most one `config { … }` block per `.jh` file. May appear anywhere among top-level constructs. |
+| Workflow-level | At most one nested `config { … }` per workflow body. Must be the first non-comment construct in the body. |
+| Allowed module keys | `agent.*`, `run.*`, `runtime.*`, `module.*`. |
+| Allowed workflow keys | `agent.*`, `run.*` only. `runtime.*` and `module.*` are `E_PARSE`. |
+| Duplicate block | `E_PARSE duplicate config block (only one allowed per file)` / `E_PARSE duplicate config block inside workflow (only one allowed per workflow)`. |
+| Unknown key | `E_PARSE unknown config key: <key>. Allowed: …` (lists every allowed key). |
+| Wrong value type | `E_PARSE`. |
 
 ### Value syntax
 
 | Type | Format | Example |
-|------|--------|---------|
-| String | Double-quoted | `"gpt-4"` |
-| Boolean | Unquoted `true` / `false` | `true` |
-| Integer | Unsigned decimal digits only | `300` |
-Recognized escapes inside strings: `\\`, `\n`, `\t`, `\"`.
-
-## Config keys reference
-
-### Agent keys
+|---|---|---|
+| String | Double-quoted; supports `\\`, `\n`, `\t`, `\"` | `"gpt-4"` |
+| Boolean | Bare `true` / `false` | `true` |
+| Integer | Unsigned decimal digits | `300` |
 
-These control how `prompt` steps reach the LLM.
+## Agent keys
 
-| Key | Type | Default | Env variable | Description |
-|-----|------|---------|--------------|-------------|
-| `agent.default_model` | string | _(unset)_ | `JAIPH_AGENT_MODEL` | Default model for `prompt` steps. |
-| `agent.command` | string | `cursor-agent` | `JAIPH_AGENT_COMMAND` | Command line for the cursor backend. First token is the executable; the rest are leading arguments. When the command is not `cursor-agent`, Jaiph treats it as a [custom agent command](#custom-agent-commands) — prompt text is piped via stdin and raw stdout is captured. |
-| `agent.backend` | string | `cursor` | `JAIPH_AGENT_BACKEND` | `"cursor"`, `"claude"`, or `"codex"`. See [Backend selection](#backend-selection). |
-| `agent.trusted_workspace` | string | workspace root | `JAIPH_AGENT_TRUSTED_WORKSPACE` | Directory passed to Cursor (`--trust`). Relative paths are resolved against the workspace root at CLI launch. |
-| `agent.cursor_flags` | string | _(unset)_ | `JAIPH_AGENT_CURSOR_FLAGS` | Extra flags appended for the cursor backend (split on whitespace). |
-| `agent.claude_flags` | string | _(unset)_ | `JAIPH_AGENT_CLAUDE_FLAGS` | Extra flags appended for the claude backend (split on whitespace). |
+| Key | Type | Default | Env equivalent | Notes |
+|---|---|---|---|---|
+| `agent.default_model` | string | — | `JAIPH_AGENT_MODEL` | Default model for `prompt` steps. Applies to all backends. |
+| `agent.command` | string | `cursor-agent` | `JAIPH_AGENT_COMMAND` | Cursor backend command. Basename other than `cursor-agent` enables custom-command mode (stdin → command → stdout). |
+| `agent.backend` | string (`cursor` \| `claude` \| `codex`) | `cursor` | `JAIPH_AGENT_BACKEND` | Backend selector. |
+| `agent.trusted_workspace` | string (path) | workspace root | `JAIPH_AGENT_TRUSTED_WORKSPACE` | Directory passed to Cursor as `--trust`. When unset, defaults to `JAIPH_WORKSPACE`. In-file values are assigned to the env var as authored (relative paths are not normalized to absolute paths). |
+| `agent.cursor_flags` | string | — | `JAIPH_AGENT_CURSOR_FLAGS` | Extra flags appended to Cursor invocations (whitespace-split). |
+| `agent.claude_flags` | string | — | `JAIPH_AGENT_CLAUDE_FLAGS` | Extra flags appended to Claude invocations (whitespace-split). |
 
-### Run keys
+## Run keys
 
-These control runtime behavior unrelated to the agent.
+| Key | Type | Default | Env equivalent | Notes |
+|---|---|---|---|---|
+| `run.logs_dir` | string (path) | `.jaiph/runs` | `JAIPH_RUNS_DIR` | Step log directory. Relative paths join the workspace root; absolute paths are used as-is. |
+| `run.debug` | boolean | `false` | `JAIPH_DEBUG` | Enable debug tracing. |
+| `run.recover_limit` | integer | `10` | — (no env override) | Maximum attempts for `run … recover` loops before the step fails. Resolves via workflow > module > default. |
 
-| Key | Type | Default | Env variable | Description |
-|-----|------|---------|--------------|-------------|
-| `run.logs_dir` | string | `.jaiph/runs` | `JAIPH_RUNS_DIR` | Step log directory. Relative paths are joined with the workspace root; absolute paths are used as-is. |
-| `run.debug` | boolean | `false` | `JAIPH_DEBUG` | Enables debug tracing for the run. |
-| `run.recover_limit` | integer | `10` | _(no env override)_ | Maximum attempts for `run … recover` loops before the step fails (see [Language — `recover`](language.md#recover--repair-and-retry-loop)). Effective value comes **only** from the **module-level** `config` block of the **`.jh` file that owns the current scope** (the file containing the workflow or rule that executes the step). Workflow-level `run.recover_limit` does not apply. |
+## Module keys
 
-### Module keys
+Informational metadata only; does not affect execution. Allowed in module-level config only — any `module.*` key inside a workflow-level config is `E_PARSE`.
 
-Optional descriptive metadata about the workflow module. These are informational only — they do not affect agent, run, or runtime behavior. Future features (e.g. MCP tool metadata) may consume them.
+| Key | Type | Default |
+|---|---|---|
+| `module.name` | string | — |
+| `module.version` | string | — |
+| `module.description` | string | — |
 
-| Key | Type | Default | Description |
-|-----|------|---------|-------------|
-| `module.name` | string | _(unset)_ | Human-readable name for this module. |
-| `module.version` | string | _(unset)_ | Version string (no validation — any quoted string is accepted). |
-| `module.description` | string | _(unset)_ | Short description of what this module does. |
+## Runtime (Docker) keys
 
-Module keys can only appear in **module-level** config blocks. Any `module.*` key inside a workflow-level config is `E_PARSE`.
+These configure the Docker sandbox. Allowed in **module-level** config only. They are read by the host CLI when it considers a Docker launch (`resolveDockerConfig` in `src/runtime/docker.ts`) and never affect `NodeWorkflowRuntime` directly. **Docker on/off is not a `runtime.*` key** — see [Docker enablement](#docker-enablement).
 
-```jh
-config {
-  module.name = "deploy-pipeline"
-  module.version = "2.0.0"
-  module.description = "Production deployment with rollback"
-  agent.backend = "claude"
-}
+| Key | Type | Default | Env equivalent | Notes |
+|---|---|---|---|---|
+| `runtime.docker_image` | string | `ghcr.io/jaiphlang/jaiph-runtime:<version>` | `JAIPH_DOCKER_IMAGE` | Container image. Must already contain `jaiph` (`E_DOCKER_NO_JAIPH` otherwise). |
+| `runtime.docker_network` | string | `default` | `JAIPH_DOCKER_NETWORK` | `docker run --network` value. `none` disables egress. |
+| `runtime.docker_timeout_seconds` | integer | `14400` | `JAIPH_DOCKER_TIMEOUT` | Container execution timeout in seconds. `0` disables. Negative or invalid env value produces `E_DOCKER_TIMEOUT`. |
 
-workflow default() {
-  log "deploying..."
-}
-```
+In-file `runtime.docker_enabled` is not supported (`E_PARSE`); use the env-only enablement below.
 
-### Runtime keys (Docker sandbox — beta)
+## Docker enablement
 
-These configure Docker sandboxing. Unlike agent and run keys, they are read when the CLI considers a **Docker launch** for interactive **`jaiph run`** (`src/cli/commands/run.ts` → `spawnExec`). They never affect **`NodeWorkflowRuntime`** directly. They can only appear in **module-level** config blocks (not workflow-level).
+| Check | Result |
+|---|---|
+| `JAIPH_DOCKER_ENABLED` is set to exact `true` | Docker on. |
+| `JAIPH_DOCKER_ENABLED` is set to any other value | Docker off. |
+| `JAIPH_DOCKER_ENABLED` is unset and `JAIPH_UNSAFE=true` | Docker off. |
+| Default (no env) | Docker on. |
 
-> Docker sandboxing is in **beta**. See [Sandboxing](sandboxing.md) for mounts, workspace layout, env forwarding, path remapping, and container behavior.
+`CI=true` does not change this default. Host `jaiph run --raw` never consults this branch — the workflow runner is local in that path. See [Sandboxing](sandboxing.md) for the full model.
 
-> **Host `--raw`:** If you run **`jaiph run --raw`** yourself on the host, the CLI does not enter the Docker branch; image/network/timeout merge is irrelevant for that invocation. Embedding and container flows use **`--raw` inside** the sandbox where the CLI has already picked the image — see [Architecture](architecture.md#sequence-diagram-regular-flow-jh).
+## Precedence
+{: #precedence}
 
-| Key | Type | Default | Env variable | Description |
-|-----|------|---------|--------------|-------------|
-| `runtime.docker_image` | string | `ghcr.io/jaiphlang/jaiph-runtime:<version>` | `JAIPH_DOCKER_IMAGE` | Image name. Must already contain `jaiph`. When unset, uses the official GHCR image tag matching the installed jaiph version. For a custom image, build and push (or tag locally), then set this key or `JAIPH_DOCKER_IMAGE`. |
-| `runtime.docker_network` | string | `default` | `JAIPH_DOCKER_NETWORK` | Docker network mode. |
-| `runtime.docker_timeout_seconds` | integer | `3600` | `JAIPH_DOCKER_TIMEOUT` | Timeout in seconds (default one hour). Use `0` to disable. An invalid or negative **environment** value aborts the run with `E_DOCKER_TIMEOUT` (no silent fallback). In-file must be a non-negative integer. |
+### Agent and run keys
 
-## Precedence in detail
+| Layer | Effect |
+|---|---|
+| Environment (`JAIPH_AGENT_*`, `JAIPH_RUNS_DIR`, `JAIPH_DEBUG`) | Locked when present in the parent env; cannot be overridden by module- or workflow-level config. |
+| Workflow-level `config` | Applies for the workflow body; restored on exit. |
+| Module-level `config` | Applies to workflows without their own block. |
+| Built-in defaults | Lowest priority. |
 
-### Resolution order
+### Runtime (Docker) keys
 
-For **agent and run keys**, resolution order (highest wins):
+| Layer | Effect |
+|---|---|
+| Environment (`JAIPH_DOCKER_*`) | Highest priority for `image`, `network`, `timeout`. |
+| Module-level `config` (`runtime.*`) | Applies when no env override is set. |
+| Built-in defaults | Lowest priority. |
 
-1. **Environment** — `JAIPH_AGENT_*`, `JAIPH_RUNS_DIR`, `JAIPH_DEBUG`. When set, these lock the value for the entire process (see [Locked variables](#locked-variables)).
-2. **Workflow-level `config`** — overrides module values for the duration of that workflow.
-3. **Module-level `config`** — applies to workflows that don't define their own block.
-4. **Built-in defaults.**
-
-For **Docker enablement** on **interactive** **`jaiph run`** (no `--raw` on the host), the CLI uses **`JAIPH_DOCKER_ENABLED` env > unsafe default rule** (env only; `runtime.docker_enabled` is no longer supported). The default rule enables Docker unless `JAIPH_UNSAFE=true` is set; `CI=true` no longer disables Docker (see [Sandboxing — Enabling Docker](sandboxing.md#enabling-docker)). **Host** **`jaiph run --raw`** never consults this branch. For other `runtime.*` keys (image, network, timeout), the merge is **`JAIPH_DOCKER_*` env > module-level `runtime.*` > defaults** whenever Docker launch is considered. Workflow-level config cannot set runtime keys.
-
-### Locked variables
-
-When `jaiph run` builds the runner environment, any of these environment variables already present in `process.env` gets a matching `${NAME}_LOCKED` flag set to `"1"`:
-
-`JAIPH_AGENT_MODEL`, `JAIPH_AGENT_COMMAND`, `JAIPH_AGENT_BACKEND`, `JAIPH_AGENT_TRUSTED_WORKSPACE`, `JAIPH_AGENT_CURSOR_FLAGS`, `JAIPH_AGENT_CLAUDE_FLAGS`, `JAIPH_RUNS_DIR`, `JAIPH_DEBUG`
-
-Locked values cannot be overridden by module-level or workflow-level config — they are authoritative for the entire process. This is how environment variables always win in the precedence chain.
+Workflow-level `config` cannot set `runtime.*` keys.
 
 ### Scoping across nested calls
 
-When workflows call into other workflows, the config scope depends on the call type:
-
-| Call type | What happens |
-|-----------|-------------|
-| **Root entry** (`jaiph run file.jh`) | Full module + workflow metadata is applied (normal precedence). |
-| **Same-module `run`** | Callee's workflow-level `config` is layered on top of the caller's effective env. Module-level config is not re-applied. |
-| **Cross-module `run`** (e.g. `run alias.default`) | Caller's effective env carries as-is. Callee's module and workflow config are ignored. The caller's scope wins. |
+| Call type | Scope behaviour |
+|---|---|
+| Root entry (`jaiph run file.jh`) | Full module + workflow metadata applied with normal precedence. |
+| Same-module `run` | Callee's workflow-level `config` is layered on top of the caller's effective env. Module-level config is not re-applied. |
+| Cross-module `run` (e.g. `run alias.default()`) | Callee's module-level config is layered, then workflow-level on top — same as root-entry precedence, respecting `${NAME}_LOCKED`. |
+| Same-module `ensure` | Caller's scope is reused verbatim. |
+| Cross-module `ensure` | Callee module's `agent.*` / `run.*` are merged on top of the current env (respecting locks). Workflow-level config does not apply to rules. |
 
 After any nested call returns, the caller's scope is restored exactly as before.
 
-### `ensure` and cross-module rules
-
-When you `ensure` a rule from **another** module, the runtime merges that module's module-level `config` (`agent.*` / `run.*`) on top of the current environment (respecting locks). Workflow-level config does not apply to rules.
+## Locked variables
+{: #locked-variables}
 
-**Same-module** `ensure` keeps the caller's environment as-is, so workflow-level overrides stay in place.
+When the host CLI builds the runner environment, any of these variables already present in `process.env` gets a matching `${NAME}_LOCKED=1` flag set on the child env. The runtime refuses to overwrite a locked value from later metadata merges.
 
-## Backend selection
+Locked names: `JAIPH_AGENT_BACKEND`, `JAIPH_AGENT_MODEL`, `JAIPH_AGENT_COMMAND`, `JAIPH_AGENT_TRUSTED_WORKSPACE`, `JAIPH_AGENT_CURSOR_FLAGS`, `JAIPH_AGENT_CLAUDE_FLAGS`, `JAIPH_RUNS_DIR`, `JAIPH_DEBUG`.
 
-`prompt` steps use one of three backends:
+## Config-to-env mapping
 
-- **cursor** (default) — runs `agent.command` (default `cursor-agent`) with stream-json output.
-- **claude** — runs `claude` on `PATH`. If the executable is missing, Jaiph reports an error and exits.
-- **codex** — calls the OpenAI Chat Completions API directly via HTTP. Requires `OPENAI_API_KEY` in the environment. If the key is missing, Jaiph reports an actionable error and exits.
+| In-file key | Environment variable |
+|---|---|
+| `agent.default_model` | `JAIPH_AGENT_MODEL` |
+| `agent.command` | `JAIPH_AGENT_COMMAND` |
+| `agent.backend` | `JAIPH_AGENT_BACKEND` |
+| `agent.trusted_workspace` | `JAIPH_AGENT_TRUSTED_WORKSPACE` |
+| `agent.cursor_flags` | `JAIPH_AGENT_CURSOR_FLAGS` |
+| `agent.claude_flags` | `JAIPH_AGENT_CLAUDE_FLAGS` |
+| `run.logs_dir` | `JAIPH_RUNS_DIR` |
+| `run.debug` | `JAIPH_DEBUG` |
+| `run.recover_limit` | _(no env override)_ |
+| `runtime.docker_image` | `JAIPH_DOCKER_IMAGE` |
+| `runtime.docker_network` | `JAIPH_DOCKER_NETWORK` |
+| `runtime.docker_timeout_seconds` | `JAIPH_DOCKER_TIMEOUT` |
+| `module.name` | _(no env override)_ |
+| `module.version` | _(no env override)_ |
+| `module.description` | _(no env override)_ |
 
-Backend-specific flags come from `agent.cursor_flags` / `agent.claude_flags` (or the matching env vars). The codex backend has no CLI flags; configure it with `OPENAI_API_KEY` and optionally `JAIPH_CODEX_API_URL` (defaults to `https://api.openai.com/v1/chat/completions`). There is no per-`prompt` backend override; the effective backend is whatever the config stack resolves to when the step runs.
+Variables with no in-file equivalent: `JAIPH_CODEX_API_URL` (codex endpoint), `JAIPH_PROMPT_RETRY` / `JAIPH_PROMPT_RETRY_DELAYS` (prompt-retry schedule), `OPENAI_API_KEY` (codex credential). Full inventory in [Environment variables](env-vars.md).
 
-### Custom agent commands
+## Backend selection
+{: #backend-selection}
 
-Only the **cursor** backend consults **`agent.command`**. For **`claude`** and **`codex`**, Jaiph always invokes the Claude CLI or the Codex HTTP path (`prompt.ts`), regardless of `agent.command`.
+| Backend | Required credential | Endpoint / CLI |
+|---|---|---|
+| `cursor` (default) | `CURSOR_API_KEY` (or stored `cursor-agent login` on host runs) | Runs `agent.command` (default `cursor-agent`) with `stream-json` framing. |
+| `claude` | `ANTHROPIC_API_KEY` **or** `CLAUDE_CODE_OAUTH_TOKEN` (or stored Claude CLI login on host runs) | Runs `claude` on `PATH`. |
+| `codex` | `OPENAI_API_KEY` | Calls the OpenAI Chat Completions endpoint directly (`JAIPH_CODEX_API_URL` overrides the URL). No CLI-login fallback. |
 
-When **`agent.backend` is `cursor`** (the default) and `agent.command`’s basename is anything other than `cursor-agent`, Jaiph treats it as a **custom agent command**. That lets you use a shell script, Python wrapper, or other CLI as a prompt backend — no need to implement the `stream-json` protocol.
+Backend-specific flags come from `agent.cursor_flags` / `agent.claude_flags` (or the matching env vars). There is no per-`prompt` backend override.
 
-**How it works:**
+### Credential pre-flight
+{: #credential-pre-flight}
 
-1. Jaiph pipes the prompt text to the command's **stdin**.
-2. The command's **stdout** is captured as the prompt response (raw text, no JSON framing).
-3. **stderr** passes through to the terminal.
-4. No cursor-specific flags (`--output-format`, `--stream-partial-output`, `--workspace`, etc.) are appended.
+Before `jaiph run` spawns the workflow runner or Docker container, the host CLI runs a credential pre-flight (`src/cli/run/preflight-credentials.ts`). It collects the distinct backend(s) declared in the entry file's module-level `config` block and each workflow-level block, plus the effective default (`JAIPH_AGENT_BACKEND` env, or `cursor` when unset). Deeper per-import overrides resolved at runtime are not followed.
 
-**Display:** The run tree shows the command's basename as the step name — e.g., `prompt echo-wc.sh "..."` instead of `prompt cursor "..."`.
+| Backend | Required credential | Host run (no Docker) | Docker run (any mode incl. `inplace`) |
+|---|---|---|---|
+| `codex` | `OPENAI_API_KEY` | hard error (`E_AGENT_CREDENTIALS`) | hard error (`E_AGENT_CREDENTIALS`) |
+| `claude` | `ANTHROPIC_API_KEY` or `CLAUDE_CODE_OAUTH_TOKEN` | warn (CLI login may still work) | hard error (`E_AGENT_CREDENTIALS`) |
+| `cursor` | `CURSOR_API_KEY` | warn (CLI login may still work) | hard error (`E_AGENT_CREDENTIALS`) |
 
-```jh
-config {
-  agent.command = "./agents/my-agent.sh"
-}
+Hard errors exit non-zero with no runner or container launched. Warnings go to stderr and the run proceeds. Skip cases: entry file declares no explicit backend and uses no `prompt` step → no pre-flight; `jaiph run --raw` → no pre-flight; `JAIPH_UNSAFE=true` / `--unsafe` → no pre-flight (host escape hatch — runtime backend guards remain).
 
-workflow default() {
-  answer = prompt "Summarize this codebase"
-  log "${answer}"
-}
-```
+Every error and warning names: the backend; the model when `agent.default_model` is set; the entry `.jh` file; the config scope (`module config`, `workflow <name>`, `JAIPH_AGENT_BACKEND env`, or `default`); and the concrete remedy. Docker-mode messages also note that the variable must be set on the host so it gets forwarded.
 
-The custom agent script just reads stdin and prints its answer:
+## Model resolution
+{: #model-resolution}
 
-```bash
-#!/usr/bin/env bash
-input=$(cat)
-# ... process the input ...
-echo "Here is my summary: ..."
-```
+Resolution order for a `prompt` step:
 
-Custom commands still participate in the normal prompt lifecycle — `PROMPT_START` / `PROMPT_END` events are emitted, artifacts are written, and `returns` schema validation applies to the captured output.
+| Step | Source | Notes |
+|---|---|---|
+| 1 | Explicit model — `agent.default_model` / `JAIPH_AGENT_MODEL` non-empty. | `model_reason: explicit`. |
+| 2 | Flags model — `--model <name>` inside `agent.cursor_flags` / `agent.claude_flags`. | `model_reason: flags`. Codex has no flag channel; this step does not apply. |
+| 3 | Backend default — Cursor/Claude binaries pick their own. Codex defaults to `gpt-4o` in code. | `model_reason: backend-default`. |
 
-### Codex setup
+For the Claude backend, when `agent.default_model` is set and `agent.claude_flags` does not already contain `--model`, Jaiph passes `--model <value>` to the Claude CLI automatically. If both are set, the value in `agent.claude_flags` wins (appended last).
 
-```jh
-config {
-  agent.backend = "codex"
-  agent.default_model = "gpt-4o"
-}
+`PROMPT_START` / `PROMPT_END` records in `run_summary.jsonl` carry `model` (resolved string, or null when backend auto-selects) and `model_reason`.
 
-workflow default() {
-  prompt "Explain this codebase"
-}
-```
+## Prompt retry on transport failure
+{: #prompt-retry-on-transport-failure}
 
-Set the API key in your environment:
+`NodeWorkflowRuntime` retries transport-failed prompt invocations on an escalating backoff schedule before propagating the failure to any enclosing `recover` / `catch`.
 
-```bash
-export OPENAI_API_KEY="sk-..."
-jaiph run main.jh
-```
+| Attempt | Delay before this attempt |
+|---|---|
+| 1 | _(none — initial call)_ |
+| 2 | 15s |
+| 3 | 1m |
+| 4 | 10m |
+| 5 | 30m |
+| 6 | 2h |
 
-The codex backend streams responses from the OpenAI API and supports structured `returns` schemas like the other backends. The default model is `gpt-4o` when `agent.default_model` is not set. To use a custom-compatible endpoint, set `JAIPH_CODEX_API_URL`.
+Total worst-case wall-clock: ~2h41m. Under Docker, `runtime.docker_timeout_seconds` caps this.
 
-### Model resolution
+Only transport failures are retried (non-zero exit from cursor/claude, codex HTTP error, spawn failure). Deterministic post-processing failures — invalid JSON, schema validation — fail on the first attempt and return `{ ok: false }`.
 
-When a `prompt` step runs, Jaiph resolves the effective model using this order:
+Each attempt emits its own `PROMPT_START` / `PROMPT_END` and `STEP_START` / `STEP_END`. Each failure logs a `LOGERR` line; the final termination logs another. The captured value reflects the successful attempt.
 
-1. **Explicit model** — `agent.default_model` / `JAIPH_AGENT_MODEL` is set and non-empty → use it.
-2. **Flags model** — for **cursor** and **claude**, `--model <name>` is found inside the corresponding flags (`agent.cursor_flags` or `agent.claude_flags`) → use it. **Codex** has no flag channel for the model; only step 1 or 3 apply.
-3. **Backend default** — **cursor** and **claude** use each CLI’s default when nothing else picks a model. **Codex** defaults to `gpt-4o` in code when no explicit model is set (see [Codex setup](#codex-setup)).
+| Variable | Effect |
+|---|---|
+| `JAIPH_PROMPT_RETRY=0` | Disable retry entirely (one attempt, fail on transport failure). |
+| `JAIPH_PROMPT_RETRY_DELAYS` | Comma-separated list of non-negative integer milliseconds. Invalid entries abort the prompt. |
 
-`agent.default_model` applies to **cursor**, **claude**, and **codex**. For the **Claude** backend, when `agent.default_model` is set and `agent.claude_flags` does not already contain `--model`, Jaiph passes `--model <value>` to the Claude CLI automatically. If both are set, the value in `agent.claude_flags` takes precedence (it is appended last).
+`jaiph test` defaults `JAIPH_PROMPT_RETRY=0`. Backoff sleep is interruptible: workflow abort, SIGINT, or SIGTERM cancels the pending wait without further backend calls.
 
-**Diagnostics.** Every prompt step records model metadata in **`PROMPT_START`** and **`PROMPT_END`** in **`run_summary.jsonl`** (`model`, `model_reason`):
+## Prompt watchdog timeouts
+{: #prompt-watchdog-timeouts}
 
-```jsonl
-{"type":"PROMPT_START","backend":"cursor","model":"gpt-4","model_reason":"explicit",...}
-```
+The retry backoff above handles a backend that *fails*. A separate set of watchdogs handles a backend that *hangs* — it never exits, so without them the runtime would block on the subprocess indefinitely (no commit, no queue progress, no retry). Each prompt invocation installs three independent layers over the spawned backend process:
 
-`model_reason` is one of: **`explicit`** (non-empty **`agent.default_model` / `JAIPH_AGENT_MODEL`**), **`flags`** (`--model` taken from **`agent.cursor_flags`** or **`agent.claude_flags`**), or **`backend-default`** (no resolved model string — Cursor/Claude binaries choose their own; **codex** also reports this when no model is configured, **even though** the HTTP client defaults to **`gpt-4o`**, so the **`model`** field may be omitted there). Inspect these events directly in the summary file.
+| Layer | Variable | Default | Trigger | Outcome |
+|---|---|---|---|---|
+| Completion grace | `JAIPH_PROMPT_COMPLETION_GRACE_SECONDS` | `30` | The backend emitted its terminal `result` event (work is done) but the process has not exited within the grace window. | Terminate the process, return **success** with the captured answer. |
+| Idle timeout | `JAIPH_PROMPT_IDLE_TIMEOUT_SECONDS` | `900` (15m) | No stdout/stderr for the whole window — the backend is stuck mid-work. | Terminate the process, return **failure** → feeds the [retry backoff](#prompt-retry-on-transport-failure). |
+| Absolute cap | `JAIPH_PROMPT_MAX_SECONDS` | `7200` (2h) | Total wall-clock for the single invocation exceeds the cap, regardless of activity. | Terminate the process, return **failure** → feeds the retry backoff. |
 
-**No-model troubleshooting.** If the backend rejects the auto-selected default, set **`agent.default_model`** (all backends). For **cursor** and **claude** you can also pass **`--model <name>`** in **`agent.cursor_flags`** / **`agent.claude_flags`**; **codex** has no flag channel — use **`agent.default_model`** or env **`JAIPH_AGENT_MODEL`** only.
+Set any variable to `0` to disable that layer. The idle timer resets on every chunk of backend output, so a slow-but-active run is bounded only by the absolute cap.
 
-## Testing with `jaiph test`
+The completion-grace layer specifically addresses the known `claude -p` failure mode where the CLI streams its final answer (and the terminal `result` event) but the process never exits — often because a descendant it spawned is still holding the output pipe open. When a watchdog fires it sends `SIGTERM`, escalating to `SIGKILL` after 5s, and tears down the runtime's handles on the child's stdio so a lingering descendant cannot keep the run alive. Under Docker, `runtime.docker_timeout_seconds` remains the outer backstop for the whole container.
 
-`jaiph test` never calls `resolveRuntimeEnv`. For a `test_run_workflow` step, the test runner builds a child `env` by **spreading `process.env`**, then sets `JAIPH_TEST_MODE`, `JAIPH_WORKSPACE`, `JAIPH_RUNS_DIR` (an ephemeral test path), `JAIPH_SCRIPTS`, and mock fields (`JAIPH_MOCK_RESPONSES_FILE` and/or `JAIPH_MOCK_DISPATCH_SCRIPT`) as needed. There is no CLI pass that pre-merges in-file `config` into that env; **`JAIPH_*_LOCKED` flags are not set** unless you export them in the parent environment yourself.
+## Custom agent commands
 
-`NodeWorkflowRuntime` still layers module- and workflow-level in-file `config` with `applyMetadataScope` (same `*_LOCKED` rules: metadata wins only when the key is not locked in the current env). To pin agent settings in CI, set `JAIPH_AGENT_*` / `JAIPH_RUNS_DIR` / `JAIPH_DEBUG` in the environment, and/or keep `config` in the `.jh` module that defines the workflow you exercise. Note: `jaiph run`’s `resolveRuntimeEnv` resolves `agent.trusted_workspace` to an absolute path against the workspace; **metadata-only** merging uses the in-file string as given — for tests, a relative `agent.trusted_workspace` may end up in `JAIPH_AGENT_TRUSTED_WORKSPACE` as-is, so set an absolute path in env or config if you need parity with a normal run.
+`agent.command` is consumed by the **cursor** backend only. For `claude` and `codex`, Jaiph always invokes the Claude CLI or the codex HTTP path, regardless of `agent.command`.
 
-## Config-to-env mapping
+When `agent.backend = "cursor"` and `agent.command`'s basename is anything other than `cursor-agent`, Jaiph treats it as a custom agent command:
 
-Quick reference for all in-file keys and their environment variable equivalents:
+| Channel | Behaviour |
+|---|---|
+| stdin | Prompt text piped to the command. |
+| stdout | Captured as the prompt response (raw text, no JSON framing). |
+| stderr | Passes through to the terminal. |
+| Cursor-specific flags (`--output-format`, `--stream-partial-output`, `--workspace`, …) | Not appended. |
+| Step display name | Command basename instead of `cursor`. |
 
-| In-file key | Environment variable |
-|-------------|----------------------|
-| `agent.default_model` | `JAIPH_AGENT_MODEL` |
-| `agent.command` | `JAIPH_AGENT_COMMAND` |
-| `agent.backend` | `JAIPH_AGENT_BACKEND` |
-| `agent.trusted_workspace` | `JAIPH_AGENT_TRUSTED_WORKSPACE` |
-| `agent.cursor_flags` | `JAIPH_AGENT_CURSOR_FLAGS` |
-| `agent.claude_flags` | `JAIPH_AGENT_CLAUDE_FLAGS` |
-| `run.logs_dir` | `JAIPH_RUNS_DIR` |
-| `run.debug` | `JAIPH_DEBUG` |
-| `run.recover_limit` | _(no env override)_ |
-| `runtime.docker_image` | `JAIPH_DOCKER_IMAGE` |
-| `runtime.docker_network` | `JAIPH_DOCKER_NETWORK` |
-| `runtime.docker_timeout_seconds` | `JAIPH_DOCKER_TIMEOUT` |
-| `module.name` | _(no env override)_ |
-| `module.version` | _(no env override)_ |
-| `module.description` | _(no env override)_ |
+Custom commands still participate in `PROMPT_START` / `PROMPT_END`, write artifacts, and apply `returns` schema validation when configured.
 
-There is **no in-file key** for the Codex HTTP endpoint or API key. Use environment only:
+## Test runner
 
-| Purpose | Environment variable |
-|---------|----------------------|
-| OpenAI-compatible API key (required for **codex**) | `OPENAI_API_KEY` |
-| OpenAI-compatible chat-completions URL override | `JAIPH_CODEX_API_URL` |
+`jaiph test` does not call `resolveRuntimeEnv`. The test runner spreads `process.env`, then sets `JAIPH_TEST_MODE`, `JAIPH_WORKSPACE`, `JAIPH_RUNS_DIR` (ephemeral), `JAIPH_SCRIPTS`, and mock fields (`JAIPH_MOCK_RESPONSES_JSON`, `JAIPH_MOCK_PROMPT_ARMS_JSON`). `JAIPH_*_LOCKED` flags are not set unless inherited from the parent env. `NodeWorkflowRuntime` still applies in-file `config` via `applyMetadataScope` with the same lock rules.
 
 ## Inspecting effective config at runtime
 
-Inside workflows, rules, and scripts, agent and run settings are visible as `JAIPH_*` environment variables. In orchestration strings, `${IDENTIFIER}` resolves from workflow variables first, then from the process environment.
+Agent and run settings are visible inside workflows, rules, and scripts as `JAIPH_*` environment variables. In orchestration strings, `${IDENT}` resolves against workflow bindings first, then against the process environment.
 
-```jh
-workflow default() {
-  log "backend=${JAIPH_AGENT_BACKEND} trusted_workspace=${JAIPH_AGENT_TRUSTED_WORKSPACE}"
-}
-```
+`JAIPH_DOCKER_*` variables are not populated from in-file `runtime.*` inside the workflow runner. Docker config is consumed when the CLI spawns the runner (or container); if a script needs Docker-related variables in its environment, export them from the parent shell.
 
-The runtime also sets `JAIPH_ARTIFACTS_DIR` — the absolute path to the writable artifacts directory for the current run (`.jaiph/runs/<run_id>/artifacts/` on the host, `/jaiph/run/artifacts` inside the Docker sandbox). The `jaiphlang/artifacts` library reads this variable; you can also use it directly in scripts. See [Libraries — `jaiphlang/artifacts`](libraries.md#jaiphlangartifacts--publishing-files-out-of-the-sandbox).
+## Created by `jaiph init`
 
-`JAIPH_DOCKER_*` variables are **not** populated from in-file `runtime.*` inside the workflow runner process. Docker is configured when the CLI spawns the runner (or container). If you need Docker-related variables inside a `script` step, export them yourself or inherit them from the parent shell.
+`jaiph init` creates `.jaiph/bootstrap.jh`, `.jaiph/SKILL.md`, and `.jaiph/.gitignore`. There is no separate config file — `config { … }` blocks live in workflow source. See [CLI — `jaiph init`](cli.md#jaiph-init).
 
-## Created by `jaiph init`
+## Related
 
-`jaiph init` creates `.jaiph/bootstrap.jh`, writes `.jaiph/SKILL.md` from the skill file bundled with your installation (see `JAIPH_SKILL_PATH` in the [CLI](cli.md) reference), and ensures `.jaiph/.gitignore` matches the canonical template (lists `runs` and `tmp` under `.jaiph/`). It does not add a separate config file — use `config { ... }` in your workflow sources.
+- [Environment variables](env-vars.md) — every variable Jaiph reads.
+- [CLI](cli.md) — flags that front-end these config knobs.
+- [Sandboxing](sandboxing.md) — Docker sandbox model.
+- [Grammar](grammar.md) — `config` block syntax in the formal grammar.
diff --git a/docs/configure-backend.md b/docs/configure-backend.md
new file mode 100644
index 00000000..472e89c5
--- /dev/null
+++ b/docs/configure-backend.md
@@ -0,0 +1,84 @@
+---
+title: Configure backend & model
+permalink: /how-to/configure-backend
+diataxis: how-to
+---
+
+# Configure the agent backend and model
+
+This recipe picks which agent backend `prompt` steps use (`cursor`, `claude`, or `codex`) and which model to ask for. Configuration can live in the workflow file (`config { … }`) or in the environment. Environment wins over in-file when both are set.
+
+For the full key/default/precedence reference, see [Configuration](/reference/configuration). For credential setup per backend, see [Authenticate agent backends](/how-to/agent-auth).
+
+## Prerequisites
+
+- The agent CLI for the chosen backend is on `PATH` (`cursor-agent` for `cursor`, `claude` for `claude`; `codex` uses HTTP and needs no CLI).
+- Credentials are set per [Authenticate agent backends](/how-to/agent-auth).
+
+## 1. Set the backend in the entry file
+
+Add a module-level `config { … }` block at the top of your `.jh` file:
+
+```jh
+config {
+  agent.backend = "claude"
+  agent.default_model = "sonnet-4"
+}
+
+workflow default() {
+  const answer = prompt "Summarize this codebase"
+  log "${answer}"
+}
+```
+
+The valid backend values are `"cursor"` (the default), `"claude"`, and `"codex"`. The model string is forwarded to the backend — use a name the backend recognizes (e.g. `gpt-4o` for codex, `sonnet-4` for claude).
+
+## 2. Override per-workflow
+
+To use a different backend for one workflow in the same file, add a workflow-level `config { … }` block (it must be the first non-comment construct in the body):
+
+```jh
+workflow fast_check() {
+  config {
+    agent.backend = "cursor"
+    agent.default_model = "gpt-3.5"
+  }
+  ensure some_rule()
+}
+```
+
+Only `agent.*` and `run.*` keys are allowed at workflow scope. `runtime.*` and `module.*` keys are module-only.
+
+## 3. Override from the environment
+
+```bash
+export JAIPH_AGENT_BACKEND="claude"
+export JAIPH_AGENT_MODEL="sonnet-4"
+jaiph run ./flow.jh
+```
+
+When set, the environment value wins over both the workflow-level and module-level `config` blocks. The CLI marks each inherited agent/run env var as locked (`JAIPH_AGENT_BACKEND_LOCKED=1`, `JAIPH_AGENT_MODEL_LOCKED=1`, …) for the lifetime of that run so in-file overrides never silently take effect.
+
+## 4. (Codex) Override the API URL
+
+The `codex` backend defaults to `https://api.openai.com/v1/chat/completions`. To target an OpenAI-compatible endpoint:
+
+```bash
+export JAIPH_CODEX_API_URL="https://api.example.com/v1/chat/completions"
+```
+
+## Verification
+
+Each `prompt` step records the resolved backend and model in `run_summary.jsonl`. After the run, inspect the first `PROMPT_START` line:
+
+```bash
+jq -c 'select(.type=="PROMPT_START")' .jaiph/runs/<date>/<time>-<entry>/run_summary.jsonl | head -1
+```
+
+The line includes `"backend":"<backend>"`, `"model"` (the resolved string, or `null` when the backend auto-selects), and `model_reason` (`explicit`, `flags`, or `backend-default`). When `model_reason` is `backend-default`, codex still calls the API with `gpt-4o` even though `"model"` is `null` in the summary.
+
+## Related
+
+- [Authenticate agent backends](/how-to/agent-auth) — the credentials each backend needs.
+- [Configuration — Precedence](/reference/configuration#precedence) — env vs module vs workflow layering, lock flags, and nested-call scoping.
+- [Configuration](/reference/configuration) — the full set of config keys, defaults, and env equivalents.
diff --git a/docs/contributing.md b/docs/contributing.md
index fbbd1422..05119b24 100644
--- a/docs/contributing.md
+++ b/docs/contributing.md
@@ -1,6 +1,7 @@
 ---
 title: Contributing
 permalink: /contributing
+diataxis: contributor
 redirect_from:
   - /contributing.md
 ---
@@ -9,9 +10,9 @@ redirect_from:
 
 Contributor docs answer a narrow question: **where changes belong**, **how to run the same checks CI runs**, and **which test layer** should encode a behavior change.
 
-At a high level, Jaiph is built as described in [Architecture](architecture.md) — transpile path (`emitScriptsForModule`, `buildScripts`), parse-only **`buildRuntimeGraph()`**, **`jaiph compile`** (validate-only), **`NodeWorkflowRuntime`**, artifact layout, and Docker helper contracts. Treat that page as authoritative for pipelines and boundaries; if anything here diverges from it or from the implementation, prefer **architecture + source**.
+At a high level, Jaiph is built as described in [Architecture](architecture.md) — **`loadModuleGraph`** → per-module **`validateModule`** + script emit via **`buildScriptsFromGraph`** / **`emitScriptsForModuleFromGraph`**, the same graph consumed by **`buildRuntimeGraph(graph)`**, validate-only **`jaiph compile`** (**`collectDiagnostics`**), **`NodeWorkflowRuntime`**, artifact layout, and Docker helper contracts. Treat that page as authoritative for pipelines and boundaries; if anything here diverges from it or from the implementation, prefer **architecture + source**.
 
-For workflow syntax, library usage, tooling setup, and grammar details, see [Language](language.md), [Setup](setup.md), [Grammar](grammar.md), and the overview in [Getting Started](getting-started.md).
+For workflow syntax, library usage, tooling setup, and grammar details, see [Language](language.md), [Install & switch versions](setup.md), [Grammar](grammar.md), and [Your first workflow](first-workflow.md). For the `*.test.jh` language and test blocks, see [Write & run tests](testing.md).
 
 ## Branching and pull requests
 
@@ -37,25 +38,28 @@ jaiph --version
 jaiph --help
 ```
 
-The script installs from local source (including uncommitted changes) and places the CLI in `~/.local/bin` by default (or `JAIPH_BIN_DIR` if set).
+The script builds the self-contained standalone binary from local source (`npm install` + `npm run build:standalone`, including uncommitted changes) and installs `dist/jaiph` to `~/.local/bin` by default (or `JAIPH_BIN_DIR` if set). The result is the same single-file artifact that `docs/install` downloads from a GitHub Release; only the origin of the binary differs.
+
+**From-source prerequisites:** **`npm`** and **[Bun](https://bun.sh)** (`bun build --compile` produces the standalone binary). Node is not required to *run* the result, but `npm install` still pulls dev dependencies; on most Linux/macOS hosts the system `npm` ships with Node 20+.
 
 ## Developing in the repository
 
 For day-to-day work on the compiler and CLI you usually stay inside the clone: install dev dependencies once, then build and run tests from npm scripts.
 
-**Prerequisites:** Node.js **20.x** and npm (same **`setup-node`** version as `.github/workflows/ci.yml`). The installers also expect `git` and `bash`. End-to-end tests are written in bash and are run by `e2e/test_all.sh`.
+**Prerequisites:** Node.js **20.x** and **`npm`** (matching `.github/workflows/ci.yml`). **[Bun](https://bun.sh)** is also required for `npm run build:standalone` and `./docs/install-from-local.sh`; standalone cross-compiles run in `.github/workflows/release.yml` via `oven-sh/setup-bun`, not in the main `ci.yml` unit/E2E jobs. End-user installs from `docs/install` need only `curl` and `shasum` / `sha256sum`. The installers also expect `bash`. End-to-end tests are written in bash and are run by `e2e/test_all.sh`.
 
 **Typical commands** (from the repo root):
 
 | Command | What it runs |
 |---------|----------------|
 | `npm install` | Installs TypeScript and types (dev dependencies). |
-| `npm run build` | Runs `tsc`, then copies **`src/runtime`** → **`dist/src/runtime`** (kernel JS for the compiled CLI) and **`runtime/overlay-run.sh`** → **`dist/src/runtime/overlay-run.sh`** (Docker overlay entrypoint). |
-| `npm run build:standalone` | `npm run build`, then copies **`dist/src/runtime`** → **`dist/runtime`** and runs **`bun build --compile ./src/cli.ts --outfile ./dist/jaiph`**. Requires [Bun](https://bun.sh). Ship **`dist/jaiph`** beside **`dist/runtime`** ([Architecture — Distribution](architecture.md#distribution-node-vs-bun-standalone)). |
-| `npm test` | **`npm run clean`**, then **`npm run build`**, then the Node.js test runner with **`JAIPH_UNSAFE=true`**, **`NODE_OPTIONS`** including **`--enable-source-maps`** and a large heap limit, on every file under `dist/integration/` matching `*.test.js`, every file under `dist/src/` matching `*.test.js` or `*.acceptance.test.js` (via `find`), `dist/test-infra/compiler-test-runner.js` (txtar compiler tests), and `dist/test-infra/golden-ast-runner.js` (golden AST tests). |
+| `npm run build` | Runs **`npm run embed-assets`** (regenerates **`src/runtime/embedded-assets.ts`** from `runtime/overlay-run.sh` and `docs/jaiph-skill.md`, and **`src/version.ts`** from `package.json`'s `version` field), then `tsc`, then copies **`src/runtime`** → **`dist/src/runtime`** (kernel JS for the compiled CLI) and **`runtime/overlay-run.sh`** → **`dist/src/runtime/overlay-run.sh`** (Docker overlay entrypoint). |
+| `npm run embed-assets` | Runs `tools/embed-assets.js` to regenerate **`src/runtime/embedded-assets.ts`** and **`src/version.ts`**. Invoked automatically by `npm run build` and by `npm install` (via the `prepare` lifecycle script, so gitignored **`src/version.ts`** exists on a fresh checkout before **`tsc`**); run it standalone after editing embedded source files if you want to refresh the generated copies without a full rebuild. **`src/runtime/embedded-assets.test.ts`** fails CI if checked-in **`src/runtime/embedded-assets.ts`** drifts from **`runtime/overlay-run.sh`** or **`docs/jaiph-skill.md`**. |
+| `npm run build:standalone` | `npm run build`, then copies **`dist/src/runtime`** → **`dist/runtime`** and runs **`bun build --compile ./src/cli.ts --outfile ./dist/jaiph`**. Requires [Bun](https://bun.sh). The resulting **`dist/jaiph`** is **fully self-contained** — `overlay-run.sh` and `jaiph-skill.md` are baked into the binary, and workflow launch self-spawns via the internal `__workflow-runner` argv marker, so the binary needs no sibling `runtime/` or `docs/` files and no `node` / `npm` on the host. The `dist/runtime` copy is kept for parity with the npm layout ([Architecture — Distribution](architecture.md#distribution-node-vs-bun-standalone)). |
+| `npm test` | **`npm run clean`**, then **`npm run build`**, then the Node.js test runner with **`JAIPH_UNSAFE=true`**, **`NODE_OPTIONS`** including **`--enable-source-maps`** and a large heap limit, on every file under `dist/integration/` matching `*.test.js`, every file under `dist/src/` matching `*.test.js` or `*.acceptance.test.js` (via `find`), `scripts/build-registry.test.mjs`, `dist/test-infra/compiler-test-runner.js` (txtar compiler tests), and `dist/test-infra/golden-ast-runner.js` (golden AST tests). |
 | `npm run test:compiler` | **`npm run build`**, then **`node --test`** on `dist/test-infra/compiler-test-runner.js` — runs txtar-based compiler test fixtures from `test-fixtures/compiler-txtar/`. |
 | `npm run test:golden-ast` | **`npm run build`**, then **`node --test`** on `dist/test-infra/golden-ast-runner.js` — runs golden AST tests from `test-fixtures/golden-ast/`. Use `UPDATE_GOLDEN=1 npm run test:golden-ast` to regenerate goldens after intentional parser changes. |
-| `npm run test:acceptance:compiler` | **`npm run build`**, then **`node --test`** with only `*.acceptance.test.js` files under **`dist/src/`** (same `find … -name '*.acceptance.test.js'` fragment as **`package.json`**) — compiler acceptance tests without the full unit suite or E2E. |
+| `npm run test:acceptance:compiler` | **`npm run build`**, then **`node --test`** with only `*.acceptance.test.js` files under **`dist/src/`** — compiler acceptance tests without the full unit suite or E2E. |
 | `npm run test:acceptance:runtime` | **`bash ./e2e/test_all.sh`** only — same E2E driver as below **without** an implicit rebuild; ensure `dist/` is up to date before running. |
 | `npm run test:acceptance` | **`npm run test:acceptance:compiler`** then **`npm run test:acceptance:runtime`**. |
 | `npm run test:e2e` | **`npm run build`**, then **`bash ./e2e/test_all.sh`**. Prefer this when you want a fresh `dist/` before E2E. **`e2e::prepare_shared_context`** in `e2e/lib/common.sh` exports **`JAIPH_DOCKER_ENABLED=false`** after clearing most **`JAIPH_*`** variables, so typical tests run on the **host**; Docker coverage lives in scripts that set **`JAIPH_DOCKER_ENABLED=true`** — see [E2E testing](#e2e-testing) and **`resolveDockerConfig`** in `src/runtime/docker.ts` / [Architecture — Core components](architecture.md#core-components). |
@@ -74,7 +78,8 @@ The root `.gitignore` blocks common debug and temp directory patterns so they ne
 | `nested-*/` | Nested-run debug directories |
 | `overlay-*/` | Overlay/fuse debug directories |
 | `local-*/` | Local debug directories |
-| `.tmp*/` | Temp build/debug directories |
+| `.tmp/` | Temp build/debug directory (exact name) |
+| `.tmp*/` | Temp build/debug directories (prefix) |
 | `QUEUE.md.tmp.*` | Stale queue temp files |
 
 If you create throwaway directories during development, use one of these prefixes so they are automatically ignored. To track a file that matches a blocked pattern, use `git add -f`.
@@ -102,27 +107,36 @@ Jaiph uses several test layers. Each layer catches a different class of bug. Use
 | **Module tests** | `src/**/*.test.ts` (colocated) | Bugs in pure functions (event parsing, param formatting, path resolution, config merging) | The function is self-contained, takes input and returns output, no I/O |
 | **Compiler acceptance tests** | `src/transpile/*.acceptance.test.ts` (colocated) | Cross-module compiler behavior: validation errors, resolution, and other cases that need a temp project tree or subprocess | You need a deterministic error string, multi-file `buildScripts`, or behavior that does not fit a tiny golden snippet |
 | **Compiler golden tests** | `src/transpile/compiler-golden.test.ts` (colocated) | Regressions in the parser, validation messages, and scripts-only extraction (`buildScriptFiles` in `emit-script.ts`) — expectations are inline in the test file | You changed the parser, validator, or script extraction and need to lock an exact error string, extracted script shape, or corpus behavior |
-| **Compiler tests (txtar)** | `test-fixtures/compiler-txtar/*.txt` | Parse and validate outcomes — success, parse errors, validation errors — using language-agnostic txtar fixtures (hundreds of `===` cases across the four `*.txt` files) | You want a portable test case that can be reused by alternative compiler implementations; the test is a `.jh` input paired with an expected outcome |
-| **Golden AST tests** | `test-fixtures/golden-ast/fixtures/*.jh` + `test-fixtures/golden-ast/expected/*.json` | Parse tree shape for successful parses — serialized to deterministic JSON with locations stripped (9 fixtures: e.g. imports, brace-if, log, match and match-multiline, params, prompt-capture, run-ensure, script-defs) | You changed the parser and need to verify the AST structure hasn't drifted; txtar tests only check pass/fail, goldens lock in the actual tree shape |
-| **Integration tests** | `integration/*.test.ts`, `integration/sample-build/*.test.ts` | Process-level integration behavior: signal handling, TTY rendering, run summary structure, sample builds | The test spans multiple modules or requires subprocess/PTY harnesses |
+| **Trivia / formatter round-trip** | `src/parse/trivia-ast-shape.test.ts`, `src/parse/trivia-grep.test.ts`, `src/format/roundtrip.test.ts` | Source-fidelity invariants: no trivia fields on semantic AST types (compile-time), validator/emitter sources do not reference `Trivia`, and `parse → format → parse → format` is bit-for-bit on every fixture under `examples/` and `test-fixtures/golden-ast/fixtures/` | You changed the parser, formatter, AST types, or anything that touches source-fidelity round-trip (see [Architecture — Trivia (CST layer)](architecture.md#trivia-cst-layer)) |
+| **Call-args AST shape** | `src/parse/arg-ast-shape.test.ts`, `src/parse/arg-grep.test.ts` | Pins the typed-`Arg[]` invariant: no `bareIdentifierArgs` field on any call-bearing AST type (compile-time), no `args.split(",")` or `bareIdentifierArgs` text in production `src/parse/` or `src/transpile/` sources, and no `validateBareIdentifierArgs` helper in the validator | You changed how call arguments flow through the parser, validator, or emitter |
+| **`Expr` / step-variant shape** | `src/types-shape.test.ts` | Pins exactly 8 `WorkflowStepDef` variants and 8 `Expr` kinds, no AST placeholder strings (`"__match__"`, `"run inline_script"`, `"__JAIPH_MANAGED__"`) anywhere under `src/`, and `ConstRhs` / `SendRhsDef` no longer exported from `src/types.ts` | You added or renamed a step variant or `Expr` kind |
+| **Validator single-walk shape** | `src/transpile/validate-single-walk.test.ts` | Pins the validator's "one descent per workflow / rule" invariant | You touched `walkStepTree` or added a new pre-pass over workflow steps |
+| **Validator visitor-table shape** | `src/transpile/validate-visitor.test.ts` | Caps `validate.ts` at **≤700 lines**; snapshot-pins `{ code, line, col, message }` from `validate-errors.txt` and `validate-errors-multi-module.txt` into `test-fixtures/compiler-txtar/validate-diagnostics-snapshot.json`; asserts unknown step types produce exactly one `internal: no validator for step type "…"` diagnostic | You touched the `VALIDATORS` table or changed `E_VALIDATE` message wording — refresh snapshots with `UPDATE_SNAPSHOTS=1` only after confirming the change is intentional |
+| **Statement-dispatch-table shape** | `src/parse/parse-synthetic-keyword.test.ts`, `src/parse/parse-error-snapshot.test.ts` | Pins the `STATEMENT` keyword-dispatch refactor of `parseBlockStatement`; snapshot-pins every parse error in `test-fixtures/compiler-txtar/parse-errors.txt` into `test-fixtures/compiler-txtar/parse-errors-snapshot.json` | You added a top-level keyword or changed any `E_PARSE` message — refresh snapshots with `UPDATE_SNAPSHOTS=1` only after confirming the change is intentional |
+| **Attached-block parser shape** | `src/parse/parse-attached-block.test.ts` | Caps `src/parse/steps.ts` at **≤200 lines**; asserts `catch` / `recover` bodies share `parseBlockStatement` | You touched `parseAttachedBlock` / `parseRunOrEnsure` |
+| **Compile-time / runtime layering** | `src/transpile/no-runtime-imports.test.ts`, `src/parse/canonicalize-triple-quoted.test.ts` | No `from "…/runtime/…"` imports under `src/transpile/`; triple-quoted match-arm bodies match `canonicalizeTripleQuotedString` bit-for-bit | You added a helper used by both validator and runtime (it belongs in `src/parse/`) |
+| **Diagnostics collector shape** | `src/transpile/diagnostics-collector.test.ts` | `collectDiagnostics(graph)` returns all recoverable errors; `validate.ts` and `validate-step.ts` have zero `throw jaiphError(` sites; `jaiph compile --json` returns the full diagnostic array | You migrated checks to the collector or changed `jaiph compile` output |
+| **Compiler tests (txtar)** | `test-fixtures/compiler-txtar/*.txt` | Parse and validate outcomes using language-agnostic txtar fixtures | Portable test cases reusable by alternative compiler implementations |
+| **Golden AST tests** | `test-fixtures/golden-ast/fixtures/*.jh` + `test-fixtures/golden-ast/expected/*.json` | Parse tree shape for successful parses — serialized to deterministic JSON with locations stripped (11 fixtures under `fixtures/`) | You changed the parser and need to verify AST structure hasn't drifted |
+| **Integration tests** | `integration/**/*.test.ts` (sample-build, docs parity, top-level) | Process-level integration behavior: signal handling, TTY rendering, run summary structure, sample builds, Diátaxis docs contracts | The test spans multiple modules, requires subprocess/PTY harnesses, or encodes a cross-cutting docs contract |
 | **E2E tests** | `e2e/tests/*.sh` | Runtime behavior — does the workflow actually execute correctly end-to-end? | The behavior involves the CLI launcher, Node runtime, process lifecycle, or file artifacts |
 
 ### Key principles
 
-1. **Compile-time validation vs graph loading.** `buildScripts` / `emitScriptsForModule` run **`validateReferences`** before any script files are written. **`buildRuntimeGraph()`** only parses modules and follows imports — it does **not** re-run that validation. Lock compile errors in the compiler/validator tests; the runtime graph is the wrong layer for that (see [Architecture — Core components](architecture.md#core-components)). **`jaiph compile`** runs **`validateReferences` only** (no **`buildScripts`**, no runner); cover it with txtar/acceptance/E2E such as `e2e/tests/109_compile_command.sh`, not by expecting the full transpile path — see [Architecture — System overview](architecture.md#system-overview).
+1. **Compile-time validation vs graph loading.** `buildScriptsFromGraph` / `emitScriptsForModuleFromGraph` run **`validateModule`** before any script files are written. **`buildRuntimeGraph(graph)`** prepares the runtime view from the in-memory graph — it does **not** re-run compile-time validation. Lock compile errors in validator/txtar/acceptance tests; the runtime graph is the wrong layer for that. **`jaiph compile`** calls **`collectDiagnostics(graph)`** (same checks as **`validateReferences`**, all errors reported) — no **`buildScriptsFromGraph`**, no runner spawn; see [Architecture — System overview](architecture.md#system-overview).
 2. **`jaiph test` vs live events.** **`jaiph test`** reuses **`NodeWorkflowRuntime`** with **`suppressLiveEvents: true`** so **`__JAIPH_EVENT__`** lines are **not** written to stderr alongside **`node --test`** output while **`run_summary.jsonl`** and other artifact paths stay consistent where the harness writes them ([Architecture — Test runner integration](architecture.md#test-runner-integration-testjh-in-the-kernel)).
 3. **Tests are behavior contracts.** E2E tests and acceptance tests define what the product does. Default approach: change production code to satisfy tests, not the other way around.
 4. **Modify existing tests only with a strong reason:** intentional product behavior change, incorrect test expectation, or removal of an obsolete feature. Any such change should be minimal and paired with a clear rationale.
-5. **Golden tests are the compiler's safety net.** After transpiler changes, run `npm test`. Failures in `src/transpile/compiler-golden.test.ts` usually mean updating an explicit expected string or fixture in that file — there is no separate dump script; align expectations with intentional emitter changes and re-run `npm test`. **Golden AST tests** (`test-fixtures/golden-ast/`) complement this by locking in the parse tree shape — if those fail, regenerate with `UPDATE_GOLDEN=1 npm run test:golden-ast` and review the diff.
+5. **Golden tests are the compiler's safety net.** After transpiler changes, run `npm test`. Failures in `src/transpile/compiler-golden.test.ts` usually mean updating an explicit expected string in that file. **Golden AST tests** (`test-fixtures/golden-ast/`) complement this — if those fail, regenerate with `UPDATE_GOLDEN=1 npm run test:golden-ast` and review the diff.
 6. **E2E tests assert two things independently:** what the user sees (CLI tree output via `e2e::expect_stdout`) and what the runtime persists (artifact files via `e2e::expect_out`, `e2e::expect_file`). A bug could break one without the other.
 7. **Prefer the narrowest test layer.** A pure function bug should be caught by a unit test, not an E2E test. E2E tests are expensive to run and hard to debug — reserve them for integration-level behavior.
 
 ### TypeScript test layout
 
 - **Module tests** — live next to the source they validate under `src/` (e.g. `src/parse/parse-core.test.ts`, `src/cli/run/display.test.ts`, `src/transpile/compiler-golden.test.ts`). Names are `*.test.ts` or `*.acceptance.test.ts`.
-- **Integration tests** — span multiple modules or need subprocess/PTY harnesses; they live in `integration/` (see [Integration tests](#integration-tests)).
+- **Integration tests** — span multiple modules, need subprocess/PTY harnesses, or enforce docs structure/contracts; they live in `integration/` (see [Integration tests](#integration-tests)).
 - **E2E** — bash scripts in `e2e/tests/*.sh`, driven by `e2e/test_all.sh`.
-- **`npm test`** discovers colocated files under `src/`, integration tests under `integration/`, and test infrastructure in `test-infra/`; see the [Developing in the repository](#developing-in-the-repository) table for the exact command.
+- **`npm test`** runs the compiled suites under `dist/src/`, `dist/integration/`, and `dist/test-infra/` (after `npm run build`; see the [Developing in the repository](#developing-in-the-repository) table for the exact command).
 
 ### Module test layout (colocated)
 
@@ -138,7 +152,7 @@ find src -type f \( -name '*.test.ts' -o -name '*.acceptance.test.ts' \) | sort
 |------|------------------|------------------------|
 | Parser and tokenizer helpers | `src/parse/*.test.ts`, `src/parse/dedent.test.ts` | `.jh` / `.test.jh` surface: imports, config, steps, strings, channels, fences, `run async`, … |
 | CLI and terminal UX | `src/cli/**/*.test.ts` | Commands, `jaiph run` lifecycle, progress, hooks, `resolve-env` |
-| Transpiler and validation | `src/transpile/*.test.ts` + `*.acceptance.test.ts` | `validateReferences`, `emit`, golden compiler (`compiler-golden.test.ts`), cross-module edge cases (`compiler-edge.acceptance.test.ts`) |
+| Transpiler and validation | `src/transpile/*.test.ts` + `*.acceptance.test.ts` | `validateModule`, `emit`, golden compiler (`compiler-golden.test.ts`), cross-module edge cases (`compiler-edge.acceptance.test.ts`) |
 | Formatter | `src/format/*.test.ts` | `jaiph format` |
 | Runtime and Docker | `src/runtime/kernel/*.test.ts`, `src/runtime/docker.test.ts` | Graph, emit, prompts, test runner, workflow launch, `docker` helper |
 | Standalone root tests | e.g. `src/inline-script-name.test.ts` | Small colocated cases that are not under a feature subtree |
@@ -147,11 +161,17 @@ When adding a new source module or extending an existing one, create or extend t
 
 ### Integration tests
 
-Tests that span multiple modules, require subprocess/PTY harnesses, or exercise process-level behavior live in `integration/`. These do not belong to a single module:
+Tests that span multiple modules, require subprocess/PTY harnesses, exercise process-level behavior, or enforce documentation structure/contracts live in `integration/`. These do not belong to a single module:
 
 | Test file | Kind | What it covers |
 |-----------|------|----------------|
-| `integration/sample-build/build.test.ts` | Integration | Build/transpile behavior — `buildScripts`, `buildScriptFiles`, script extraction |
+| `integration/docs-structure.test.ts` | Integration | Diátaxis docs lint — valid `diataxis:` front matter, nav ↔ page bijection, internal link / permalink / `redirect_from` resolution |
+| `integration/docs-explanation-task3.test.ts` | Integration | Four greenfield explanation pages (`why-jaiph`, `inbox`, `spec-async-handles`, `sandboxing`) — permalinks, nav placement; **`sandboxing.md`** shape (threat model present; no how-to procedure headings or config-key tables) |
+| `integration/docs-how-to-task4.test.ts` | Integration | How-to quadrant — permalinks, retired-path redirects, recipe shape, `agent-auth` credential / pre-flight error pinning |
+| `integration/docs-reference-task5.test.ts` | Integration | Reference quadrant — permalinks, nav placement, `env-vars.md` source parity against `src/`, anti-tutorial shape guards |
+| `integration/docs-tutorials-task6.test.ts` | Integration | Tutorial quadrant — permalinks, `/getting-started` redirect absorption, runnable `first-workflow` snippet with documented output |
+| `integration/docs-nav-structure-task7.test.ts` | Integration | Nav spine — five Diátaxis section headings in documented order; every published page under its quadrant exactly once |
+| `integration/sample-build/build.test.ts` | Integration | Build/transpile behavior — `buildScripts`, script extraction |
 | `integration/sample-build/cli-tree.test.ts` | Integration | CLI tree output rendering for sample workflows |
 | `integration/sample-build/run-core.test.ts` | Integration | Core runtime execution — workflow runs, step sequencing, artifacts |
 | `integration/sample-build/run-prompt-agent.test.ts` | Integration | Prompt and agent interaction in sample workflows |
@@ -160,32 +180,61 @@ Tests that span multiple modules, require subprocess/PTY harnesses, or exercise
 | `integration/sample-build/test-framework.test.ts` | Integration | Test framework basics — `mock prompt`, `expect_*`, test block lifecycle |
 | `integration/run-summary-jsonl.test.ts` | Integration | Runs the CLI on a small workflow and asserts structure and fields of `run_summary.jsonl` under `.jaiph/runs/` |
 | `integration/signal-lifecycle.test.ts` | Acceptance | After SIGINT/SIGTERM, verifies `jaiph run` exits within a time bound and leaves no stale child processes |
+| `integration/subcommand-help.test.ts` | Integration | `--help` / usage text for CLI subcommands |
 | `integration/tty-running-timer.test.ts` | Acceptance | In a TTY, verifies the “RUNNING workflow” line updates over time (requires Python 3 PTY harness) |
 
 The `integration/sample-build/` directory also has a shared `helpers.ts` module used by the sample-build tests. Shared test fixtures (`.jh` source files and expected output) live in `test-fixtures/sample-build/`.
 
 ## CI pipeline
 
-The project uses GitHub Actions (`.github/workflows/ci.yml`). The workflow defines **six** jobs; on a typical feature-branch push, **five** of them run. The sixth — **Publish Docker runtime image** — runs only on pushes to **`nightly`** and on **`v*`** version tags, after the other jobs succeed. It builds and pushes `ghcr.io/jaiphlang/jaiph-runtime` (the default `runtime.docker_image` / `JAIPH_DOCKER_IMAGE` when Docker sandboxing is on; see **Docker runtime helper** in [Architecture](architecture.md#core-components)).
+The project uses GitHub Actions (`.github/workflows/ci.yml`). The workflow defines **six** jobs; on a typical feature-branch push, **five** of them run. The sixth — **Publish Docker runtime image** — runs only on pushes to **`nightly`** and on **`v*`** version tags, after the test, E2E, docs, and WSL jobs succeed (ShellCheck is not a publish gate). It builds and pushes `ghcr.io/jaiphlang/jaiph-runtime` (the default `runtime.docker_image` / `JAIPH_DOCKER_IMAGE` when Docker sandboxing is on; see **Docker runtime helper** in [Architecture](architecture.md#core-components)).
 
 | Job | Runner | Purpose |
 |-----|--------|---------|
 | **ShellCheck** | `ubuntu-latest` | Runs `shellcheck` on `runtime/overlay-run.sh` to lint the standalone shell script shipped in the npm package. |
 | **Compiler and unit tests** | `ubuntu-latest` | `npm test` (TypeScript unit + acceptance + golden tests), plus a `curl` check that the public install URL responds and a git-tag verification on `main`. |
-| **E2E** | Matrix: **`ubuntu-latest` twice** + **`macos-latest`** | Job id `e2e`; in the Actions UI each leg appears as **`E2E (<os>, <label>)`**. Runs `npm run test:e2e`. The **`docker`** Ubuntu leg builds **`jaiph-ci-runtime:local`** from **`runtime/Dockerfile`** and exports **`JAIPH_DOCKER_IMAGE=jaiph-ci-runtime:local`** so scripts that set **`JAIPH_DOCKER_ENABLED=true`** do not pull **`ghcr.io/…`** during the job. **`JAIPH_UNSAFE`** is unset on that leg and set to **`true`** on Ubuntu **host** plus **macOS** — unlike manual **`jaiph run`** (see **`resolveDockerConfig`** / [Sandboxing](sandboxing.md)), that matrix choice does **not** mean “everything runs in Docker”: **`e2e/lib/common.sh`** sets **`JAIPH_DOCKER_ENABLED=false`** by default, so only scripts that explicitly re-enable Docker hit the sandbox. Container-only assertions on non-Linux runners use **`e2e::skip`** or availability guards. Implementation: **`src/runtime/docker.ts`**; overview: [Architecture — Core components](architecture.md#core-components). |
-| **Getting started (local)** | `ubuntu-latest` | Serves the Jekyll site from `docs/` on `127.0.0.1:4000`, smoke-checks key routes with `curl`, builds the same local runtime image as E2E for any Docker-backed sample paths, installs Playwright (Chromium), and runs `npx playwright test` for landing-page samples. The Playwright step builds Jaiph, checks sample source against `examples/*.jh`, and runs deterministic samples through the CLI. No runtime dependency on `jaiph.org` for the site content. |
+| **E2E** | Matrix: **`ubuntu-latest` twice** + **`macos-latest`** | Job id `e2e`; in the Actions UI each leg appears as **`E2E (<os>, <label>)`**. Runs `npm run test:e2e`. The **`docker`** Ubuntu leg builds **`jaiph-ci-runtime:local`** from **`runtime/Dockerfile`** and exports **`JAIPH_DOCKER_IMAGE=jaiph-ci-runtime:local`** into the job env (also used by **Getting started (local)**). **`e2e::prepare_shared_context`** clears most inherited **`JAIPH_*`** variables before each test, so Docker E2E scripts that need a local image call **`e2e::ensure_docker_test_image`** (builds **`jaiph-e2e-runtime:local`** from the same **`runtime/Dockerfile`**) and pass **`JAIPH_DOCKER_IMAGE="${E2E_DOCKER_TEST_IMAGE}"`**. **`JAIPH_UNSAFE`** is unset on that leg and set to **`true`** on Ubuntu **host** plus **macOS** — unlike manual **`jaiph run`** (see **`resolveDockerConfig`** / [Sandboxing](sandboxing.md)), that matrix choice does **not** mean “everything runs in Docker”: **`e2e/lib/common.sh`** sets **`JAIPH_DOCKER_ENABLED=false`** by default, so only scripts that explicitly re-enable Docker hit the sandbox. Container-only assertions on non-Linux runners use **`e2e::skip`** or availability guards. |
+| **Getting started (local)** | `ubuntu-latest` | Serves the Jekyll site from `docs/` on `127.0.0.1:4000`, smoke-checks key routes with `curl`, builds the same local runtime image as E2E for any Docker-backed sample paths, installs Playwright (Chromium), and runs `npx playwright test` for landing-page samples. |
 | **E2E install and CLI workflow (windows-latest + wsl)** | `windows-latest` | Provisions or selects a WSL distro, installs Node inside it, and runs `npm run test:e2e` under WSL with **`JAIPH_UNSAFE=true`**. |
 | **Publish Docker runtime image** | `ubuntu-latest` | *Conditional (see above).* Multi-arch push to GHCR. |
 
-### Version tags and npm
+### Version tags, releases, and npm
+
+The supported release-prep path is the **`.jaiph/prepare_release.jh`** workflow. Run it as:
+
+```bash
+jaiph run .jaiph/prepare_release.jh -- 0.10.0    # explicit X.Y.Z
+jaiph run .jaiph/prepare_release.jh             # next patch from package.json
+```
+
+The workflow refuses to start when the git tree is dirty or when `v<version>` already exists, then bumps `package.json` + `package-lock.json` via `npm version X.Y.Z --no-git-tag-version --allow-same-version`, refreshes the hardcoded release ref in `docs/install`, runs **`npm run build`** (rebuilding **`dist/`**), asserts **`node dist/src/cli.js --version`** matches the new version, and runs **`npm run registry:build`** to regenerate **`docs/registry`**. It creates **no commits, no tags, and no `git add`** — review the diff (`git diff`), stage the changes, commit, then `git tag v<version>` and push branch + tag yourself. The CLI version is single-sourced from `package.json`'s `version` field (codegen'd into `src/version.ts` by `npm run embed-assets`).
+
+Pushing a **`v*`** tag triggers two things in this repo:
 
-Pushing a **`v*`** ref does **not** run any npm publish step from this repository: the automation checked in under **`.github/workflows/`** is **`ci.yml`** (push CI) and **`nightly-engineer.yml`** (optional manual engineer run) — **neither publishes to npm**. The same tag pattern **does** satisfy the `if:` on the **`docker-publish`** job in **`ci.yml`**, which pushes `ghcr.io/jaiphlang/jaiph-runtime` after the other CI jobs succeed.
+1. **Docker image publish** — the `docker-publish` job in `ci.yml` pushes `ghcr.io/jaiphlang/jaiph-runtime:<version>` and `:latest` after the other CI jobs succeed.
+2. **Standalone-binary release** — `.github/workflows/release.yml` cross-compiles the Bun-compiled standalone binary for four targets via `oven-sh/setup-bun` and `bun build --compile --target=…`, generates a `SHA256SUMS` file, runs a Linux x64 sanity gate (`./jaiph-linux-x64 --version` must equal `jaiph <tag-without-v>`), and uploads all five assets to the GitHub Release for the tag (creating it if needed). The release job waits for the `CI` workflow on the same SHA to succeed before publishing. Re-runs are available via `workflow_dispatch`.
 
-If you are preparing a release that includes the **npm** package, coordinate version bumps, registry publish, and smoke checks with the maintainers — that flow is intentionally outside this repo’s workflows.
+Pushes to the **`nightly`** branch follow the same matrix and upload to a **rolling prerelease** tagged `nightly` (`gh release upload nightly --clobber`), so `jaiph use nightly` keeps working under the binary installer.
+
+Pushing a **`v*`** ref does **not** run any npm publish step from this repository — `.github/workflows/` contains `ci.yml` (push CI), `release.yml` (standalone binaries; see above), and `nightly-engineer.yml` (optional manual engineer run), and **none publishes to npm**. If you are preparing a release that includes the **npm** package, coordinate version bumps, registry publish, and smoke checks with the maintainers — that flow is intentionally outside this repo's workflows.
+
+#### Release asset naming contract
+
+The installer (`docs/install`) downloads these exact filenames from the release for the resolved ref. The contract is fixed; do not rename or add architecture variants without updating the installer:
+
+| Bun target (`bun build --compile --target=…`) | Asset name |
+|----------------------------------------------|------------|
+| `bun-darwin-arm64` | `jaiph-darwin-arm64` |
+| `bun-darwin-x64`   | `jaiph-darwin-x64` |
+| `bun-linux-x64`    | `jaiph-linux-x64` |
+| `bun-linux-arm64`  | `jaiph-linux-arm64` |
+| —                  | `SHA256SUMS` (covers all four binaries) |
+
+Every release (stable `v*` and rolling `nightly`) ships exactly these five assets.
 
 ### Local docs site (Jekyll)
 
-The **Getting started (local)** CI job validates that the documentation site under `docs/` can be built and served from source. It uses Ruby 3.2 with `bundler-cache`, runs `bundle exec jekyll serve --host 127.0.0.1 --port 4000` in the background, and polls `http://127.0.0.1:4000/` for up to 30 seconds before asserting HTTP 200 on `/`, `/getting-started`, `/setup`, `/libraries`, and `/artifacts`. The same job also prepares Node, a local `jaiph-ci-runtime:local` image, Playwright Chromium, and (for samples that need them) external CLIs — see the `docs-local` job in `.github/workflows/ci.yml` for the exact package list, which can change.
+The **Getting started (local)** CI job validates that the documentation site under `docs/` can be built and served from source. It uses Ruby 3.2 with `bundler-cache`, runs `bundle exec jekyll serve --host 127.0.0.1 --port 4000` in the background, and polls `http://127.0.0.1:4000/` for up to 30 seconds before asserting HTTP 200 on `/`, `/getting-started`, `/setup`, `/libraries`, and `/artifacts`. The same job also prepares Node, a local `jaiph-ci-runtime:local` image, Playwright Chromium, and external CLIs — see the `docs-local` job in `.github/workflows/ci.yml` for the exact package list.
 
 To run the same check locally:
 
@@ -206,7 +255,7 @@ After the Jekyll smoke-check, the CI job also verifies that code samples shown o
 The test does two things:
 
 1. **Source parity** — extracts each sample's source code from the DOM (`[data-sample-source]` elements inside `[data-sample]` tab panels) and compares it byte-for-byte against the corresponding file in `examples/` (identified by `data-sample-file`).
-2. **Output verification** — for each **`[data-sample-output]`** block whose sample/output key is **not** listed in **`SKIP_OUTPUT`** (`e2e/playwright/landing-page.spec.ts`), the test parses the **`➜`** command line, runs it against the temp copy of the page source (the executable **`.jh`** from **`examples/`** named by **`data-sample-file`**, with **`say_hello.test.jh`** also copying companion **`say_hello.jh`**), and compares normalized CLI output to the block. Normalization mirrors **`e2e::normalize_output`** (ANSI, durations, `<agent-command>` / `<script-path>`, log/summary/out/err path lines collapsed to `<path>`, spacing before **`✓ PASS`**). Entries in **`SKIP_OUTPUT`** mark nondeterministic model or agent-backed tabs (e.g. **`say-hello` / success**, **`async` / run**, **`recover-loop` / run**).
+2. **Output verification** — for each **`[data-sample-output]`** block whose sample/output key is **not** listed in **`SKIP_OUTPUT`** (`e2e/playwright/landing-page.spec.ts`), the test parses the **`➜`** command line, runs it against the temp copy of the page source (the executable **`.jh`** from **`examples/`** named by **`data-sample-file`**, with **`say_hello.test.jh`** also copying companion **`say_hello.jh`**), and compares CLI output after Playwright's **`normalize()`** in that spec file. It shares core rules with **`e2e::normalize_output`** (ANSI stripping, `<time>` placeholders, `<agent-command>`, `<script-path>`) and additionally collapses Logs/Summary/out/err path lines to **`<path>`** and normalizes spacing before **`✓ PASS`** — it does **not** apply E2E-only rules such as **`__inline_<hash>`** → **`__inline_<id>`** or async subscript line sorting. Entries in **`SKIP_OUTPUT`** mark nondeterministic model or agent-backed tabs (e.g. **`say-hello` / success**, **`async` / run**, **`recover-loop` / run**).
 
 To run locally:
 
@@ -214,13 +263,15 @@ To run locally:
 npm run test:samples
 ```
 
+The suite runs **serially** (`test.describe.serial` in `landing-page.spec.ts`): the **Try it out** case installs Jaiph from the local repo first (same Node / npm / Bun requirements as [Installing from source](#installing-from-source)), then the tabbed sample checks run `./examples/…` files via the `jaiph` shebang with `~/.local/bin` prepended to **`PATH`**. Install Playwright once with `npx playwright install chromium` if you have not already (also listed in the table above).
+
 If a Jekyll server is already running on **`http://127.0.0.1:4000`**, Playwright reuses it (`reuseExistingServer` in `playwright.config.ts`). Otherwise it starts one.
 
-Samples whose rendered output embeds nondeterministic model or agent transcripts skip output comparison per-tab via **`SKIP_OUTPUT`** in **`e2e/playwright/landing-page.spec.ts`** (see [Landing-page sample verification](#landing-page-sample-verification-playwright)); those tabs still participate in DOM **source parity**.
+Samples whose rendered output embeds nondeterministic model or agent transcripts skip output comparison per-tab via **`SKIP_OUTPUT`** in **`e2e/playwright/landing-page.spec.ts`**; those tabs still participate in DOM **source parity**.
 
 ## E2E testing
 
-The E2E test suite (`e2e/tests/*.sh`) drives the toolchain from outside the TypeScript harness: **`e2e::prepare_test_env`** (via **`prepare_shared_context`** in **`e2e/lib/common.sh`**) prepends a **`jaiph` shim** to **`PATH`** (preferring **`dist/src/cli.js`** when built), sanitizes stray **`JAIPH_*`** vars, wires **`JAIPH_REPO_URL`** to the cloned tree, exports **`JAIPH_DOCKER_ENABLED=false`** by default, then each script invokes **`jaiph run`**; Docker-specific assertions set **`JAIPH_DOCKER_ENABLED=true`** and expect **`JAIPH_DOCKER_IMAGE`** (for example **`jaiph-ci-runtime:local`** on the CI **`e2e`** **docker** matrix leg). Scripts assert on both the CLI tree (**`e2e::expect_stdout`**) and **`*.out` / `.err`** / **`run_summary.jsonl`** under **`.jaiph/runs/`** — see also [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout).
+The E2E test suite (`e2e/tests/*.sh`) drives the toolchain from outside the TypeScript harness: **`e2e::prepare_test_env`** in **`e2e/lib/common.sh`** calls **`e2e::prepare_shared_context`** (sanitizes stray **`JAIPH_*`** vars, prepends **`JAIPH_E2E_BIN_DIR`** to **`PATH`**, wires **`JAIPH_REPO_URL`** to the cloned tree, exports **`JAIPH_DOCKER_ENABLED=false`** by default) and **`e2e::ensure_local_install`** (builds a **`jaiph` shim** that prefers **`dist/src/cli.js`** when present). Each script then invokes **`jaiph run`**; Docker-specific assertions set **`JAIPH_DOCKER_ENABLED=true`** and usually call **`e2e::ensure_docker_test_image`** first, then pass **`JAIPH_DOCKER_IMAGE="${E2E_DOCKER_TEST_IMAGE}"`** ( **`jaiph-e2e-runtime:local`** when the harness builds it). Scripts assert on both the CLI tree (**`e2e::expect_stdout`**) and **`*.out` / `.err`** / **`run_summary.jsonl`** under **`.jaiph/runs/`** — see also [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout).
 
 Some scripts are **contract** tests: they validate persisted machine-readable output (for example `e2e/tests/88_run_summary_event_contract.sh` and `run_summary.jsonl`) in addition to or instead of golden CLI trees.
 
@@ -241,7 +292,7 @@ E2E tests are the outermost **behavior contracts** for the CLI and runtime. Each
 
 **Normalization:** `e2e::normalize_output` (in `e2e/lib/common.sh`) strips ANSI codes, replaces timing values with `<time>`, normalizes **`__inline_<hash>`** script names to **`__inline_<id>`**, swaps some CLI-specific strings (`<agent-command>`, `<script-path>`), and **sorts** a class of async progress lines (UTF-8 subscript markers) so strict equality stays stable when parallel branches finish in different orders. This keeps full-equality heredocs usable across machines.
 
-**Where files land on disk** (directory tree, sequence prefixes): [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout). Runtime testing with `*.test.jh` is covered in [Testing](testing.md). The `run_summary.jsonl` event contract is exercised in `e2e/tests/88_run_summary_event_contract.sh`.
+**Where files land on disk** (directory tree, sequence prefixes): [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout). Runtime testing with `*.test.jh` is covered in [Write & run tests](testing.md). The `run_summary.jsonl` event contract is exercised in `e2e/tests/88_run_summary_event_contract.sh`.
 
 ### Test structure
 
@@ -309,7 +360,7 @@ All helpers are defined in `e2e/lib/common.sh`.
 | Helper | Description |
 |--------|-------------|
 | `e2e::file "name" <<'EOF' ... EOF` | Write a workflow file into the test directory from a heredoc. Creates parent directories as needed. |
-| `e2e::run "file" [args...]` | Build and run a workflow file. Returns the CLI stdout for capture. |
+| `e2e::run "file" [args...]` | Run `jaiph run` on a file in the test directory. Capture stdout with `out="$(e2e::run …)"`. |
 | `e2e::expect_fail "file" [args...]` | Assert that running the workflow fails (non-zero exit). |
 | `e2e::run_dir "file"` | Return the path of the single run directory for `file` under `.jaiph/runs/`. Fails if zero or more than one match. |
 | `e2e::run_dir_at "base" "file"` | Same as `e2e::run_dir` but searches under a custom base directory. |
@@ -363,9 +414,9 @@ rg 'e2e::assert_contains' e2e/tests -n
 
 ### Orphan sample guard
 
-Every `.jh` and `.test.jh` file under `e2e/` must be referenced by at least one test script (`e2e/tests/*.sh`, `e2e/test_all.sh`, or `e2e/lib/`). Unreferenced samples confuse contributors, hide drift from the canonical `examples/` corpus, and make it unclear which fixtures are load-bearing.
+Every top-level `.jh` and `.test.jh` file in `e2e/` must be referenced by at least one test script (`e2e/tests/*.sh`, `e2e/test_all.sh`, or `e2e/lib/`). Unreferenced samples confuse contributors, hide drift from the canonical `examples/` corpus, and make it unclear which fixtures are load-bearing.
 
-The guard script `e2e/check_orphan_samples.sh` detects orphans automatically. It scans every `.jh` and `.test.jh` file under `e2e/`, checks whether its basename appears in any test runner or helper, and also resolves indirect references (a file imported by another `.jh` that is itself referenced counts as covered). Any file that is neither directly nor indirectly referenced is reported as an orphan.
+The guard script `e2e/check_orphan_samples.sh` detects orphans automatically. It scans top-level `e2e/*.jh` and `e2e/*.test.jh` only (not nested paths), checks whether each basename appears in any test runner or helper, and also resolves indirect references (a file imported by another `.jh` that is itself referenced counts as covered). Any file that is neither directly nor indirectly referenced is reported as an orphan.
 
 ```bash
 # Run manually from the repo root
diff --git a/docs/env-vars.md b/docs/env-vars.md
new file mode 100644
index 00000000..5f232352
--- /dev/null
+++ b/docs/env-vars.md
@@ -0,0 +1,136 @@
+---
+title: Environment variables
+permalink: /reference/env-vars
+diataxis: reference
+redirect_from:
+  - /env-vars
+  - /env-vars.md
+---
+
+# Environment variables
+
+This page is the canonical inventory of every environment variable Jaiph reads from process state. It aggregates `JAIPH_*` variables read by the TypeScript runtime/CLI (`src/`), the vendor credentials Jaiph checks before launching workflows, and the host-side variables the installer script consumes.
+
+For role-oriented overviews see [Configuration](configuration.md), [CLI](cli.md), and [Sandboxing](sandboxing.md). For the credential pre-flight contract see [Authenticate agent backends](/how-to/agent-auth).
+
+Symbols used below:
+
+- **Type** — `string`, `path`, `bool` (the literal text `"true"` / `"1"` enables; anything else disables, with per-variable rules noted), `int` (decimal milliseconds or seconds), `int-list` (comma-separated non-negative integers).
+- **Scope** — `host` = read by the host CLI before spawning the runner; `runtime` = read inside the workflow runner (and inside the Docker container when forwarded); `internal` = set automatically by the CLI on the child process and must not be exported manually.
+- **Default** — `—` means the variable has no built-in default (an absent value disables the feature, or the surrounding code falls back to a config-key default).
+
+## Runtime, CLI, and internal variables
+
+The table below covers every `JAIPH_*` name read from `process.env` / `env` in `src/`. It is bidirectionally pinned by the docs-lint harness — a `JAIPH_*` name added or removed in source must be added or removed here in the same change.
+
+<!-- begin: src-parity -->
+
+| Variable | Scope | Type | Default | Related config | Role |
+|---|---|---|---|---|---|
+| `JAIPH_AGENT_BACKEND` | host, runtime | string (`cursor`, `claude`, `codex`) | `cursor` | `agent.backend` | Selects the `prompt` backend. Locked once seen in the parent env. |
+| `JAIPH_AGENT_BACKEND_LOCKED` | internal | bool | — | — | Set to `1` by the CLI when `JAIPH_AGENT_BACKEND` was inherited; blocks lower-precedence layers from overriding. |
+| `JAIPH_AGENT_CLAUDE_FLAGS` | host, runtime | string (whitespace-split) | — | `agent.claude_flags` | Extra flags appended to the Claude CLI invocation. |
+| `JAIPH_AGENT_CLAUDE_FLAGS_LOCKED` | internal | bool | — | — | Lock flag for `JAIPH_AGENT_CLAUDE_FLAGS`. |
+| `JAIPH_AGENT_COMMAND` | host, runtime | string | `cursor-agent` | `agent.command` | Executable line for the Cursor backend. A basename other than `cursor-agent` selects custom-command mode (stdin → command → stdout). |
+| `JAIPH_AGENT_COMMAND_LOCKED` | internal | bool | — | — | Lock flag for `JAIPH_AGENT_COMMAND`. |
+| `JAIPH_AGENT_CURSOR_FLAGS` | host, runtime | string (whitespace-split) | — | `agent.cursor_flags` | Extra flags appended to the Cursor backend invocation. |
+| `JAIPH_AGENT_CURSOR_FLAGS_LOCKED` | internal | bool | — | — | Lock flag for `JAIPH_AGENT_CURSOR_FLAGS`. |
+| `JAIPH_AGENT_MODEL` | host, runtime | string | — | `agent.default_model` | Default model for `prompt` steps. |
+| `JAIPH_AGENT_MODEL_LOCKED` | internal | bool | — | — | Lock flag for `JAIPH_AGENT_MODEL`. |
+| `JAIPH_AGENT_TRUSTED_WORKSPACE` | host, runtime | path | workspace root | `agent.trusted_workspace` | Directory passed to Cursor as `--trust`. Rewritten to `/jaiph/workspace`-relative on Docker forwarding when inside the workspace. |
+| `JAIPH_AGENT_TRUSTED_WORKSPACE_LOCKED` | internal | bool | — | — | Lock flag for `JAIPH_AGENT_TRUSTED_WORKSPACE`. |
+| `JAIPH_ARTIFACTS_DIR` | runtime | path | `<run_dir>/artifacts` | — | Absolute path to the writable artifacts directory for the current run. Set by the runtime; read by `jaiphlang/artifacts` and user scripts. |
+| `JAIPH_CODEX_API_URL` | runtime | string | `https://api.openai.com/v1/chat/completions` | — | Chat-completions endpoint for the `codex` backend. |
+| `JAIPH_DEBUG` | host, runtime | bool (exact `"true"`) | `false` | `run.debug` | Enable debug tracing for the run. |
+| `JAIPH_DEBUG_LOCKED` | internal | bool | — | — | Lock flag for `JAIPH_DEBUG`. |
+| `JAIPH_DOCKER_ENABLED` | host | bool (exact `true`) | — | — | Force Docker on (`true`) or off (any other value). When unset, Docker is on unless `JAIPH_UNSAFE=true`. |
+| `JAIPH_DOCKER_IMAGE` | host | string | `ghcr.io/jaiphlang/jaiph-runtime:<version>` | `runtime.docker_image` | Container image. Must already contain `jaiph`. |
+| `JAIPH_DOCKER_KEEP_SANDBOX` | host | bool (`1` / `true`) | `false` | — | Copy mode only — when enabled, leave the host-side `.sandbox-<id>/` clone on disk after exit for debugging. |
+| `JAIPH_DOCKER_NETWORK` | host | string (`default`, `none`, or named network) | `default` | `runtime.docker_network` | `docker run --network` value. `none` disables egress. |
+| `JAIPH_DOCKER_NO_OVERLAY` | host | bool (`1` / `true`) | `false` | — | Force copy mode even when `/dev/fuse` is available. |
+| `JAIPH_DOCKER_TIMEOUT` | host | int (seconds) | `14400` (4h) | `runtime.docker_timeout_seconds` | Container execution timeout. `0` disables. Invalid values produce `E_DOCKER_TIMEOUT`. |
+| `JAIPH_INBOX_MAX_DISPATCH` | runtime | int | `1000` | — | Maximum inbox messages a single workflow frame may drain before aborting with `E_INBOX_DISPATCH_LIMIT`. |
+| `JAIPH_INBOX_PARALLEL` | — | — | — | — | Unused — the runtime does not read this variable (tests assert setting it has no effect on inbox dispatch order). |
+| `JAIPH_INPLACE` | host | bool (`1` / `true`) | `false` | — | Opt into inplace sandbox mode (host workspace bind-mounted read-write). Not forwarded into the container. |
+| `JAIPH_INPLACE_YES` | host | bool (`1` / `true`) | `false` | — | Auto-confirm the inplace destructive-edit prompt. Required when `JAIPH_INPLACE` is set and stdin is not a TTY. Not forwarded into the container. |
+| `JAIPH_INSTALL_COMMAND` | host | string | `curl -fsSL https://jaiph.org/install \| bash` | — | Command `jaiph use` re-invokes to reinstall. |
+| `JAIPH_LIB` | host | path | — | — | Removed from the product. The CLI strips it from the launched env before each run. |
+| `JAIPH_META_FILE` | internal | path | — | — | Absolute path to the run-metadata file. Set on the detached workflow runner child; stripped from the parent env before launch. |
+| `JAIPH_MOCK_PROMPT_ARMS_JSON` | runtime | string (JSON) | — | — | Test-only — injects a mock-arm dispatch table for `prompt` steps. Set by `jaiph test`. |
+| `JAIPH_MOCK_RESPONSES_JSON` | runtime | string (JSON) | — | — | Test-only — supplies sequential mock prompt responses. Set by `jaiph test`. |
+| `JAIPH_MODULE_GRAPH_FILE` | internal | path | — | — | Absolute path to the serialized `ModuleGraph` JSON. Set by the CLI only on the default local (non-Docker, non-`--raw`) `jaiph run` path. |
+| `JAIPH_NON_TTY_HEARTBEAT_FIRST_SEC` | host | int (seconds) | `60` | — | Seconds before the first non-TTY heartbeat line. |
+| `JAIPH_NON_TTY_HEARTBEAT_INTERVAL_MS` | host | int (ms; floor `250`) | `30000` | — | Minimum interval between subsequent non-TTY heartbeat lines. |
+| `JAIPH_PRECEDING_FILES` | host | string | — | — | Removed from the product. Stripped from the launched env. |
+| `JAIPH_PROMPT_COMPLETION_GRACE_SECONDS` | runtime | int (seconds) | `30` | — | Prompt watchdog — once the backend emits its terminal `result` event, the grace period it may take to exit before Jaiph terminates it and returns success. Guards the case where `claude -p` finishes the work but never exits. `0` disables. |
+| `JAIPH_PROMPT_FINAL_FILE` | runtime | path | — | — | Optional path; when set, `executePrompt` writes the final assistant message there. Jaiph does not set this automatically. |
+| `JAIPH_PROMPT_IDLE_TIMEOUT_SECONDS` | runtime | int (seconds) | `900` (15m) | — | Prompt watchdog — terminate the backend and fail the prompt (feeding the retry backoff) when it produces no stdout/stderr for this long. `0` disables. |
+| `JAIPH_PROMPT_MAX_SECONDS` | runtime | int (seconds) | `7200` (2h) | — | Prompt watchdog — absolute wall-clock cap on a single prompt invocation regardless of activity; on expiry the backend is terminated and the prompt fails into the retry backoff. `0` disables. |
+| `JAIPH_PROMPT_RETRY` | runtime | bool (`0` disables) | enabled | — | Set to `0` to skip the prompt retry backoff. `jaiph test` defaults to `0` so mock failures fail fast. |
+| `JAIPH_PROMPT_RETRY_DELAYS` | runtime | int-list (ms) | `15000,60000,600000,1800000,7200000` | — | Override the prompt retry delay schedule. Invalid entries abort the prompt. |
+| `JAIPH_REGISTRY` | host | path or URL | `https://jaiph.org/registry` | — | Source of the lib registry index used by `jaiph install <name>`. Disk paths (no scheme or `file://`) are read locally; everything else is fetched. |
+| `JAIPH_RUN_DIR` | internal | path | — | — | Absolute path to the active run directory. Set by the runtime inside the runner. |
+| `JAIPH_RUN_ID` | internal | string (UUID) | runner-generated | — | Stable run identifier. Set by the host CLI on the default (non-`--raw`) `jaiph run` path; otherwise the runner generates one at startup. Forwarded into Docker when set. |
+| `JAIPH_RUN_SUMMARY_FILE` | internal | path | `<run_dir>/run_summary.jsonl` | — | Absolute path the runtime writes durable summary events to. |
+| `JAIPH_RUNS_DIR` | host, runtime | path | `.jaiph/runs` under the workspace | `run.logs_dir` | Root directory for run logs. Inside Docker the host CLI overrides this to `/jaiph/run`. |
+| `JAIPH_RUNS_DIR_LOCKED` | internal | bool | — | — | Lock flag for `JAIPH_RUNS_DIR`. |
+| `JAIPH_SCRIPTS` | internal | path | — | — | Directory of emitted `script` files for this run. Set after `buildScripts()`. Any parent-shell value is cleared before launch. |
+| `JAIPH_SKILL_PATH` | host | path | — | — | When set and the path exists, `jaiph init` writes `.jaiph/SKILL.md` from that file. Otherwise the CLI walks an install-relative search. |
+| `JAIPH_SOURCE_ABS` | internal | path | — | — | Absolute path to the entry `.jh` file. Set by the CLI before spawning the runner. |
+| `JAIPH_SOURCE_FILE` | internal | string (basename) | entry-file basename | — | Used to name run directories. |
+| `JAIPH_STDLIB` | host | path | — | — | Removed from the product. Stripped from the launched env. |
+| `JAIPH_TEST_MODE` | runtime | bool (exact `"1"`) | `false` | — | Set by `jaiph test` so the runtime skips production-only branches (e.g. file-mode normalization). |
+| `JAIPH_UNSAFE` | host | bool (`true` only) | `false` | — | Disable Docker for this run; execute on the host. `--unsafe` is the `jaiph run` flag form. |
+| `JAIPH_WORKSPACE` | host, runtime | path | autodetected | — | Workspace root. Inside Docker the host CLI overrides this to `/jaiph/workspace`. |
+
+<!-- end: src-parity -->
+
+## Agent credentials
+
+The host CLI checks these before spawning the runner or container when [credential pre-flight](configuration.md#credential-pre-flight) applies. Pre-flight is skipped when the entry file declares no explicit backend and uses no `prompt` step, on `jaiph run --raw`, and when `JAIPH_UNSAFE=true`. See [Authenticate agent backends](/how-to/agent-auth) for per-backend rules and [Sandboxing](sandboxing.md) for which credentials cross the container boundary.
+
+| Variable | Backend | Host behaviour | Docker behaviour | Notes |
+|---|---|---|---|---|
+| `ANTHROPIC_API_KEY` | `claude` | warning if absent | hard error (`E_AGENT_CREDENTIALS`) | Either this **or** `CLAUDE_CODE_OAUTH_TOKEN` satisfies Claude. |
+| `CLAUDE_CODE_OAUTH_TOKEN` | `claude` | warning if absent | hard error (`E_AGENT_CREDENTIALS`) | Long-lived OAuth token from `claude setup-token`. |
+| `CURSOR_API_KEY` | `cursor` | warning if absent | hard error (`E_AGENT_CREDENTIALS`) | A stored `cursor-agent login` may still work on host runs. |
+| `OPENAI_API_KEY` | `codex` | hard error (`E_AGENT_CREDENTIALS`) | hard error (`E_AGENT_CREDENTIALS`) | No CLI-login fallback. `OPENAI_*` is outside the Docker forwarding allowlist, so sandboxed runs fail preflight even when the key is set on the host. |
+
+Forwarding allowlist prefixes into the Docker container: `JAIPH_*` (except `JAIPH_DOCKER_*`, `JAIPH_INPLACE`, and `JAIPH_INPLACE_YES`), `ANTHROPIC_*`, `CLAUDE_*`, `CURSOR_*`. Everything else — including `OPENAI_*` — is silently dropped — see [Sandboxing](sandboxing.md).
+
+## Installer and `jaiph use`
+
+These variables are consumed by `docs/install` (the installer shell script) and by `jaiph use` when it re-invokes the installer. They are **not** read from inside the Jaiph TypeScript source.
+
+| Variable | Type | Default | Role |
+|---|---|---|---|
+| `JAIPH_REPO_REF` | string | `v0.10.0` (installer default when unset) | Release ref the installer downloads (`v0.10.0`, `nightly`, …). `jaiph use <version>` sets this to `v<version>` or `nightly`. |
+| `JAIPH_BIN_DIR` | path | `$HOME/.local/bin` | Target bin directory for the installed `jaiph` binary. |
+| `JAIPH_RELEASE_BASE_URL` | string | `https://github.com/jaiphlang/jaiph/releases/download/<ref>` | Override the GitHub Release base URL the installer downloads from. |
+| `JAIPH_REPO_URL` | path | — | Local repo path (directory containing `package.json`) for the from-source installer branch (`docs/install-from-local.sh`). Ignored on the binary-download path. |
+
+## Docker sandbox failure modes
+
+These error codes surface during Docker-backed `jaiph run` invocations. They are emitted to stderr (and to the failure footer) and produce non-zero exit codes. Most are `E_DOCKER_*`; `E_TIMEOUT`, `E_VALIDATE_MOUNT`, and `E_FLAG_CONFLICT` appear in Docker contexts but are not strictly Docker-scoped.
+
+| Code | Trigger | Behaviour |
+|---|---|---|
+| `E_DOCKER_NOT_FOUND` | `docker info` fails (Docker not installed or daemon not running). | Run exits before launch. No fallback to local execution. |
+| `E_DOCKER_PULL` | `docker pull` fails (network error, image not found, auth failure). | Run exits before launch. |
+| `E_DOCKER_NO_JAIPH` | Selected image does not contain a `jaiph` CLI. | Run exits before launch. |
+| `E_DOCKER_RUNS_DIR` | Absolute `JAIPH_RUNS_DIR` points outside the workspace. | Run exits before launch. |
+| `E_DOCKER_OVERLAY` | Overlay mode selected but `fuse-overlayfs` is missing or the mount fails. | Container exits with code 78. |
+| `E_DOCKER_TIMEOUT` | `JAIPH_DOCKER_TIMEOUT` is empty, non-numeric, negative, or has trailing junk; or `runtime.docker_timeout_seconds` is negative. | Run exits before launch. |
+| `E_DOCKER_UID` | Linux host UID/GID detection failed. | Run exits before launch. |
+| `E_DOCKER_SANDBOX_COPY` | Copy mode failed to clone the host workspace. | Run exits before launch. |
+| `E_DOCKER_INPLACE_NO_CONFIRM` | `JAIPH_INPLACE` is set but stdin is not a TTY and `JAIPH_INPLACE_YES` is not set. | Run exits before launch. |
+| `E_FLAG_CONFLICT` | `--inplace` / `JAIPH_INPLACE` and `--unsafe` / `JAIPH_UNSAFE=true` are both set. | Run exits before launch. |
+| `E_VALIDATE_MOUNT` | Mount targets a denied host path (`/`, `/proc`, docker socket, etc.). | Run exits before launch. |
+| `E_TIMEOUT` | Container runs longer than the effective Docker timeout. | Container receives SIGTERM, then SIGKILL after 5s grace. |
+| `E_AGENT_CREDENTIALS` | Credential pre-flight detected a missing agent credential. | Run exits before launch. |
+
+## Related
+
+- [Configuration](configuration.md) — config keys and their environment-variable equivalents.
+- [CLI](cli.md) — commands and flags that front-end these variables.
+- [Sandboxing](sandboxing.md) — what the Docker sandbox protects and what it does not.
diff --git a/docs/first-agent-run.md b/docs/first-agent-run.md
new file mode 100644
index 00000000..6088e5db
--- /dev/null
+++ b/docs/first-agent-run.md
@@ -0,0 +1,171 @@
+---
+title: Your first agent + sandboxed run
+permalink: /tutorials/first-agent-run
+diataxis: tutorial
+---
+
+# Your first agent + sandboxed run
+
+This tutorial builds on [Your first workflow](/tutorials/first-workflow). You already have the `jaiph` CLI on `PATH`, you have run a script-only workflow, and you have inspected the artifacts under `.jaiph/runs/`. Here you will add a `prompt` step that calls an agent backend, then run the same workflow inside the Docker sandbox so the agent's actions stay isolated from your host.
+
+## What you will build
+
+A two-step workflow: one `ensure` step that validates a name with a `rule`, and one `prompt` step that asks an agent to greet that name. The workflow runs in Docker by default.
+
+## Prerequisites — credentials
+
+`prompt` steps call an agent backend. Before spawning the runner or Docker container, the CLI runs a [credential pre-flight](/how-to/agent-auth). Under Docker, missing credentials are a hard error (`E_AGENT_CREDENTIALS`) — host-side stored CLI logins (`~/.claude`, macOS Keychain, `cursor-agent login`) do **not** cross the container boundary. On host-only runs, `claude` and `cursor` may warn instead of aborting when a stored CLI login might still work.
+
+Pick one backend and set its env var on the host:
+
+```bash
+# Cursor (the default backend if nothing else is configured)
+export CURSOR_API_KEY="..."
+
+# Claude
+export ANTHROPIC_API_KEY="sk-ant-..."
+# or, after running `claude setup-token`:
+export CLAUDE_CODE_OAUTH_TOKEN="..."
+
+# Codex (OpenAI)
+export OPENAI_API_KEY="sk-..."
+```
+
+For the full per-backend matrix (which CLI logins fall back, which env vars Docker forwards), see [Authenticate agent backends](/how-to/agent-auth).
+
+## Prerequisites — Docker
+
+Install Docker and confirm:
+
+```bash
+docker info
+```
+
+Docker is on by default for `jaiph run`. There is no `--docker` flag — sandboxing is driven by `JAIPH_DOCKER_ENABLED` / `JAIPH_UNSAFE`. The CLI picks a workspace-presentation mode automatically:
+
+- **Overlay mode** when `/dev/fuse` exists (typically Linux).
+- **Copy mode** when `/dev/fuse` is missing (typically macOS Docker Desktop).
+
+Both modes leave your host workspace unmodified at run end. See [Run in a Docker sandbox](/how-to/sandbox-run) for inplace mode (live host edits, opt-in) and for the CLI-line / env-var matrix.
+
+## 1. Configure the backend (optional)
+
+If you set `CURSOR_API_KEY` above, skip this step — `cursor` is the default backend. Otherwise, add a module-level `config { … }` block to the top of your file so the entry workflow picks your backend.
+
+The full file you build in this tutorial is:
+
+```jh
+config {
+  agent.backend = "claude"
+  agent.default_model = "sonnet-4"
+}
+
+rule valid_name(name_arg) {
+  return match name_arg {
+    /[A-Z][a-z]+/ => name_arg
+    "" => fail "You didn't provide your name :("
+    _ => fail "You provided an invalid name :("
+  }
+}
+
+workflow default(name_arg) {
+  const name = ensure valid_name(name_arg)
+
+  const response = prompt """
+    Say hello to ${name} and add one fun fact about a person with the same name.
+    Respond with a single line. Do not inspect files or run tools.
+  """
+
+  return response
+}
+```
+
+Three pieces of new syntax compared with [Your first workflow](/tutorials/first-workflow):
+
+- `config { agent.backend = "claude" }` selects the agent backend at module scope. Drop the block entirely to use the `cursor` default, or set `JAIPH_AGENT_BACKEND` in the environment to override either form (env wins; see [Configure backend & model](/how-to/configure-backend)).
+- `rule valid_name(name_arg) { … }` is a read-only validator. Rules cannot use `prompt` or raw shell — they enforce structure on inputs before the workflow continues. `ensure valid_name(name_arg)` runs the rule and aborts the workflow with the failure message if any arm matches `fail`.
+- `prompt """ … """` is a managed agent call. The triple-quoted body is dedented at parse time and sent to the selected backend's CLI; the agent's stdout is captured as the step value. The `${name}` substitution happens before the prompt is sent.
+
+Save the file as `greet.jh`.
+
+## 2. Run it in the Docker sandbox
+
+```bash
+jaiph run ./greet.jh "Adam"
+```
+
+The CLI does a few things before any workflow step runs:
+
+1. **Loads the module graph** (parses the entry file — one file in this tutorial).
+2. **Resolves Docker mode**: picks overlay (`fusefs` banner) when `/dev/fuse` is present, copy (`tmp workspace`) otherwise.
+3. **Runs the credential pre-flight** for the selected backend. Under Docker, missing env vars abort with `E_AGENT_CREDENTIALS` — no container is launched.
+4. **Pulls the runtime image** (`ghcr.io/jaiphlang/jaiph-runtime:<version>`) if it is not already local. Status lines stream on stderr before the banner.
+5. **Validates the module, emits scripts, prints the banner**, then **spawns the container** — workspace mounted read-only (overlay) or as a disposable clone (copy), and `.jaiph/runs/` read-write for artifacts.
+
+You should see (timings, model output, and exact step name will differ):
+
+```text
+Jaiph: Running greet.jh (Docker sandbox, fusefs)
+
+workflow default (name_arg="Adam")
+  ▸ rule valid_name (name_arg="Adam")
+  ✓ rule valid_name (0s)
+  ▸ prompt claude "Say hello to ${name} and..." (name="Adam")
+  ✓ prompt claude (5s)
+
+✓ PASS workflow default (5.1s)
+
+Hello, Adam — Adam Smith, the 18th-century Scottish economist, is often called the father of modern economics.
+```
+
+Three things to notice:
+
+- The `(Docker sandbox, fusefs)` / `(Docker sandbox, tmp workspace)` banner confirms isolation is on.
+- The `prompt` step line names the backend (`claude` here) and a truncated preview of the prompt body. The full body is in `run_summary.jsonl`.
+- The line printed after `PASS` is `workflow default`'s return value (`return response`).
+
+## 3. Make the rule reject a bad name
+
+Re-run with an empty string so `valid_name` matches the `""` arm:
+
+```bash
+jaiph run ./greet.jh ""
+```
+
+The output ends with the failure footer:
+
+```text
+  ▸ rule valid_name
+  ✗ rule valid_name (0s)
+
+✗ FAIL workflow default (0.3s)
+  Logs: …/.jaiph/runs/…
+  Summary: …/run_summary.jsonl
+    out: …/000002-rule__valid_name.out
+    err: …/000002-rule__valid_name.err
+
+  Output of failed step:
+    You didn't provide your name :(
+```
+
+The `prompt` step is never reached — `ensure` aborted the workflow when the rule failed. The captured `.err` file is the source for the `Output of failed step:` excerpt. Under Docker, container-internal `/jaiph/run/*` paths are remapped to host paths before the footer is printed, so the paths you see point at your host workspace.
+
+## 4. Inspect the prompt record
+
+Each `prompt` step writes a `PROMPT_START` and `PROMPT_END` line to `run_summary.jsonl`. Filter the latest run:
+
+```bash
+jq -c 'select(.type=="PROMPT_START")' .jaiph/runs/*/*/run_summary.jsonl | tail -1
+```
+
+The record includes the resolved `backend`, the `model` (when one was set), and a `model_reason` of `explicit`, `flags`, or `backend-default` — the same information [Configure backend & model](/how-to/configure-backend) uses to verify config precedence.
+
+## Where to go next
+
+You now have a working agent workflow under Docker. Useful next directions:
+
+- [Reference — Language](/reference/language) — every step type, including `run async`, `match`, `for_lines`, `send`, and `if`.
+- [Spec: Async Handles](/spec-async-handles) — fan out two `prompt` steps in parallel and rendezvous at the end of the workflow.
+- [Inbox & Dispatch](/inbox) — route work between workflows without tight coupling.
+- [Sandboxing](/sandboxing) — the threat model: what the Docker sandbox protects against and what it does not.
+- [Write & run tests](/how-to/testing) — author a `*.test.jh` file with mock prompts so the workflow stays deterministic in CI.
diff --git a/docs/first-workflow.md b/docs/first-workflow.md
new file mode 100644
index 00000000..563938a7
--- /dev/null
+++ b/docs/first-workflow.md
@@ -0,0 +1,148 @@
+---
+title: Your first workflow
+permalink: /tutorials/first-workflow
+diataxis: tutorial
+redirect_from:
+  - /getting-started
+  - /getting-started.md
+---
+
+# Your first workflow
+
+This is a learning-oriented walkthrough. By the end of it you will have authored a single `.jh` file, run it with the `jaiph` CLI, watched the live progress tree, and inspected the durable artifacts the runtime wrote under `.jaiph/runs/`.
+
+This tutorial deliberately uses **only `script` steps** — no agent backend, no API keys, no Docker. The follow-up tutorial [Your first agent + sandboxed run](/tutorials/first-agent-run) adds a `prompt` step and the Docker sandbox on top of what you build here.
+
+## What you will build
+
+A workflow that runs one script step which prints a greeting, and a `return` step that propagates the script's output as the workflow's return value. The whole file is five lines.
+
+## Prerequisites
+
+- A POSIX shell (`sh`, `bash`, `zsh`) with `curl` and either `shasum` or `sha256sum` available.
+- About five minutes.
+
+Node, Docker, and API keys are **not** required for this tutorial. Runs use `jaiph run --unsafe` so execution stays on the host (Docker is on by default for `jaiph run`).
+
+## 1. Install the CLI
+
+Install the standalone binary:
+
+```bash
+curl -fsSL https://jaiph.org/install | bash
+```
+
+The installer downloads a per-platform binary, verifies its checksum, and writes it to `~/.local/bin/jaiph`. See [Install & switch versions](/how-to/install) for alternatives (npm, `JAIPH_BIN_DIR`, version switching).
+
+Confirm the install:
+
+```bash
+jaiph --version
+```
+
+If the command is not found, prepend the install directory to `PATH`:
+
+```bash
+export PATH="$HOME/.local/bin:$PATH"
+```
+
+## 2. Author the workflow
+
+Create a fresh directory and write a file named `hello.jh`:
+
+```jh
+script greet = `echo "Hello, ${1:-world}!"`
+
+workflow default(who) {
+  return run greet(who)
+}
+```
+
+Three things are happening:
+
+- `` script greet = `…` `` declares a managed script with a single-line bash body. For multi-line bodies, use a fenced block (`` script greet = ```bash … ```) — the fence tag selects the interpreter (`node`, `python3`, etc.); see [Grammar — Script RHS](/reference/grammar#definitions). Script bodies use shell positional args (`$1`, `$2`, …), not Jaiph `${name}` interpolation; `${1:-world}` is bash default expansion when `run greet(...)` passes no value.
+- `workflow default(who)` is the entry workflow. Every `.jh` file invoked with `jaiph run` enters at `workflow default`. The `who` parameter is bound positionally from CLI arguments after the file path.
+- `return run greet(who)` calls the script with `who` as `${1}`, captures its stdout as the step value, and returns it as the workflow's return value.
+
+## 3. Run it
+
+```bash
+jaiph run --unsafe ./hello.jh "Adam"
+```
+
+`--unsafe` sets `JAIPH_UNSAFE=true` for this run only and skips the Docker sandbox. Two notes on what happens before any step runs:
+
+- The CLI loads the entry file plus its import closure into a `ModuleGraph` once (this file has no imports, so the closure is one module).
+- The CLI validates the graph and emits each `script` body as an executable file under a temp `scripts/` directory referenced by `$JAIPH_SCRIPTS`. Workflow steps stay as interpreted AST — there is no transpiled `default.sh`.
+
+You should see this (timings will differ):
+
+```text
+Jaiph: Running hello.jh (no sandbox)
+
+workflow default (who="Adam")
+  ▸ script greet (1="Adam")
+  ✓ script greet (0s)
+
+✓ PASS workflow default (0.2s)
+
+Hello, Adam!
+```
+
+The first line is the sandbox banner. The `workflow default` row and the indented `▸` / `✓` rows are the live progress tree (`▸` = step started, `✓` = step completed; `(0s)` is per-step elapsed time). The root workflow row is static; only nested steps emit `▸` / `✓` lines. The blank line and `Hello, Adam!` after `PASS` are the workflow **return value** — `jaiph run` prints it on stdout after a successful run.
+
+The `(no sandbox)` banner reflects `--unsafe`: the workflow runs on the host with no container. Omit `--unsafe` and `jaiph run` uses the [Docker sandbox by default](/how-to/sandbox-run); the banner then reads `(Docker sandbox, fusefs)` or `(Docker sandbox, tmp workspace)` depending on the host. If Docker is enabled but the daemon is unavailable, the CLI exits with `E_DOCKER_NOT_FOUND` rather than falling back to the host.
+
+## 4. Inspect the run artifacts
+
+Every run writes durable files under `.jaiph/runs/<YYYY-MM-DD>/<HH-MM-SS>-<entry>/` in UTC. List the most recent run:
+
+```bash
+ls -la .jaiph/runs/*/*/
+```
+
+The layout you should see:
+
+- `000001-workflow__default.out` / `.err` — captured stdout/stderr for the entry workflow step.
+- `000002-script__greet.out` / `.err` — captured stdout/stderr for the `greet` script step.
+- `return_value.txt` — the value `workflow default` returned (success only).
+- `run_summary.jsonl` — the durable event timeline (`WORKFLOW_START`, `STEP_START`, `STEP_END`, `WORKFLOW_END`, …).
+- `heartbeat` — epoch-ms liveness file refreshed about every 10s while the run is active.
+
+Read the captured script output and the return value:
+
+```bash
+cat .jaiph/runs/*/*/000002-script__greet.out
+cat .jaiph/runs/*/*/return_value.txt
+```
+
+Both should match the line printed after `PASS`. The full artifact layout is pinned in [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout); the event types in `run_summary.jsonl` are documented in [CLI Reference — Run artifacts](/reference/cli#run-artifacts).
+
+## 5. Make it fail (and observe the failure footer)
+
+Replace the script body with one that exits non-zero:
+
+```jh
+script greet = `echo "Hello, ${1:-world}!" && exit 7`
+
+workflow default(who) {
+  return run greet(who)
+}
+```
+
+Re-run with the same arguments:
+
+```bash
+jaiph run --unsafe ./hello.jh "Adam"
+```
+
+The CLI prints a `✗ FAIL` line on stderr, a `Logs:` / `Summary:` / `out:` / `err:` block pointing to the run directory, and an `Output of failed step:` excerpt. The process exits non-zero. `return_value.txt` is **not** written on failure — only success.
+
+## Where to go next
+
+Revert the failing script body so the workflow passes again, then pick a direction:
+
+- [Your first agent + sandboxed run](/tutorials/first-agent-run) — add a `prompt` step that calls an agent backend, and run the workflow inside the Docker sandbox.
+- [Reference — Language](/reference/language) — every step type and expression kind, with allowed positions and capture rules.
+- [Reference — CLI](/reference/cli) — every `jaiph` subcommand and flag.
+- [Architecture](architecture.md) — how the CLI, parser, validator, transpiler, runtime, and contracts fit together.
diff --git a/docs/getting-started.md b/docs/getting-started.md
deleted file mode 100644
index 0c0a84cd..00000000
--- a/docs/getting-started.md
+++ /dev/null
@@ -1,41 +0,0 @@
----
-title: Getting started
-permalink: /getting-started
-redirect_from:
-  - /getting-started.md
----
-
-# Getting started
-
-**Jaiph** is a language and runtime for defining and orchestrating AI agent workflows.
-
-It allows you to combine agentic workflows with strict checks and script calls. It comes with built-in Docker sandboxing for agentic workflows, and a set of tooling to make your development faster and more efficient.
-
-## Setup
-
-- **[Setup and installation](setup.md)** — Install the CLI, run a one-liner sample without cloning, execute workflows, format sources, and initialize a project with `.jaiph/` and workspace conventions.
-- **[Libraries](libraries.md)** — Install git-based `.jh` modules under `.jaiph/libs/`, pin versions with a lockfile, and import them with paths like **`"lib-name/rest"`** (first segment is the folder under `.jaiph/libs/`).
-
-## Language
-
-- **[Language](language.md)** — Practical guide to rules, scripts, prompts, workflows, and imports, with patterns you can copy.
-- **[Inbox & Dispatch](inbox.md)** — Named channels and `send` for routing work between workflows without tight coupling.
-- **[Testing](testing.md)** — `*.test.jh` suites, mocks, and assertions for deterministic checks around workflows.
-- **[Spec: Async Handles](spec-async-handles.md)** — `Handle<T>` resolution, implicit join, and interaction with `run async`.
-- **[Grammar](grammar.md)** — Formal syntax, types, and step contracts for the whole surface area.
-
-## Runtime
-
-- **[CLI](cli.md)** — `jaiph run`, `test`, `compile`, `format`, `init`, `install`, `use`, flags, environment variables, and [file-path shorthand](cli.md#file-shorthand) for existing `.jh` / `*.test.jh` files. **`jaiph compile`** walks the import closure and runs **`validateReferences` only** — no **`scripts/`** emission, no **`buildRuntimeGraph()`**, no runner ([Architecture — Summary](architecture.md#summary); directory discovery skips **`*.test.jh`** unless you pass a test file explicitly).
-- **[Configuration](configuration.md)** — `config { }` blocks, agent backends, logging, and runtime options (including env overrides).
-- **[Runtime artifacts](artifacts.md)** — What Jaiph writes under `.jaiph/runs/` (per-step captures, **`run_summary.jsonl`**, optional **`inbox/`** files) versus live **`__JAIPH_EVENT__`** lines on stderr for progress and hooks.
-- **[Hooks](hooks.md)** — Project or user `hooks.json` to run shell commands on workflow and step lifecycle events (hooks run on the **host** CLI even when the workflow runs in Docker).
-- **[Sandboxing](sandboxing.md)** — Docker-backed isolation for **`jaiph run` only** (beta; **on by default** when **`JAIPH_DOCKER_ENABLED`** is unset and **`JAIPH_UNSAFE`** is not **`true`**). Enablement is **environment-only** — use **`JAIPH_DOCKER_ENABLED`** and **`JAIPH_UNSAFE`** as described in [Enabling Docker](sandboxing.md#enabling-docker); workflow **`config` cannot turn Docker on or off**. There is no **`jaiph run --docker`** flag. Image, network, and timeout still come from **`runtime.*`** and **`JAIPH_DOCKER_*`** where applicable ([Configuration](configuration.md)). **`jaiph test`** does not use Docker ([Architecture — Test runner integration](architecture.md#test-runner-integration-testjh-in-the-kernel)).
-
-## Other
-
-- **[VS Code extension](https://marketplace.visualstudio.com/items?itemName=jaiph.jaiph-syntax-vscode)** — Syntax highlighting, formatting, and compile feedback in the editor.
-- **[Architecture](architecture.md)** — How the CLI, parser, transpiler, Node runtime, and contracts fit together; aimed at contributors and deep dives.
-- **[Contributing](contributing.md)** — Clone-and-build workflow, branch strategy, test layers, and how to propose changes.
-- **[Agent Skill](jaiph-skill.md)** — Short, opinionated defaults for AI assistants authoring and running Jaiph in a repo (same content as the canonical raw URL: `https://raw.githubusercontent.com/jaiphlang/jaiph/refs/heads/main/docs/jaiph-skill.md`).
-- **[Examples](https://github.com/jaiphlang/jaiph/tree/main/examples)** — Runnable samples (async, inbox, testing, recovery) alongside the main tree.
diff --git a/docs/grammar.md b/docs/grammar.md
index 36c95ff8..9e06cb7d 100644
--- a/docs/grammar.md
+++ b/docs/grammar.md
@@ -1,1111 +1,451 @@
 ---
 title: Grammar
-permalink: /grammar
+permalink: /reference/grammar
+diataxis: reference
 redirect_from:
+  - /grammar
   - /grammar.md
 ---
 
-# Jaiph Grammar
+# Grammar
 
-Jaiph source files (`.jh`) combine a small orchestration language with shell execution. **Workflows** and **rules** express Jaiph steps — sequencing, failure handling (`catch`), value branching (`match` / `if`), prompts, channels. **Scripts** contain Bash (or another interpreter via shebang) and run as isolated subprocesses. The runtime interprets the AST directly; only script bodies are emitted as executable files. This page is the **lexical and grammatical** reference (tables, edge cases, EBNF). For a narrative tour of the same primitives, see [Language](language.md). For system boundaries and event contracts, see [Architecture](architecture.md).
+This page is the authoritative syntactic reference for Jaiph: lexical rules, statement shapes, EBNF, and the validator's error catalog. For step semantics see [Language](language.md). For the system around the grammar see [Architecture](architecture.md).
 
-**Scope:** Lexical rules, syntax, and runtime semantics for normal modules (`.jh`). Test files (`*.test.jh`) are described in [Testing](testing.md). CLI and configuration are covered in [CLI](cli.md) and [Configuration](configuration.md).
+**Scope.** Normal modules (`.jh`) and test modules (`*.test.jh`). For `jaiph run` / `jaiph test`, the compile path is `loadModuleGraph` → `buildScriptsFromGraph(graph, outDir)` (per-module `validateModule` + script emit via `emitScriptsForModuleFromGraph`). `jaiph compile` walks the same import closure through `collectDiagnostics(graph)` and emits no scripts. `parsejaiph(source, filePath)` is I/O-pure. `buildRuntimeGraph` consumes an already-loaded graph and never re-runs validation or re-reads `.jh` sources.
 
-**Source of truth:** When this document and the compiler disagree, treat the implementation as authoritative.
+## Lexical rules
 
-**Compile vs. graph load:** Reference and channel rules are checked during **transpile-time validation** (`validateReferences` on each reachable module) when the CLI runs **`buildScripts`** / **`emitScriptsForModule`** (before any script files are written). The same validation alone runs for **`jaiph compile`** — no `scripts/` emission and no runtime graph build ([Architecture](architecture.md)). The runtime’s **`buildRuntimeGraph`** path **parses** the import closure only; it does not re-run **`validateReferences`**, though execution still resolves symbols from the loaded graph and enforces runtime invariants.
-
-## Overview
-
-This guide answers three questions for workflow authors:
-
-1. **What can appear in a `.jh` file?** — Top-level imports, config, channels, module `const` bindings, scripts, rules, and workflows; execution constructs (`run`, `ensure`, `prompt`, control flow, channels) live in workflow and rule bodies with different restrictions.
-2. **Where is it enforced?** — The parser (`src/parser.ts`, `src/parse/*`) builds the AST; **`validateReferences`** (`src/transpile/validate.ts`) rejects invalid references, arity, and disallowed constructs before **`emitScriptsForModule`** extracts **`script`** bodies to `scripts/`. The **Node workflow runtime** interprets everything else from the AST ([Architecture](architecture.md)).
-3. **How do scripts relate to Jaiph?** — Only **`script`** definitions and inline **`run \`…\`()` / `run ```…```()`** bodies become executable files under `scripts/`; they run as child processes while workflows and rules stay in the interpreter.
-
-The sections below go from **values and declarations** through **steps**, **scripts**, **interpolation**, then **formal notes** (lexical, EBNF, validation catalog).
-
-## Types
-
-Jaiph has two primitive value types — **string** and **script** — that are structurally distinct and non-interchangeable.
-
-**String** is the general-purpose value type. Strings can be interpolated (`${name}`), passed as arguments, assigned to `const` bindings, and sent to an agent via `prompt`. All `const` declarations, `env` declarations, captures, and named parameters produce string values.
-
-```jaiph
-const greeting = "Say hello to ${name}."
-prompt greeting       # valid — strings are promptable
-prompt "Say hello."   # valid — inline string literal
-# run greeting()     — E_VALIDATE: strings are not executable
-```
-
-**Script** is an executable unit. Scripts are invoked with `run` and execute as isolated subprocesses. They cannot be interpolated, assigned to variables, or used as prompt bodies — they are definitions, not values.
-
-```jaiph
-script save = `printf '%s' "$1" > "$2"`
-run save(content, path)   # valid — scripts are executable
-# prompt save             — E_VALIDATE: scripts are not promptable
-# const x = save          — E_VALIDATE: scripts are not values
-# log "${save}"           — E_VALIDATE: scripts cannot be interpolated
-```
-
-The compiler enforces these boundaries at every call site. Using a script where a string is expected (or vice versa) produces an `E_VALIDATE` error with a clear, actionable message.
-
-## Language Concepts
-
-Jaiph enforces a strict boundary between **managed** steps (interpreted by the runtime) and **shell task code**. Prefer top-level `script` definitions (or inline `run` scripts) for multi-line bash. **Workflow** bodies may also contain free-form **inline shell** lines; **rule** bodies must not — unstructured shell there is rejected at validation.
-
-- **Workflows** — Named sequences of steps. **Managed** Jaiph steps include `ensure`, `run`, `prompt`, `const`, `fail`, `return`, `log`/`logerr`, inbox `send` (`channel <- …`), `match`, `if`, `for … in … { … }` (line iteration over a string variable), `run async`, `ensure … catch`, `run … catch`, and `run … recover`. A line that does **not** parse as one of those becomes an **inline shell** step (bash text stored as a `shell` AST node). The compiler still validates shell lines (for example a bare name that refers to a local script or workflow must be written as `run name()`, not as a shell line). For non-trivial bash, prefer a top-level `script` and `run name()`.
-
-- **Rules** — Named blocks of the same **managed** step forms as workflows, with restrictions: `ensure` (other rules), `run` (scripts only — not workflows), `const`, `match`, `if`, `for … in … { … }`, `fail`, `log`/`logerr`, `return`, `ensure … catch`, `run … catch`, and `run … recover`. Rules cannot use `prompt`, `const … = prompt`, inbox `send`, or `run async`. **Raw shell lines are not allowed** in rules: if a line parses as unstructured shell, validation fails with `E_VALIDATE` (`inline shell steps are forbidden in rules; use explicit script blocks`).
-
-- **Scripts** — Top-level `script` definitions emitted as separate executable files under the workspace `scripts/` directory. Called from workflows or rules with `run`. Bodies are opaque to the compiler — the parser does not check Jaiph keywords inside them. Use `echo`/`printf` for data output and `return N`/`return $?` for exit status. In **single-line backtick** script bodies, Jaiph `${…}` interpolation is **forbidden** (use `$1`, `$2`, … from the orchestration layer). In **fenced** (`\`\`\`…\`\`\``) script bodies, `${…}` is passed through to the shell. Polyglot support: a fence lang tag (`` ```<tag> ``) maps to `#!/usr/bin/env <tag>` — any tag is valid (no hardcoded allowlist). Alternatively, a manual `#!` shebang as the first line of the body selects the interpreter; if both a fence tag and a `#!` first line are present, it is an error. Without either, `#!/usr/bin/env bash` is used. For trivial one-off commands, **inline scripts** (`` run `body`(args) `` or `` run ```lang...body...```(args) ``) let you embed a script body directly in a step without a named definition — see [`run` — Inline Scripts](#inline-scripts).
-
-- **Channels** — Named message queues declared at top level with `channel name`. Optionally declare inline routes with `channel name -> workflow` or `channel name -> wf1, wf2`. Workflows send messages with `<-`. See [Inbox & Dispatch](inbox.md).
-
-- **Config** — Optional `config { … }` block. At **module** level, keys may include `agent.*`, `run.*`, `runtime.*`, and `module.*` (see `src/parse/metadata.ts`). A **workflow** may contain at most one nested `config { … }`, it must appear before steps, and only `agent.*` and `run.*` are allowed there (`runtime.*` / `module.*` yield `E_PARSE`). See [Configuration](configuration.md).
-
-## Imports and Exports
-
-`import "path" as alias` loads another module. `export rule` / `export workflow` / `export script` marks a declaration as public.
-
-**Export visibility.** If a module contains at least one `export` declaration, only exported names are reachable through the import alias — referencing a non-exported symbol produces `E_VALIDATE`: `"<name>" is not exported from module "<alias>"`. Modules with zero `export` declarations retain legacy behavior: all top-level definitions are implicitly public.
-
-```jaiph
-import "tools/security.jh" as security
-import "bootstrap.jh" as bootstrap
-
-export script build_docs = `mkdocs build`
-
-export workflow default() {
-  ensure security.scan_passes()
-  run bootstrap.nodejs()
-}
-```
-
-Imported symbols use **dot notation**: `alias.name`. A reference is either a bare `IDENT` (local) or `IDENT.IDENT` (module-qualified). The compiler validates that the target exists and matches the calling keyword (`ensure` for rules, `run` for workflows/scripts).
-
-### Script Imports
-
-`import script "<path>" as <name>` imports an external script file and binds it to a local script symbol. The imported script behaves like a locally declared `script` definition: call it with `run name(args)`, capture stdout with `const x = run name(args)`, and treat it as a `script` value (not assignable to `const` by name alone).
-
-```jaiph
-import script "./queue.py" as queue
-
-workflow default() {
-  const result = run queue("get")
-  log result
-}
-```
-
-The target file is treated as complete script source (not as a Jaiph module). Shebangs in the imported file are preserved — the runtime uses them to select the interpreter, just like fence lang tags on inline scripts. The file must exist; missing targets fail at compile time with `E_IMPORT_NOT_FOUND`.
-
-Script import aliases share the unified per-module namespace with channels, rules, workflows, scripts, and top-level `const` — duplicates are `E_PARSE`.
-
-**Path resolution.** The path is always resolved relative to the importing `.jh` file's directory, not the process working directory. The path must be double-quoted (single quotes are rejected).
-
-### Import Resolution
-
-Module import paths (`import "path" as alias`) resolve in two stages:
-
-1. **Relative to the importing file** (existing behavior). The `.jh` extension is appended if omitted.
-2. **Library fallback.** If relative resolution finds no file and the path contains a `/`, it is split as `<lib-name>/<path-inside-lib>` and resolved to `<workspace-root>/.jaiph/libs/<lib-name>/<path-inside-lib>.jh`. Libraries are installed with `jaiph install` (see [CLI — `jaiph install`](cli.md#jaiph-install)).
-
-```jaiph
-import "queue-lib/queue" as queue       # resolves to .jaiph/libs/queue-lib/queue.jh
-import "tools/security.jh" as security  # resolves relative (unchanged)
-```
-
-Script import paths (`import script "<path>" as name`) resolve relative to the importing file only — there is no library fallback. The path refers to a raw script file (e.g. `.py`, `.sh`), not a `.jh` module.
-
-Missing imports fail at compile time with `E_IMPORT_NOT_FOUND`.
-
-## Module-Level Declarations
-
-### Top-Level `const`
-
-`const name = value` declares a module-scoped variable. Values can be double-quoted strings (single-line only), triple-quoted strings (multiline), or bare tokens like numbers. A double-quoted string that spans multiple lines is rejected — use `"""..."""` instead.
-
-```jaiph
-const REPO = "my-project"
-const MAX_RETRIES = 3
-const GREETING = """
-Hello,
-world
-"""
-```
-
-Variables are accessible as `${name}` inside that module's rules and workflows. They are **not** passed to script subprocesses — use arguments or shared libraries instead. Declaration order matters: `${name}` in a value only expands variables already bound above. Names share the unified namespace with channels, rules, workflows, and scripts. All bindings are immutable — see [Immutable Bindings](#immutable-bindings).
-
-Top-level `local` is rejected — use `const`.
-
-### Channel Declarations
-
-```jaiph
-channel alerts
-channel reports
-channel findings -> analyst
-channel events -> handler_a, handler_b
-```
-
-One channel per line. Channels are used with `send` (`<-`) inside workflows. Routes (`->`) are declared inline on the channel declaration — when a message arrives on the channel, the runtime calls each target workflow. See [Inbox & Dispatch](inbox.md).
-
-## Definitions
-
-Rules and workflows use braces on the declaration line and **must include parentheses** — even when parameterless (e.g. `rule check()`, `workflow default()`). The parser rejects definitions without `()` before `{` with a fix hint. **Call sites** also require parentheses for every `run` and `ensure` (including zero-argument calls: `run setup()`). Scripts use `=` with a backtick body (single-line) or fenced block (multi-line). Rules and workflows may declare **named parameters** inside the parentheses.
-
-```jaiph
-rule check_status() { … }              # no params — () required
-workflow default() { … }               # no params — () required
-rule gate(path) { … }                 # one named param
-workflow implement(task, role) { … }  # two named params
-script setup = `echo ok`               # correct (single-line backtick)
-```
-
-Multiline script bodies use triple-backtick fences (shown in HTML so nested fences render correctly):
-
-<pre><code>script setup = ```
-echo ok
-```
-</code></pre>
-
-## Call Arguments and Named Parameters
-
-### Named Parameters on Definitions
-
-All workflow and rule definitions require parentheses. Named parameters go inside the parentheses; empty `()` is used when there are no parameters:
-
-```jaiph
-workflow implement(task, role) {
-  log "Implementing ${task} as ${role}"
-}
-
-rule gate(path) {
-  run check_exists(path)
-}
-```
-
-Parameter names follow identifier rules (`[A-Za-z_][A-Za-z0-9_]*`), must not be reserved keywords, and must be unique within the parameter list. Empty parentheses `()` are required on **definitions** even when there are no parameters — omitting them is a parse error. At **call sites**, parentheses are **always** required as well, including for zero-argument calls (`run setup()`, not `run setup`).
-
-At runtime, named parameters are the only way to access arguments: if `workflow implement(task, role)` is called with `run implement("build docs", "writer")`, then `${task}` = `"build docs"` and `${role}` = `"writer"`.
-
-### Call-Site Arguments
-
-Parentheses are **required** for all call sites — `run setup()`, `ensure gate()`, etc. Bare identifiers without parentheses (e.g. `run setup`) are `E_PARSE`. When arguments are present, they are comma-separated expressions inside the parentheses:
-
-```jaiph
-run setup()                            # zero args
-run implement("my-task", "my-role")    # with args
-ensure gate(path)                      # with args
-```
-
-**Bare identifier arguments:** In-scope variable names must be passed as bare identifiers without quoting. A bare identifier `name` is equivalent to `"${name}"` — the variable's value is passed as the argument:
-
-```jaiph
-const task = run get_next_task()
-run docs.update_from_task(task)          # correct: bare identifier
-run queue.remove(task, "completed")      # mixed bare + quoted literal
-ensure check_branch(branch_name)         # works with ensure too
-```
-
-This rule applies to all call sites: `run`, `ensure`, `return run`/`return ensure`, `send … <- run`, and `const x = run …`. Quoted strings with additional text around the interpolation (e.g. `"prefix_${name}"`) are allowed since they cannot be expressed as bare identifiers.
-
-Bare identifiers must reference a known variable (`const`, capture, or named parameter). Unknown names produce an `E_VALIDATE` error at compile time. Jaiph keywords (`run`, `ensure`, `const`, etc.) cannot be used as bare identifier arguments.
-
-### Nested Managed Calls in Arguments
-
-Call arguments can contain **explicit nested managed calls** using `run` or `ensure`. The nested call executes first and its result is passed as a single argument to the outer call. This is a deliberate language rule: managed execution must always be explicit — scripts and workflows execute only via `run`, rules only via `ensure`, even inside argument lists.
-
-**Valid explicit forms:**
-
-```jaiph
-run mkdir_p_simple(run jaiph_tmp_dir())      # nested run
-run do_work(ensure check_ok())               # nested ensure
-run do_work(run `echo aaa`())                # nested inline script
-```
-
-**Invalid bare call-like forms** — rejected at compile time with actionable errors:
-
-```jaiph
-# run do_work(bar())           — E_VALIDATE: nested managed calls must be explicit
-# run do_work(rule_bar())      — E_VALIDATE: nested managed calls must be explicit
-# run do_work(`echo aaa`())    — E_VALIDATE: nested inline scripts must be explicit
-```
-
-The **capture-then-pass** form is always valid:
-
-```jaiph
-const x = run bar()
-run foo(x)
-```
-
-### Arity Checking
-
-When the callee declares named parameters, the compiler validates that the number of arguments at the call site matches the number of declared parameters. A mismatch produces an `E_VALIDATE` error:
-
-```jaiph
-workflow greet(name) { log "Hello ${name}" }
-
-workflow default() {
-  run greet("Alice")              # OK: 1 arg, 1 param
-  # run greet("Alice", "Bob")    — E_VALIDATE: expects 1 argument(s) (name), but got 2
-  # run greet()                  — E_VALIDATE: expects 1 argument(s) (name), but got 0
-}
-```
-
-Arity checking applies to all `run` and `ensure` call sites (steps, captures, `return run`/`return ensure`, and `send` RHS), including zero-argument calls written as `run ref()` (empty argument list). When the callee has no declared parameters (legacy style), no arity check is performed — any number of arguments is accepted.
-
-Arguments are available as `${paramName}` in orchestration strings (rules and workflows) and `$1`, `$2`, … in script bodies.
-
-## Workflow Steps
-
-### `run` — Execute a Workflow or Script
+| Element | Rule |
+|---|---|
+| Identifier | `[A-Za-z_][A-Za-z0-9_]*`. |
+| Reference | `IDENT` (local) or `IDENT.IDENT` (module-qualified). |
+| Comment | Full-line `#` comment. Trailing `#` on a step line is not a comment. |
+| Blank line | Preserved between steps inside workflow and rule bodies (as `blank_line` trivia). `jaiph format` collapses multiple consecutive body blanks to one and trims trailing blanks before `}`. Top-level blank lines are not preserved — the formatter emits one blank line between emitted sections. |
+| Shebang | A `#!` first line of the file is ignored by the parser. |
+| Single-line string | Double-quoted `"…"`. Single-quoted strings are `E_PARSE`. Use `\"`, `\\`, `\n`, `\t`. |
+| Multiline string | Triple-quoted `"""…"""`. The opening `"""` must end the line; the closing `"""` must be on its own line. |
+| Script body (single-line) | Backtick `` `…` ``. Jaiph `${identifier}` / `${identifier.field}` interpolation is `E_PARSE`; bash parameter expansion (for example `${var:-default}`) passes through. |
+| Script body (fenced) | Triple-backtick `` ``` ``…`` ``` ``. Optional lang tag `` ```<tag> ``. `${…}` passes through to the shell. |
+| Required parentheses | All `run` / `ensure` call sites require parentheses, including zero-argument calls. Bare `run setup` is `E_PARSE`. |
+
+## File structure
 
-In a **workflow**, `run` targets a workflow or script. In a **rule**, `run` targets a script only.
+```ebnf
+file = { top_level } ;
 
-```jaiph
-run setup_env()
-run lib.build_project(task)
-const result = run helper(arg)
-const output = run transform()
+top_level = config_block
+          | import_stmt
+          | import_script_stmt
+          | channel_decl
+          | env_decl
+          | rule_decl
+          | script_decl
+          | workflow_decl ;
 ```
 
-Assignment-style capture without `const` (e.g. `result = run …`) is a parse error — use `const result = run …` only.
-
-Shell redirection or pipelines after `run` (`>`, `|`, `&`) are rejected — use a script for shell I/O.
-
-**Capture:** For a workflow callee, capture gets the explicit `return "…"` value. For a script callee, capture gets stdout.
+`env_decl` is written `const` in source; the parser stores it under `envDecls` / module constants. Test modules may also contain `test` blocks — see [Write & run tests](/how-to/testing).
 
-#### Inline Scripts
+### Top-level ordering
 
-Inline scripts embed a shell command directly in a workflow or rule step without declaring a named `script` definition. Use single backticks for one-liners or triple backticks for multiline bodies. Arguments go in parentheses after the closing backtick(s).
-
-```jaiph
-workflow default() {
-  run `echo hello`()
-  const x = run `echo captured`()
-  const y = run `date +%s`()
-  log "got: ${x}, time: ${y}"
-}
-```
+| Construct | Formatter behaviour |
+|---|---|
+| `import`, `config`, `channel` | Hoisted to the top, in that order, preserving relative source order within each group. Comments immediately before a hoisted construct move with it. |
+| `const`, `rule`, `script`, `workflow`, `test` | Keep their original relative source order. Comments before non-hoisted definitions stay in place. |
 
-Optional arguments are passed as comma-separated expressions inside the parentheses after the closing backtick and are available as `$1`, `$2`, … inside the script:
+### Top-level `const`
 
-```jaiph
-run `echo $1-$2`("hello", "world")   # prints: hello-world
+```ebnf
+env_decl  = "const" IDENT "=" env_value ;
+env_value = double_quoted_string | triple_quoted_block | bare_value ;
 ```
 
-**Fenced block form:** For multiline inline scripts or polyglot one-liners, use triple-backtick fences. An optional lang tag selects the interpreter — same rules as named scripts (`` ```<tag> `` → `#!/usr/bin/env <tag>`). Arguments go in parentheses after the closing fence:
+Values: double-quoted string (single-line; multi-line double-quoted is `E_PARSE`), triple-quoted multiline, or a bare token (e.g. `const N = 42` stores the string `"42"`). Top-level `local` is `E_PARSE` — use `const`. Top-level `const` shares the unified per-module namespace with channels, rules, workflows, and scripts.
 
-```text
-run ```
-echo "line one"
-echo "line two"
-```()
-```
+## Imports and exports
 
-```text
-run ```python3
-import sys
-print(f"args: {sys.argv[1:]}")
-```()
+```ebnf
+import_stmt        = "import" string "as" IDENT ;
+import_script_stmt = "import" "script" string "as" IDENT ;
 ```
 
-Both body forms work with capture:
-
-<pre><code>workflow default() {
-  const x = run `echo captured`()
-  const y = run ```
-date +%s
-```()
-  log "got: ${x} at ${y}"
-}
-</code></pre>
-
-**Deterministic naming:** Inline script bodies are emitted as executable files under `scripts/` with names of the form `__inline_<hash>` where `<hash>` is the first **12** hex digits of the SHA-256 digest of `shebang + "\n" + body` when a shebang is present, or of the body alone when it is not (`src/inline-script-name.ts`). The same body and shebang always produce the same artifact name across runs.
-
-**Isolation:** Inline scripts use the same subprocess mechanism as named scripts: the child inherits the **workflow runner’s environment** (`process.env` passed into `NodeWorkflowRuntime`), including host variables and Jaiph-related keys set by the CLI and layered config — not a freshly emptied environment. **Orchestration bindings** (`const`, parameters, captures) are **not** exported into that environment automatically; pass values as **`$1`, `$2`, …** or rely on variables already exported by the host.
-
-**Restrictions:**
-- `run async` with inline scripts is not supported — inline scripts cannot be used with `run async`.
-- **Backtick** (single-line) inline scripts: Jaiph interpolation (`${...}`) is forbidden — use `$1`, `$2` positional arguments instead.
-- **Fenced block** (triple-backtick) inline scripts: `${...}` is passed through to the shell as standard shell parameter expansion.
-
-### `run async` — Concurrent Execution with Handles
+| Aspect | Rule |
+|---|---|
+| Module import path | Quoted string. `.jh` extension auto-appended when omitted. Relative resolution against the importing file's directory. |
+| Library fallback | When relative resolution finds no file and the path contains `/`, the path is split as `<lib-name>/<sub-path>` and resolved to `<workspace>/.jaiph/libs/<lib-name>/<sub-path>.jh`. |
+| Script import path | Quoted string. Relative-only (no library fallback). The path refers to a raw script file (no `.jh` appended). |
+| Missing target | `E_IMPORT_NOT_FOUND` at compile time. |
+| Alias collision | Aliases share the unified namespace with channels, rules, workflows, scripts, and top-level `const`. Duplicates are `E_VALIDATE`. |
+| `export` | Marks a top-level `rule` / `workflow` / `script` as public. If at least one `export` exists, only exported names are reachable through the alias (`E_VALIDATE: "<name>" is not exported from module "<alias>"`). Modules with zero `export` declarations have implicit-public semantics. |
 
-`run async ref(args)` starts a workflow or script concurrently and returns a **`Handle<T>`** immediately. `T` is the same return type the function would have under a synchronous `run`. The handle resolves to the eventual return value on first non-passthrough read.
+## Channels
 
-```jaiph
-workflow default() {
-  run async lib.task_a()
-  const h = run async lib.task_b()
-  # Reading h forces resolution — blocks until task_b completes
-  log "${h}"
-  # task_a is implicitly joined before workflow returns
-}
+```ebnf
+channel_decl = "channel" IDENT [ "->" REF { "," REF } ] ;
 ```
 
-**Resolution semantics:** A handle resolves on first non-passthrough read. Reads that force resolution: string interpolation (`"${h}"`), passing as argument to `run`, comparison/conditional (`if h == "ok"`), match subject, channel send. Passthrough (initial capture, re-assignment) does not force resolution. Once resolved, the handle is replaced by the resolved string value; subsequent reads return the cached value.
+One channel per line. A `->` route declaration inside a workflow body is `E_PARSE`. Routes are stored on `ChannelDef`. Route targets must be workflows declaring exactly **three** named parameters (message, channel, sender). Multiple routes drain sequentially.
 
-**Implicit join:** When a workflow scope exits, all remaining unresolved handles created in that scope are implicitly joined. This is not an error.
+## Config blocks
 
-**`recover` and `catch` composition:** Both `recover` (retry loop) and `catch` (single-shot) work with `run async`:
-
-```jaiph
-run async foo() recover(err) {
-  log "repairing: ${err}"
-  run fix_it()
-}
-
-run async bar() catch(e) {
-  log "caught: ${e}"
-}
+```ebnf
+config_block = "config" "{" { config_line } "}" ;
+config_line  = config_key "=" config_value ;
+config_value = string | "true" | "false" | integer ;
 ```
 
-`recover` uses the same retry-limit semantics as non-async `recover` (default 10, configurable via `run.recover_limit`).
-
-In the progress tree, each async branch is prefixed with a subscript number (₁₂₃…) assigned in dispatch order. Nested `run async` inside a child workflow gets its own numbering scope at the child's indent level. See [CLI — Async branch numbering](cli.md#run-progress-and-tree-output) for display details.
-
-See [Spec: Async Handles](spec-async-handles.md) for the full value model.
-
-Constraints:
-- Workflow-only — rejected in rules with `E_VALIDATE`.
-- Inline scripts not supported with `run async`.
-- For concurrent bash (pipelines, `&`), put the bash in a script and call with `run`.
-
-### `ensure` — Execute a Rule
-
-`ensure` runs a rule and succeeds if its exit code is 0.
-
-```jaiph
-ensure check_deps()
-const result = ensure lib.validate(input)
-```
+Allowed keys: `agent.default_model`, `agent.command`, `agent.backend`, `agent.trusted_workspace`, `agent.cursor_flags`, `agent.claude_flags`, `run.logs_dir`, `run.debug`, `run.recover_limit`, `runtime.docker_image`, `runtime.docker_network`, `runtime.docker_timeout_seconds`, `module.name`, `module.version`, `module.description`. See [Configuration](configuration.md). Workflow-level `config` permits only `agent.*` and `run.*` (`runtime.*` / `module.*` are `E_PARSE`).
 
-Use `ensure ref()` with parentheses even when there are no arguments.
+The opening line is `config` followed by `{` with optional whitespace between them. Duplicate blocks are `E_PARSE` (`duplicate config block …`). Unknown keys are `E_PARSE` listing the allowed keys. Wrong value types are `E_PARSE`.
 
-### `ensure … catch` — Failure Recovery
+## Types
 
-When `ensure` includes a `catch` clause, a failure in the rule triggers the recovery body **once**. There is no retry loop — the rule runs, and if it fails, the recovery body executes a single time.
+Jaiph has two structurally distinct primitive types:
 
-`catch` requires **explicit bindings** in parentheses — bare `catch` without bindings is `E_PARSE`:
+| Type | Operations |
+|---|---|
+| `string` | Interpolate (`${…}`), pass as argument, assign to `const`, send to `prompt`. |
+| `script` | Invoke with `run`. Not interpolatable, not assignable to `const` by name, not a valid `prompt` body. |
 
-```jaiph
-# Single-statement recovery — one binding
-ensure install_deps() catch (failure) run fix_deps()
+Crossings (`run` on a string, `prompt` on a script, `const x = scriptName`, `${scriptName}`) are `E_VALIDATE` with the specific message.
 
-# Block recovery — one binding
-ensure ci_passes(repo) catch (failure) {
-  log "CI failed, attempting fix"
-  run auto_fix()
-}
+## Definitions
 
+```ebnf
+rule_decl     = [ "export" ] "rule" IDENT "(" [ param_list ] ")" "{" { rule_body_step } "}" ;
+script_decl   = "script" IDENT "=" script_rhs ;
+workflow_decl = [ "export" ] "workflow" IDENT "(" [ param_list ] ")" "{" [ workflow_config ] { workflow_step } "}" ;
+param_list    = IDENT { "," IDENT } ;
 ```
 
-**Bindings:**
-- The binding (e.g. `failure`) receives the merged stdout+stderr from the failed rule execution, including output from nested scripts and rules.
-- Binding names must be valid identifiers. Exactly one binding is required.
-
-Syntax rules:
-- `catch` must be followed by `(<name>)` — bare `catch` or `catch {` without bindings is `E_PARSE`.
-- All rule arguments must appear inside the call parentheses **before** `catch`.
-- `catch` must be followed by at least one recovery step after the bindings.
-
-### `run … catch` — Failure Recovery for Scripts and Workflows
-
-`run` also supports a `catch` clause with the same semantics as `ensure … catch`. When the target script or workflow fails, the recovery body runs **once**.
-
-```jaiph
-# Single-statement recovery
-run deploy() catch (err) run rollback()
+| Aspect | Rule |
+|---|---|
+| Definition parens | Required even when parameterless (e.g. `rule check()`, `workflow default()`). Omitting them is `E_PARSE` with a fix hint. |
+| Parameter names | Identifier syntax, no duplicates, no reserved keywords. |
+| Workflow body | May begin with an optional nested `config { … }` (must precede the first step). |
 
-# Block recovery
-run deploy(env) catch (err) {
-  log "Deploy failed, rolling back"
-  run rollback(env)
-}
+Script RHS:
 
+```ebnf
+script_rhs           = backtick_script_body | fenced_script_block ;
+backtick_script_body = "`" script_text "`" ;
+fenced_script_block  = "```" [ LANG_TAG ] newline { script_line newline } "```" ;
+LANG_TAG             = IDENT ;
 ```
 
-**Bindings** follow the same rules as `ensure … catch`:
-- The binding receives the merged stdout+stderr from the failed execution.
-- Exactly one binding is required.
+The lang tag maps directly to `#!/usr/bin/env <tag>`. Combining a lang tag with a leading `#!` shebang in the body is an error. With neither, the emitter writes `#!/usr/bin/env bash`.
 
-Syntax rules:
-- `catch` must be followed by `(<name>)` — bare `catch` or `catch {` without bindings is `E_PARSE`.
-- All call arguments must appear inside the parentheses **before** `catch`.
-- `catch` must be followed by at least one recovery step after the bindings.
-
-### `run … recover` — Repair-and-Retry Loop
-
-`recover` adds loop semantics to a `run` step. Unlike `catch` (which runs the recovery body once and stops), `recover` retries the target after each repair attempt until it succeeds or the retry limit is exhausted.
-
-```jaiph
-# Single-statement recover
-run deploy() recover(err) run fix_deploy()
+| Fence tag | Resulting shebang |
+|---|---|
+| `` ```bash `` | `#!/usr/bin/env bash` |
+| `` ```node `` | `#!/usr/bin/env node` |
+| `` ```python3 `` | `#!/usr/bin/env python3` |
+| `` ```ruby `` | `#!/usr/bin/env ruby` |
+| `` ```perl `` | `#!/usr/bin/env perl` |
+| `` ```pwsh `` | `#!/usr/bin/env pwsh` |
+| `` ```deno `` | `#!/usr/bin/env deno` |
+| `` ```lua `` | `#!/usr/bin/env lua` |
 
-# Block recover
-run deploy(env) recover(err) {
-  log "Deploy failed: ${err}"
-  run auto_repair(env)
-}
-```
+Any identifier tag is accepted; there is no hardcoded allowlist.
 
-**Loop behavior:**
+## Call sites
 
-1. Execute the `run` target.
-2. If it succeeds, continue (the `recover` body never runs).
-3. If it fails, bind merged stdout+stderr to the binding (e.g. `err`), execute the repair body, then go to step 1.
-4. If the retry limit is reached and the target still fails, the step fails with the last error.
+```ebnf
+call_ref      = REF "(" [ call_args ] ")" ;
+call_args     = call_arg { "," call_arg } ;
+call_arg      = double_quoted_string
+              | IDENT                            (* bare identifier: in-scope variable *)
+              | "${" IDENT "}"
+              | "run" ( call_ref | inline_script )   (* explicit nested managed call *)
+              | "ensure" call_ref ;
+inline_script = backtick_script_body "(" [ call_args ] ")"
+              | fenced_script_block "(" [ call_args ] ")" ;
+```
+
+| Position | Rule |
+|---|---|
+| Bare identifier argument | Must reference an in-scope binding (`const`, capture, parameter). `name` and `"${name}"` are both accepted when the variable is in scope. Unknown names are `E_VALIDATE`. Jaiph keywords are rejected. |
+| Nested managed calls | The `run` / `ensure` keyword is required. `run foo(bar())` / `run foo(rule_bar())` / `run foo(\`echo aaa\`())` are `E_VALIDATE`. Valid: `run foo(run bar())`, `run foo(ensure rule_bar())`, `run foo(run \`echo aaa\`())`. Capture-then-pass is always valid. |
+| Arity | Workflows and rules: argument count must match the declared parameter list (`E_VALIDATE`), including `()` callees (zero arguments required). Scripts accept any argument count (no parameter list to check). |
+| Shell redirection / pipes | Trailing `>`, `>>`, `|`, or `&` after a `run` / `ensure` call is `E_PARSE`. The same operators inside unquoted portions of call arguments are `E_VALIDATE`. Use a `script` for shell I/O. |
 
-**Retry limit:** Default is **10**. Override per-module with `run.recover_limit`:
+## Workflow body statements
 
-```jaiph
-config {
-  run.recover_limit = 3
-}
+```ebnf
+workflow_step = ensure_stmt | run_stmt | run_catch_stmt | run_recover_stmt | run_async_stmt
+              | prompt_stmt | const_decl_step | return_stmt
+              | fail_stmt | log_stmt | logerr_stmt | send_stmt
+              | match_stmt | if_stmt | for_lines_stmt | comment_line ;
 ```
 
-**Bindings** follow the same rules as `catch`:
-- Exactly one binding is required. The binding receives merged stdout+stderr from the failed execution.
-
-Syntax rules:
-- `recover` must be followed by `(<name>)` — bare `recover` or `recover {` without bindings is `E_PARSE`.
-- All call arguments must appear inside the parentheses **before** `recover`.
-- `recover` must be followed by at least one recovery step after the bindings.
-- `recover` and `catch` are mutually exclusive on the same `run` step.
-- `recover` is not supported on `ensure` steps. `recover` works with `run async` — see [`run async`](#run-async--concurrent-execution-with-handles).
-
-### `prompt` — Agent Interaction
-
-Sends text to the configured agent backend. The prompt body can be supplied in three forms: a single-line string literal, a bare identifier referencing an existing binding, or a triple-quoted multiline block.
+Any line that does not match a managed form becomes a **shell** step in workflows. Rules forbid raw shell — the validator's `RULE_SCOPE` rejects unrecognised shell lines with `inline shell steps are forbidden in rules; use explicit script blocks`.
 
-**1. Single-line string literal**
+### `run`
 
-A double-quoted string on one line. `${...}` interpolation works inside the quotes.
-
-```jaiph
-prompt "Review the following code for security issues"
-const answer = prompt "Summarize the report"
+```ebnf
+run_stmt         = "run" ( call_ref | inline_script ) ;
+run_catch_stmt   = "run" ( call_ref | inline_script ) "catch" catch_bindings catch_body ;
+run_recover_stmt = "run" ( call_ref | inline_script ) "recover" recover_bindings recover_body ;
+run_async_stmt   = "run" "async" call_ref [ recover_suffix | catch_suffix ] ;
 ```
 
-If a `"` string has no closing quote on the same line, the parser rejects it — multiline prompt text must use a triple-quoted block (`prompt """..."""`).
+| Position | Allowed targets |
+|---|---|
+| `run` in workflow | Workflow or script. |
+| `run` in rule | Script only. Workflows are `E_VALIDATE`. |
+| `run async` | Workflows only. Inline scripts not supported. |
+| Inline script in `run` | Both workflows and rules. |
 
-**2. Identifier reference**
+Capture: a workflow callee yields the explicit `return` value; a script callee yields trimmed stdout.
 
-A bare identifier after `prompt` uses the string value of an existing binding (e.g. a `const`). The parser greedily takes the first token after `prompt` as the body — `returns` is only recognized as a keyword when it appears **after** a complete body form.
+### `ensure`
 
-```jaiph
-const text = "Analyze this code for security issues"
-prompt text
-const result = prompt text returns "{ type: string, risk: string }"
+```ebnf
+ensure_stmt = "ensure" call_ref [ "catch" catch_bindings catch_body ] ;
 ```
 
-**3. Triple-quoted block (multiline)**
+Targets a rule. Succeeds when the rule's exit code is `0`. `recover` is not supported on `ensure`.
 
-For multiline prompt text, use triple-quote delimiters (`"""`). The opening `"""` must be on the same line as `prompt`. The body supports `${...}` interpolation. Triple backticks (`` ``` ``) are reserved for scripts and rejected in prompt context with a guidance message.
+### `catch` / `recover`
 
-```jaiph
-prompt """
-You are a helpful assistant.
-Analyze the following: ${input}
-"""
+```ebnf
+catch_bindings   = "(" IDENT ")" ;
+catch_body       = workflow_step | "{" { workflow_step } "}" ;
+recover_bindings = "(" IDENT ")" ;
+recover_body     = workflow_step | "{" { workflow_step } "}" ;
 ```
 
-Capture uses **`const` only** — `name = prompt …` is rejected by the parser (use `const name = prompt …`).
-
-```jaiph
-const answer = prompt "Summarize the report"
-const x = prompt myVar
-const y = prompt """
-Analyze this input in detail.
-"""
-```
+| Rule | Behaviour |
+|---|---|
+| Exactly one binding | Required. Bare `catch` / `recover` is `E_PARSE`. |
+| Argument placement | All call arguments appear inside `()` before `catch` / `recover`. |
+| Body content | Parsed by the same `parseBlockStatement` that handles top-level statements; rule scope still rejects shell. |
+| Mutual exclusion | `catch` and `recover` are mutually exclusive on the same `run` step. |
+| Inline-script attachment | `catch` / `recover` only attach to a standalone `run` step. Inline scripts in `log` / `logerr` / `return` / `const` RHS do not accept them. |
 
-**Typed prompt (returns schema):** Ask the agent for structured JSON output. `returns "…"` may follow a single-line string or identifier body on the same line, or appear on the **line after** the closing `"""` of a triple-quoted block.
+### `prompt`
 
-```jaiph
-const result = prompt "Analyze this code" returns "{ type: string, risk: string }"
-const typed = prompt text returns "{ type: string, risk: string }"
+```ebnf
+prompt_stmt    = "prompt" prompt_body [ returns_schema ] ;
+prompt_body    = double_quoted_string | IDENT | triple_quoted_block ;
+returns_schema = "returns" double_quoted_string ;
 ```
 
-For a **triple-quoted** prompt, either put `returns "…"` on the line **immediately after** the closing `"""`, or on the **same line** as the closing delimiter: `""" returns "{ … }"` (nothing else may follow the schema string on that line).
-
-When `returns` is present, **capture is required** — write `const name = prompt … returns "…"`. Uncaptured `prompt … returns` fails at compile time with `E_PARSE` (`validatePromptStepReturns` in `src/transpile/validate-prompt-schema.ts`).
-
-The schema is flat only — allowed types are `string`, `number`, `boolean` (`E_SCHEMA` if invalid). The runtime validates the response: it searches for valid JSON (last non-empty line, fenced code blocks, standalone `{…}`, embedded JSON). On success, the capture variable holds the raw JSON string and each field is accessible via **dot notation** — `${result.type}`, `${result.risk}`. On failure, the step fails with a parse, missing-field, or type error. Bindings in workflows and rules are **strings** end-to-end (including capture, `return`, and `${…}` interpolation). For typed prompts, schema types only constrain the **parsed JSON** from the agent: after validation, each field is coerced with string conversion for storage. For example, `returns "{ n: number }"` with `{"n":42}` stores `42` as the **text** `"42"` in `${x.n}`, not a numeric type. The same applies to `boolean`. Bare `return x.field` in a workflow is sugar for `return "${x.field}"`.
-
-**Dot notation validation:** The compiler validates `${var.field}` references at compile time. If `var` is not a typed prompt capture, the compiler reports an error. If `field` is not defined in the `returns` schema, the error lists available fields.
-
-Prompts are not allowed in rules.
-
-### `const` — Variable Binding
+| Aspect | Rule |
+|---|---|
+| Body forms | Single-line string, in-scope identifier, or triple-quoted block. Triple-backtick fences in prompt context are `E_PARSE`. |
+| Multiline form | Opening `"""` must end the line; closing `"""` must be on its own line. |
+| `returns` placement | After a single-line or identifier body on the same line, or on the line after the closing `"""`, or on the same line as the closing `"""` (nothing else may follow). |
+| `returns` schema | Flat `{ field: type, … }` with types `string`, `number`, `boolean`. Invalid schemas are `E_SCHEMA`. |
+| Capture requirement | `prompt … returns` without `const` capture is `E_PARSE`. |
+| Allowed in | Workflows only. Rules reject `prompt` and `const … = prompt`. |
 
-`const name = <rhs>` introduces an **immutable** variable in the workflow or rule body. The name must not collide with a parameter, an earlier `const`, a capture, or a `script` name in the same scope — see [Immutable Bindings](#immutable-bindings).
+### `const`
 
-```jaiph
-const tag = "v1.0"
-const message = """
-  Hello ${name},
-  Welcome to the project.
-"""
-const result = run helper(arg)
-const check = ensure validator(input)
-const answer = prompt "Summarize the report"
-const reply = prompt myVar
-const analysis = prompt """
-Analyze this input in detail.
-"""
+```ebnf
+const_decl_step = "const" IDENT "=" const_rhs ;
+const_rhs       = double_quoted_string | triple_quoted_block | bash_value_expr
+                | "run" ( call_ref | inline_script ) | "run" "async" call_ref
+                | "ensure" call_ref
+                | "prompt" prompt_body [ returns_schema ]
+                | "match" IDENT "{" { match_arm } "}" ;
 ```
 
-RHS forms: value expressions (`${var}`, quoted strings, triple-quoted `"""..."""` multiline blocks), or explicit `run`/`ensure`/`prompt` capture. Prompt capture supports all three body forms: string literal, identifier, and triple-quoted block. A bare reference like `const x = ref(args)` is rejected — use `const x = run ref(args)`.
-
-Restrictions on const RHS: `$(…)`, `${var:-fallback}`, `${var%%…}`, `${var//…}`, and `${#var}` are all rejected.
+| Position | Rule |
+|---|---|
+| Bare RHS | `const x = ref(args)` is `E_PARSE`. Use `const x = run ref(args)`, `const x = ensure ref(args)`, or `const x = prompt …`. |
+| Assignment without `const` | `name = run …` / `name = prompt …` are `E_PARSE`. |
+| Forbidden expansions on RHS | `$(…)`, `${var:-fallback}`, `${var%%…}`, `${var//…}`, `${#var}` are `E_PARSE`. |
 
-### `send` — Channel Messages
-{: #send--channel-messages}
+### `return`
 
-```jaiph
-alerts <- "Build started"
-reports <- ${output}
-results <- run build_message(data)
-results <- run get_summary()
-alerts <- """
-  Build report for ${project}:
-  Status: ${status}
-"""
+```ebnf
+return_stmt  = "return" return_value ;
+return_value = double_quoted_string | triple_quoted_block | "$" IDENT | "${" IDENT "}"
+             | IDENT
+             | "run" ( call_ref | inline_script )
+             | "ensure" call_ref
+             | "match" IDENT "{" { match_arm } "}" ;
 ```
 
-RHS must be a double-quoted literal, a triple-quoted `"""..."""` multiline block, `$name` or `${…}`, or `run ref(args)` with **parentheses** (same rule as other call sites). An explicit payload is always required — bare `channel <-` without a value is `E_PARSE`. A bare `ref`-shaped word on the RHS (without `run` and `()`) is rejected at **validation** for real workflow, rule, or script names — you must use `run ref(args)` or a string. If `run` is present but the reference has no parentheses, the line does not parse as a `run` send RHS; write `channel <- run target()` instead.
-
-### Channel Routing
-{: #channel-routing}
+`return run helper` (no `()`) becomes a shell `return` step — required to write `return run helper()` / `return ensure check()` for the managed form. Bare identifiers desugar to `return "${ident}"`. Inline-script form requires the `run` keyword (`return run \`echo $1\`("arg")`). Numeric exit codes (`return 0`, `return $?`) are rejected in workflow/rule bodies; use them only in opaque `script` definition bodies.
 
-Routes are declared at the top level on `channel` declarations, not inside workflow bodies:
+### `send`
 
-```jaiph
-channel alerts -> handle_alert
-channel events -> handler_a, handler_b
+```ebnf
+send_stmt = IDENT "<-" send_rhs ;
+send_rhs  = double_quoted_string | triple_quoted_block | "$" IDENT | "${" … "}"
+          | "run" call_ref
+          | shell_fragment ;
 ```
 
-When a routed message is **drained**, the runtime calls each target workflow, binding the three dispatch values (message, channel, sender) to whatever parameter names the target declares. Route targets must declare exactly 3 parameters. Multiple targets dispatch sequentially. Routes are stored on `ChannelDef`, not on workflow definitions or steps. See [Inbox & Dispatch](inbox.md).
-
-**Enqueue vs. dispatch:** `send` appends to an in-memory queue during workflow execution. After that workflow’s steps finish successfully, the runtime **drains** the queue and runs route targets. Sends from **nested** workflows bubble to the **nearest ancestor** workflow context that has routes for that channel (so dispatch stays aligned with the orchestrator workflow — see `NodeWorkflowRuntime`).
-
-A `->` route declaration inside a workflow body is a **parse error** with guidance to move it to the top-level `channel` declaration.
+| Rule | Behaviour |
+|---|---|
+| RHS required | Bare `channel <-` is `E_PARSE`. |
+| Shell fragment RHS | A raw shell expression (for example `findings <- echo "$payload"`) parses as a managed shell payload; allowed only on `send` (`E_VALIDATE` elsewhere). |
+| Bare ref RHS | A bare `ref`-shaped word that names a workflow / rule / script is `E_VALIDATE`. Use `run ref()` or a string. |
+| `run` without `()` | Does not parse as a managed send RHS. |
+| Capture-and-send | `const name = channel <- …` is `E_PARSE`. |
+| Allowed in | Workflows only. Rules forbid `send`. |
 
-### `log` and `logerr`
+### `log` / `logerr`
 
-```jaiph
-log "Processing ${message}"
-logerr "Warning: ${name} not found"
-log status                              # bare identifier — same as log "${status}"
-logerr err_msg                          # bare identifier form works with logerr too
-log """
-  Build started at ${timestamp}
-  Target: ${env}
-"""
+```ebnf
+log_stmt    = "log" ( double_quoted_string | triple_quoted_block | IDENT | "run" inline_script ) ;
+logerr_stmt = "logerr" ( double_quoted_string | triple_quoted_block | IDENT | "run" inline_script ) ;
 ```
 
-`log` writes to stdout; `logerr` writes to stderr (shown with a red `!` marker in the progress tree). Both accept single-line `"..."` strings, triple-quoted `"""..."""` multiline blocks, bare identifiers, or **managed inline-script calls** (`log run \`…\`(args)`). `${identifier}` interpolation works in string forms. At runtime, backslash escapes in the final string are interpreted (`\n` → newline).
-
-**Bare identifier form:** When `log` or `logerr` is followed by a single bare identifier (no quotes), it expands to `"${identifier}"` — the variable's value is logged. The identifier must reference a known binding (`const`, capture, or named parameter).
-
-**Managed inline-script form:** `log run \`script\`(args)` and `logerr run \`script\`(args)` execute the inline script and log its stdout. The `run` keyword is required — bare inline scripts (`log \`…\`()`, `logerr \`…\`()`) are rejected at compile time with a clear error.
+Bare identifier form expands to `"${ident}"`. `log run \`…\`(args)` and `logerr run \`…\`(args)` execute the inline script and log its stdout — the `run` keyword is required (bare inline scripts in `log` / `logerr` are `E_PARSE`).
 
 ### `fail`
 
-```jaiph
-fail "Missing required configuration"
-fail """
-  Multiple issues found:
-  - ${issue1}
-  - ${issue2}
-"""
-```
-
-Aborts the workflow or rule with a message on stderr and non-zero exit. Accepts a single-line `"..."` string or a triple-quoted `"""..."""` multiline block.
-
-### `if` — conditional block
-
-Runs a nested block when a string variable compares equal (or not equal) to a literal, or matches (or does not match) a regex.
-
-```jaiph
-if status == "ok" {
-  log "healthy"
-}
-
-if message =~ /ERROR/ {
-  logerr "matched error pattern"
-}
-```
-
-- **Subject:** bare identifier naming an in-scope variable (`const`, capture, or parameter). If the value is an async **handle**, it is resolved before the test (same resolution rules as other reads).
-- **Operators:** `==` and `!=` take a **double-quoted string** operand; `=~` and `!~` take a **`/regex/`** operand. Mixing operator and operand kinds is a parse error.
-
-Allowed in workflows and rules. Nested steps inside the block follow the same constraints as the surrounding workflow or rule body.
-
-### `for … in …` — iterate lines of a string
-
-```jaiph
-const paths = """
-docs/a.md
-docs/b.md
-"""
-
-for path in paths {
-  log "${path}"
-}
-```
-
-**Syntax:** `for <iterVar> in <sourceVar> { … }` — both names are bare identifiers. `<sourceVar>` must already hold a string; the runtime splits it on newlines (normalizes `\r\n` to `\n`). If the string ends with a final newline, the **trailing empty segment is dropped** — so `"a\nb\n"` yields two iterations (`a`, `b`), not a third empty line (see `linesOfDelimitedString` in `src/runtime/string-lines.ts`).
-
-Inside the body, `<iterVar>` is bound to each line for every iteration. Iterator names participate in the same immutable-binding rules as `const` in that scope.
-
-Allowed in workflows and rules.
-
-### `return`
-
-```jaiph
-return "success"
-return "${result}"
-return response                        # bare identifier — sugar for return "${response}"
-return """
-  Report for ${name}:
-  Status: ${status}
-"""
-return run helper()
-return ensure check(input)
-return run `cat report.txt`()          # inline script — runs and returns stdout
-return run `echo $1`("arg")            # inline script with arguments
+```ebnf
+fail_stmt = "fail" ( double_quoted_string | triple_quoted_block ) ;
 ```
 
-Sets the managed return value in rules and workflows. The value can be a single-line `"..."` string, a triple-quoted `"""..."""` multiline block, a bare identifier, a variable reference, or a **direct managed call** using `return run ref(args)`, `return ensure ref(args)`, or `return run \`script\`(args)`.
-
-**Managed calls need parentheses:** `return run helper` (no `()`) is **not** parsed as a managed return — it becomes a **shell** `return` step. Use `return run helper()` and `return ensure check()` so the parser recognizes the managed form.
+Aborts the workflow or rule with a stderr message and non-zero exit.
 
-**Bare identifier:** `return response` is sugar for `return "${response}"` — the identifier is resolved against the same scope rules used for `${ident}` interpolation (must be a `const`, capture, or parameter). An unknown identifier produces `E_VALIDATE` naming the missing binding, not a shell-step error. Both `return response` and `return "${response}"` remain valid and are equivalent.
+### `if`
 
-A direct managed call executes the target and uses its result as the return value — equivalent to capturing into a variable and returning it, but without the boilerplate:
-
-```jaiph
-# Before: capture then return
-const result = run helper()
-return "${result}"
-
-# After: direct return
-return run helper()
+```ebnf
+if_stmt     = "if" subject_ref if_op if_operand "{" { workflow_step } "}" [ else_clause ] ;
+else_clause = "else" "{" { workflow_step } "}" ;
+subject_ref = IDENT | IDENT "." IDENT ;
+if_op       = "==" | "!=" | "=~" | "!~" ;
+if_operand  = double_quoted_string | "/" regex_source "/" ;
 ```
 
-In workflows, `return run` targets a workflow or script; `return ensure` targets a rule. In rules, `return run` targets a script only; `return ensure` targets another rule. The same validation rules that apply to standalone `run`/`ensure` steps apply here — unknown refs, type mismatches, and shell redirection are all rejected at compile time.
-
-**Inline-script form:** `return run \`script\`(args)` executes the inline script and uses its stdout as the return value. The `run` keyword is required — bare inline scripts (`return \`…\`()`) are rejected at compile time with a clear error.
-
-A bare integer (`return 0`) or `return $?` is a bash exit code, not a Jaiph value return. `return "…"` is not allowed in script bodies — use `echo`/`printf`.
+| Rule | Behaviour |
+|---|---|
+| Subject | Bare identifier or `IDENT.IDENT` (typed-prompt field access). Async handles resolve before the test. |
+| Operator/operand pairing | `==` / `!=` require a double-quoted string. `=~` / `!~` require a `/regex/`. Mixing is `E_PARSE`. |
+| `else` placement | `} else {` must be on a single line. `else if` chaining is not supported — nest `if` inside the `else` block or use `match`. |
+| Value production | `if` is a statement and does not produce a value. Use `match` for value branching. |
+| Allowed in | Workflows and rules. |
 
 ### `match`
 
-```jaiph
-match status {
-  "ok" => "all good"
-  /err/ => "something went wrong"
-  _ => "unknown"
-}
-```
-
-Pattern match on a string value. The subject is always a **bare identifier** (variable name without `$` or `${}`). Arms are tested top-to-bottom; the first match wins. Patterns can be:
-
-- **String literal** (`"ok"`) — exact equality against the subject
-- **Regex** (`/err/`) — tested against the subject
-- **Wildcard** (`_`) — matches anything
-
-Exactly one `_` wildcard arm is required. Arms are **newline-delimited** — commas between or after arms are rejected at parse time with the diagnostic `"commas are not allowed in match arms; use one arm per line"`.
-
-Using `$var` or `${var}` as the match subject is a parse error — use the bare name: `match varName { ... }`.
-
-**Arm bodies** — the expression after `=>` produces the match result. Allowed forms:
-
-- String literal: `"value"` or multiline `"""…"""`
-- Bare in-scope identifier: `name` (must be a `const`, capture, or named parameter)
-- Variable reference / interpolation: `$var`, `${var}`
-- `fail "message"` — aborts the workflow/rule
-- `run ref(args)` / `ensure ref(args)` — managed call whose result becomes the match value
-
-**Disallowed** — rejected at parse/validate time:
-
-- Commas between or after arms (`"x" => "y",` or `"a" => "x", _ => "y"`) — arms are newline-delimited; use one arm per line
-- `return` inside an arm body (`"x" => return "y"`) — the match expression itself produces the value; use `return match x { … }` at the outer level instead
-- Inline script forms (backtick `` `…`() ``) — use a named script with `run script_name(…)`
-- Bare unknown identifiers (`_ => true`, `_ => blorp`) — a bare word that is not an in-scope variable (`const`, capture, or parameter) is rejected with `E_VALIDATE`: `unknown identifier "…" in match arm body`
-
-**Multiline arm bodies** use triple-quoted strings:
-
-```jaiph
-match mode {
-  "verbose" => """
-Detailed output enabled.
-All logs will be shown.
-  """
-  _ => "standard"
-}
-```
-
-**Expression form:** `match` works as an expression with `const` and `return`:
-
-```jaiph
-const label = match status {
-  "ok" => "success"
-  _ => "failure"
-}
-
-return match status {
-  "ok" => "pass"
-  _ => "fail"
-}
-```
-
-The outer `return` applies to the whole match expression — it is not the same as `return` inside an arm body (which is forbidden).
-
-### Variable Binding
-
-All captures require `const`:
-
-```jaiph
-const result = run helper(arg)
-const check = ensure validator(input)
-const answer = prompt "Summarize the report"
-const reply = prompt myVar
-```
-
-### Immutable Bindings
-
-All Jaiph bindings are immutable. Once a name is bound — whether by a parameter declaration, a `const` statement, a capture, or a `script` definition — it cannot be rebound in the same visible scope. The compiler enforces this during validation and rejects violations with `E_VALIDATE`.
-
-**Rejected patterns:**
-
-| Pattern | Error |
+```ebnf
+match_stmt    = "match" subject_ref "{" { match_arm } "}" ;
+match_arm     = match_pattern "=>" arm_body NEWLINE ;
+match_pattern = double_quoted_string | "/" regex_source "/" | "_" ;
+arm_body      = double_quoted_string | triple_quoted_block
+              | IDENT
+              | "$" IDENT | "${" IDENT "}"
+              | "fail" double_quoted_string
+              | "run" call_ref
+              | "ensure" call_ref ;
+```
+
+| Rule | Behaviour |
 |---|---|
-| `workflow w(x) { const x = … }` | parameter `x` cannot be rebound by `const` |
-| `const x = "a"` then `const x = "b"` | duplicate `const` in same scope |
-| `script foo = \`…\`` with param/const `foo` in scope | `script` name collides with immutable binding |
-
-The diagnostic names the conflicting binding and where it was first bound:
-
-```
-E_VALIDATE: cannot rebind immutable name "x"; already bound as parameter at file.jh:1
-```
-
-**Migration:** Code that previously shadowed a parameter with a `const` of the same name (e.g. `workflow w(input) { const input = ensure validate(input) }`) must rename either the parameter or the `const`:
-
-```jaiph
-workflow w(raw_input) {
-  const input = ensure validate(raw_input)
-}
-```
+| Subject | Bare identifier or `IDENT.IDENT`. Subject starting with `$` / `${}` is `E_PARSE`. |
+| Default arm | Exactly one `_` wildcard arm is required. |
+| Arm delimiter | Newlines. Commas between or after arms are `E_PARSE` (`commas are not allowed in match arms; use one arm per line`). |
+| Disallowed in arms | `return` (use `return match … { … }` at the outer level), inline scripts (use a named script with `run`), bare unknown identifiers (`E_VALIDATE: unknown identifier "…" in match arm body`). |
+| Expression form | Usable as `const x = match …` or `return match …`. |
 
-## Scripts
+### `for`
 
-### Bash Scripts (single-line)
-
-```jaiph
-script setup_env = `export BASE_DIR=$(pwd) && mkdir -p "$BASE_DIR/output" && echo "Environment initialized"`
-```
-
-### Bash Scripts (fenced block)
-
-<pre><code>script setup_env = ```
-export BASE_DIR=$(pwd)
-mkdir -p "$BASE_DIR/output"
-echo "Environment initialized"
-```
-</code></pre>
-
-Script bodies are opaque bash — the compiler does not parse them as Jaiph steps. For bash scripts, the emitter applies only lightweight transforms: `return` normalization, `local`/`export`/`readonly` spacing, and import alias resolution.
-
-**Interpolation rules differ by body form:**
-
-- **Backtick** (single-line): Jaiph interpolation (`${...}`) is forbidden — the compiler rejects `${name}` with `E_PARSE` to prevent ambiguity between Jaiph variables and shell parameter expansion. Use `$1`, `$2` positional arguments to pass data from orchestration to scripts.
-- **Fenced block** (triple-backtick): `${...}` is passed through to the shell verbatim. Shell parameter expansion (`${VAR}`, `${VAR:-default}`, `${#VAR}`, etc.) works as expected. The triple-backtick delimiter signals "this is opaque shell", so there is no ambiguity with Jaiph interpolation.
-
-### Polyglot Scripts
-
-#### Fence lang tags (recommended)
-
-Use a fence lang tag (`` ```<tag> ``) to select an interpreter without writing a shebang line. The tag maps directly to a shebang: `` ```<tag> `` becomes `#!/usr/bin/env <tag>`. Any tag is valid — there is no hardcoded allowlist.
-
-<pre><code>script analyze = ```python3
-import sys
-print(f"Analyzing {sys.argv[1]}")
-```
-</code></pre>
-
-<pre><code>script transform = ```node
-const data = process.argv[2];
-console.log(JSON.stringify({ result: data }));
+```ebnf
+for_lines_stmt = "for" IDENT "in" IDENT "{" { workflow_step } "}" ;
 ```
-</code></pre>
 
-Examples of tag-to-shebang mapping:
-
-| Fence tag | Shebang |
+| Rule | Behaviour |
 |---|---|
-| `` ```node `` | `#!/usr/bin/env node` |
-| `` ```python3 `` | `#!/usr/bin/env python3` |
-| `` ```ruby `` | `#!/usr/bin/env ruby` |
-| `` ```perl `` | `#!/usr/bin/env perl` |
-| `` ```pwsh `` | `#!/usr/bin/env pwsh` |
-| `` ```deno `` | `#!/usr/bin/env deno` |
-| `` ```bash `` | `#!/usr/bin/env bash` |
-| `` ```lua `` | `#!/usr/bin/env lua` |
+| Source variable | Must already hold a string (`const`, capture, parameter). Unknown names are `E_VALIDATE`. |
+| Line splitting | Splits on `\n` (normalises `\r\n` → `\n`). If the string ends with a final newline, the trailing empty segment is dropped. Interior empty lines are still yielded. |
+| Iterator name | Subject to the same immutable-binding rules as `const` in the surrounding scope. |
+| Allowed in | Workflows and rules. |
 
-Combining a fence lang tag with a manual `#!` shebang in the body is an error — choose one or the other.
+## Inline scripts
 
-#### Manual shebang (escape hatch)
-
-If no fence tag is present, the user may provide a manual `#!` shebang as the first line of the body:
-
-<pre><code>script run_lua = ```
-#!/usr/bin/env lua
-print("hello from lua")
+```ebnf
+inline_script = backtick_script_body "(" [ call_args ] ")"
+              | fenced_script_block "(" [ call_args ] ")" ;
 ```
-</code></pre>
-
-Non-bash scripts skip Jaiph keyword validation and emit the body verbatim.
-
-### Script Isolation
 
-Managed **script** steps (`run` to a named script, inline script, or `import script`) are spawned with the **same environment object** the workflow runner uses for that scope (`scope.env`): effectively the runner’s `process.env` as augmented by Jaiph (`JAIPH_WORKSPACE`, `JAIPH_SCRIPTS`, run/agent metadata from config, run-directory variables set during execution, etc.). This is **not** an `env -i`-style wipe — inherited host variables remain available unless overwritten.
-
-Module-scoped **`const`** values live only in the interpreter’s variable map — they are **not** automatically exported into script environments. Pass data as **`$1`, `$2`, …**, read Jaiph-provided env vars, or export from the host before starting `jaiph run`.
+| Aspect | Rule |
+|---|---|
+| Allowed positions | `run_stmt` / `run_catch_stmt` / `run_recover_stmt` / `log_stmt` / `logerr_stmt` / `return_stmt`, and `const` RHS. |
+| `run async` | Not supported with inline scripts. |
+| Backtick interpolation | Jaiph `${identifier}` / `${identifier.field}` forms are `E_PARSE`. Bash parameter expansion passes through. Use `$1`, `$2`, … for positional arguments. |
+| Fenced interpolation | All `${…}` passes through to the shell (standard parameter expansion). |
+| `catch` / `recover` suffix | Allowed only on standalone `run` steps with inline-script body. Forbidden in `log` / `logerr` / `return` / `const` RHS positions. |
+| Emitted name | `scripts/__inline_<hash>` where `<hash>` is the first 12 hex digits of `sha256(shebang + "\n" + body)` (or `sha256(body)` if no shebang). Deterministic across runs. |
 
-## String Interpolation {#string-interpolation}
+## String interpolation
 
-Jaiph orchestration strings support `${identifier}` interpolation. Every identifier — whether in a bare argument (`run greet(name)`) or in braced form (`log "hello ${name}"`) — must reference a binding that is in scope: `const`, capture, or named parameter. Unknown names are rejected at compile time with an `E_VALIDATE` error in both forms; `${name}` is **not** a workaround for an undeclared bare identifier.
+`${IDENT}` is the only interpolation form accepted in Jaiph orchestration strings. Every identifier must reference a `const`, capture, or named parameter.
 
 | Form | Status | Where |
 |---|---|---|
-| `${varName}` | Primary | All Jaiph strings |
-| `${var.field}` | Dot notation — typed prompt field access | All Jaiph strings |
-| `${paramName}` | Named parameter access | All Jaiph strings |
-| `${run ref(args)}` | Inline capture — executes call, inlines output | All Jaiph strings |
-| `${ensure ref(args)}` | Inline capture — executes rule, inlines result | All Jaiph strings |
-| `$varName` | Rejected — use `${varName}` | — |
-| `$1`, `$2` | Positional shell args — only in `script` bodies | `script` bodies only |
-| `${var:-fallback}` | Rejected (`E_PARSE`) in orchestration strings and backtick scripts; passes through in fenced script blocks | — |
-| `$(…)` | Rejected (`E_PARSE`) in orchestration strings | — |
-
-**Dot notation** (`${var.field}`) accesses a single field from a typed prompt capture. The variable must be bound to a `prompt … returns` step, and the field must exist in the schema. Both constraints are checked at compile time. See [prompt — Typed prompt](#prompt--agent-interaction) for details.
-
-**Inline captures** execute a managed call directly inside the string:
-
-```jaiph
-log "Got: ${run some_script()}"
-log "Status: ${ensure check_ok()}"
-prompt "Fix the issue: ${ensure get_diagnostics()}"
-return "${run some_script()}"
-```
-
-If any inline capture fails, the enclosing step fails immediately. Nested inline captures (`${run foo(${run bar()})}`) are rejected — extract the inner call to a `const`.
-
-## Step Output Contract
-
-Every step produces three distinct outputs — status, value, and logs:
-
-| Step kind | Status source | Value channel (for `x = …`) | Log channel |
-| --- | --- | --- | --- |
-| `ensure rule` | rule exit code | explicit `return` value | rule body logs to artifacts |
-| `run workflow` | workflow exit code | explicit `return` value | workflow step logs to artifacts |
-| `run script` (named) | script exit code | **stdout** of script body | script stdout/stderr to artifacts |
-| `` run `…`() `` (inline) | script exit code | **stdout** of script body | script stdout/stderr to artifacts |
-| `prompt` | prompt exit code | final assistant answer | transcript to artifacts |
-| `log` / `logerr` | always 0 | empty | event + stdout/stderr |
+| `${varName}` | Primary | All orchestration strings. |
+| `${var.field}` | Typed-prompt field access | All orchestration strings. The base must be a `const x = prompt … returns "{ field: type, … }"` capture and the field must appear in the schema. |
+| `${run ref(args)}` | Inline capture — executes the call, inlines stdout / return value. | All orchestration strings. |
+| `${ensure ref(args)}` | Inline capture — executes the rule, inlines result. | All orchestration strings. |
+| `$varName` (no braces) | `E_PARSE` in orchestration strings. | — |
+| `$1`, `$2` | Positional args | `script` bodies only. |
+| `${var:-fallback}` / `${var%%…}` / `${var//…}` / `${#var}` | `E_PARSE` in orchestration strings; passes through in script bodies (backtick and fenced). | — |
+| `$(…)` | `E_PARSE` in orchestration strings. | — |
+
+If an inline capture fails, the enclosing step fails. Nested inline captures (`${run foo(${run bar()})}`) are rejected — extract the inner call to a `const`.
+
+## Step output contract
+
+Every step produces three distinct outputs — status, capture value, and logs.
+
+| Step | Status | Capture value | Logs |
+|---|---|---|---|
+| `ensure rule` | rule exit code | explicit `return` value | rule artifacts |
+| `run workflow` | workflow exit code | explicit `return` value | workflow artifacts |
+| `run script` (named) | script exit code | trimmed stdout | script `.out` / `.err` |
+| `` run `…`() `` (inline) | script exit code | trimmed stdout | script `.out` / `.err` |
+| `prompt` | prompt exit code | final assistant answer | transcript artifacts |
+| `log` / `logerr` | always 0 | empty | live event stream + stdout/stderr |
 | `fail` | non-zero (abort) | empty | message to stderr |
-| `run async` | aggregated | `Handle<T>` — resolves to return value on read | async step logs to artifacts |
+| `run async` | aggregated | `Handle<T>` — resolves to return value on read | async step artifacts |
 | `const` | same as RHS step | empty (binds local) | n/a |
 
-Key rules:
-- For `ensure`/`run` to a rule or workflow, assignment captures only the callee's explicit `return "…"` (or `return run …` / `return ensure …`).
-- For `run` to a script, assignment captures **stdout**. Use `echo`/`printf` to pass data back.
-- `return "value"` / `return "${var}"` / `return run ref()` / `return ensure ref()` are valid in rules and workflows only, not in scripts.
-
-## Lexical Notes
-
-- **Identifiers:** `[A-Za-z_][A-Za-z0-9_]*`
-- **References:** `IDENT` or `IDENT.IDENT` (module-qualified)
-- **Comments:** Full-line `#` comments.
-- **Blank lines:** Empty lines between steps inside workflow and rule bodies are preserved in the AST as visual grouping markers. A single blank line between steps survives `jaiph format` unchanged; consecutive blank lines are collapsed to one; trailing blank lines before `}` are removed. Outside block bodies (between top-level declarations), blank lines are normalized by the formatter.
-- **Shebang:** A `#!` first line of the file is ignored by the parser.
-- **Import path:** Quoted string in `import "path" as alias`. Missing `.jh` extension is appended automatically. Script imports use `import script "path" as name` — the path refers to a raw script file (no `.jh` extension appended).
-- **String quoting:** Jaiph has a four-delimiter system. `"..."` is the single-line string form (double quotes only — single-quoted strings are parse errors). `"""..."""` is the multiline string form; the opening `"""` must end the line, and the closing `"""` must be on its own line. A double-quoted string that spans multiple lines is rejected with a guidance error pointing to triple quotes. Use `\"` for literal double quotes and `\\` for literal backslashes. `${...}` interpolation works in both forms. Script bodies use single backtick (`` `...` ``) for single-line or triple backtick (`` ```...``` ``) for multi-line — normal shell quoting is allowed inside script bodies. Triple backticks in prompt/string context are rejected.
-- **Required call-site parentheses:** All call sites require parentheses — `run ref()`, not `run ref`. Bare identifiers without parentheses are `E_PARSE`.
-- **Top-level ordering:** The parser accepts top-level definitions in any order. `jaiph format` hoists `import`, `config`, and `channel` declarations to the top (in that order), but preserves the source-file order of all other definitions (`const`, `rule`, `script`, `workflow`, `test`). Comments before a hoisted construct move with it; comments before non-hoisted definitions stay in place. See [CLI — `jaiph format`](cli.md#jaiph-format).
-
-## EBNF (Practical Form)
+## Validation catalog
 
-Informal symbols: `string` = quoted string; `call_ref` = `REF "(" [args] ")"` — parentheses are always required (each argument may be a quoted string, `${var}`, or a **bare identifier** — see [Call Arguments](#call-arguments-and-named-parameters)); `double_quoted_string` = single-line double-quoted string supporting `\$`, `\"`, `\\`, `` \` `` escapes and `${identifier}` / `${run …}` / `${ensure …}` interpolation; `triple_quoted_block` = multiline string delimited by `"""` on opening and closing lines, supporting the same interpolation; `prompt_body` = single-line double-quoted string | bare `IDENT` (reference to an existing binding) | triple-quoted block (`""" … """`).
+Validator entry points (`src/transpile/validate.ts` for the outer layer; `src/transpile/validate-step.ts` for the per-step visitor). The `jaiph compile` command surfaces all of these via `collectDiagnostics`.
 
-```ebnf
-file            = { top_level } ;
-
-top_level       = config_block | import_stmt | import_script_stmt | channel_decl | env_decl | rule_decl | script_decl | workflow_decl ;
- (* env_decl is written `const` in source; parsed into `envDecls` / module constants in `src/parser.ts`.
-    Test modules (`*.test.jh`) may also contain `test` blocks — see `parseTestBlock` / [Testing](testing.md). *)
-
-config_block    = "config" "{" { config_line } "}" ;
-config_line     = config_key "=" config_value ;
-config_key      = "agent.default_model" | "agent.command" | "agent.backend" | "agent.trusted_workspace"
-                | "agent.cursor_flags" | "agent.claude_flags" | "run.logs_dir" | "run.debug"
-                | "run.recover_limit" | "runtime.docker_image" | "runtime.docker_network"
-                | "runtime.docker_timeout_seconds"
-                | "module.name" | "module.version" | "module.description" ;
-config_value    = string | "true" | "false" | integer | string_array ;
-integer         = digit { digit } ;
-string_array    = "[" { array_element } "]" ;
-array_element   = string [ "," ] ;
-
-import_stmt     = "import" string "as" IDENT ;
-import_script_stmt = "import" "script" string "as" IDENT ;
-
-channel_decl    = "channel" IDENT [ "->" REF { "," REF } ] ;
-
-env_decl        = "const" IDENT "=" env_value ;
-env_value       = double_quoted_string | triple_quoted_block | bare_value ;
-
-rule_decl       = [ "export" ] "rule" IDENT [ "(" param_list ")" ] "{" { rule_body_step } "}" ;
-rule_body_step  = comment_line | workflow_step ;
-  (* Parsed with the same statement dispatcher as workflows, but validation rejects
-     shell, prompt, send, const … = prompt, run async, and run targets that are not scripts. *)
-
-script_decl     = "script" IDENT "=" script_rhs ;
-script_rhs      = backtick_script_body | fenced_script_block ;
-backtick_script_body = "`" script_text "`" ;  (* single-line; no newlines; no ${...} interpolation *)
-fenced_script_block = "```" [ LANG_TAG ] newline { script_line newline } "```" ;  (* ${...} passed through to shell *)
-LANG_TAG        = IDENT ;  (* any identifier — maps to #!/usr/bin/env <tag>; rejected when body starts with #! *)
-shebang_line    = "#!" rest_of_line ;  (* rejected when LANG_TAG is present *)
-script_line     = comment_line | command_line ;
-
-workflow_decl   = [ "export" ] "workflow" IDENT [ "(" param_list ")" ] "{" [ workflow_config ] { workflow_step } "}" ;
-param_list      = IDENT { "," IDENT } ;  (* identifiers; no duplicates; no reserved keywords *)
-workflow_config = config_block ;
-  (* optional per-workflow override; must appear before steps;
-     only agent.* and run.* keys allowed; runtime.* and module.* yield E_PARSE *)
-
-workflow_step   = ensure_stmt | run_stmt | run_catch_stmt | run_recover_stmt | run_async_stmt | prompt_stmt
-                | const_decl_step | return_stmt
-                | fail_stmt | log_stmt | logerr_stmt | send_stmt
-                | match_stmt | if_stmt | for_lines_stmt | comment_line ;
-  (* Route declarations (-> workflow) belong at top level in channel_decl, not inside workflow bodies
-     (-> inside a body is E_PARSE). Any line that does not match the managed forms above becomes a
-     shell step in workflows (rules forbid shell — validated separately). *)
-for_lines_stmt  = "for" IDENT "in" IDENT "{" { workflow_step } "}" ;
-
-const_decl_step = "const" IDENT "=" const_rhs ;
-const_rhs       = double_quoted_string | triple_quoted_block | bash_value_expr
-                | "run" ( call_ref | inline_script ) | "run" "async" call_ref
-                | "ensure" call_ref
-                | "prompt" prompt_body [ returns_schema ]
-                | "match" IDENT "{" { match_arm } "}" ;
-
-fail_stmt       = "fail" ( double_quoted_string | triple_quoted_block ) ;
-run_async_stmt  = "run" "async" call_ref [ recover_suffix | catch_suffix ] ;
-recover_suffix  = "recover" recover_bindings recover_body ;
-catch_suffix    = "catch" catch_bindings catch_body ;
-  (* recover and catch are mutually exclusive on a given run async — parser/runtime treat only one as active *)
-return_stmt     = "return" return_value ;
-return_value    = double_quoted_string | triple_quoted_block | "$" IDENT | "${" IDENT "}"
-                | IDENT
-                | "run" ( call_ref | inline_script ) | "ensure" call_ref
-                | "match" IDENT "{" { match_arm } "}" ;
-
-match_stmt      = "match" IDENT "{" { match_arm } "}" ;
-match_expr      = "match" IDENT "{" { match_arm } "}" ;
-
-if_stmt         = "if" IDENT if_op if_operand "{" { workflow_step } "}" ;
-if_op           = "==" | "!=" | "=~" | "!~" ;
-if_operand      = double_quoted_string | "/" regex_source "/" ;
-match_arm       = match_pattern "=>" arm_body NEWLINE ;
-match_pattern   = double_quoted_string | "/" regex_source "/" | "_" ;
-arm_body        = double_quoted_string | triple_quoted_block
-                | IDENT
-                | "$" IDENT | "${" IDENT "}"
-                | "fail" double_quoted_string
-                | "run" call_ref | "ensure" call_ref ;
-
-send_stmt       = IDENT "<-" send_rhs ;
-send_rhs        = double_quoted_string | triple_quoted_block | "$" IDENT | "${" … "}" | "run" call_ref ;
-  (* ${…} is the braced var form (parser supports nesting); a bare ref-shaped token is parsed
-     as bare_ref but validate rejects it for local/imported workflow, rule, or script — use
-     a string, $name / ${…}, or "run" call_ref *)
-
-log_stmt        = "log" ( double_quoted_string | triple_quoted_block | IDENT | "run" inline_script ) ;
-logerr_stmt     = "logerr" ( double_quoted_string | triple_quoted_block | IDENT | "run" inline_script ) ;
-
-ensure_stmt     = "ensure" call_ref [ "catch" catch_bindings catch_body ] ;
-run_catch_stmt  = "run" call_ref "catch" catch_bindings catch_body ;
-run_recover_stmt = "run" call_ref "recover" recover_bindings recover_body ;
-run_stmt        = "run" ( call_ref | inline_script ) ;
-call_ref        = REF "(" [ call_args ] ")" ;  (* parentheses always required *)
-call_arg        = double_quoted_string | IDENT | "${" IDENT "}"
-                | "run" ( call_ref | inline_script )       (* explicit nested managed call *)
-                | "ensure" call_ref ;                      (* explicit nested ensure *)
-call_args       = call_arg { "," call_arg } ;
-inline_script   = backtick_script_body "(" [ call_args ] ")" | fenced_script_block "(" [ call_args ] ")" ;
-prompt_body     = double_quoted_string | IDENT | triple_quoted_block ;
-triple_quoted_block = "\"\"\"" newline { body_line newline } "\"\"\"" ;
-prompt_stmt     = "prompt" prompt_body [ returns_schema ] ;
-returns_schema  = "returns" double_quoted_string ;
-
-catch_bindings  = "(" IDENT ")" ;  (* failure payload *)
-catch_body      = single_workflow_stmt | "{" { workflow_step } "}" ;
-recover_bindings = "(" IDENT ")" ;  (* failure payload — same as catch *)
-recover_body    = single_workflow_stmt | "{" { workflow_step } "}" ;
-single_workflow_stmt = ensure_stmt | run_stmt | run_catch_stmt | run_recover_stmt | prompt_stmt
-                | const_decl_step
-                | return_stmt | fail_stmt | log_stmt | logerr_stmt
-                | send_stmt ;
-  (* Actual catch/recover bodies use parseCatchStatement in src/parse/steps.ts: a richer subset
-     than this sketch, including inline shell text for workflow recovery blocks — rule bodies still
-     reject unstructured shell via validateRuleStep. *)
-```
-
-## Validation Rules
-
-After parsing, the compiler validates references and config (`src/transpile/validate.ts`). Error codes:
-
-- **E_PARSE:** Invalid syntax — duplicate config, invalid keys/values, `$(…)` or `${var:-fallback}` in orchestration strings, `${...}` interpolation in **single-line backtick** script bodies, `prompt … returns` without `const` capture, `name = prompt …` / assignment captures without `const` for `run`/`ensure`, bare `ref(args)` in const RHS (use `run`/`ensure`/`prompt`), `local` at top level, unrecognized workflow/rule line, invalid send RHS, arguments after `catch`, bare `catch` with no recovery step, nested inline captures, shell redirection after `run`/`ensure`, invalid parameter names (non-identifier, duplicate, or reserved keyword), or missing `{` on definition line.
-- **E_SCHEMA:** Invalid `returns` schema — empty, non-flat, unsupported type (only `string`, `number`, `boolean`).
-- **E_VALIDATE:** Reference errors — unknown rule/workflow, duplicate alias, `ensure` on non-rule, `run` on rule, `run` to workflow inside rule, `run async` in rule, forbidden Jaiph usage inside `$(…)`, dot notation on non-prompt variable or invalid field name, bare identifier argument referencing an unknown variable, `${identifier}` in strings referencing an unknown variable, standalone `"${identifier}"` in call arguments (use bare identifier instead), arity mismatch (call-site argument count differs from callee's declared parameter count), **bare nested managed calls** — `run foo(bar())` or `run foo(rule_bar())` without explicit `run`/`ensure` keyword, **bare nested inline script calls** — `run foo(\`echo aaa\`())` without explicit `run`, **type crossing** — `prompt` with a script name (`scripts are not promptable`), `run` with a string const (`strings are not executable`), `const x = scriptName` (`scripts are not values`), `${scriptName}` interpolation (`scripts cannot be interpolated`).
-- **E_IMPORT_NOT_FOUND:** Import target file does not exist.
-
-Validation rules:
-
-1. At most one `config` block per file and per workflow. Workflow config must appear before steps. Only `agent.*` and `run.*` keys in workflow config.
-2. Config values must match expected types. `agent.backend` must be `"cursor"`, `"claude"`, or `"codex"`.
-3. Import aliases must be unique (`E_VALIDATE`). Import targets must exist (`E_IMPORT_NOT_FOUND`). Script import targets (external files) must also exist.
-4. **Unified namespace:** channels, rules, workflows, scripts, script import aliases, and top-level `const` share one namespace per module.
-5. `ensure` must target a rule. `run` in a workflow targets a workflow or script. `run` in a rule targets a script only. These rules also apply to `return run` and `return ensure` forms.
-6. Channel references in `send` must resolve to declared channels. Route targets on channel declarations must be workflows with exactly 3 parameters. Route declarations inside workflow bodies are rejected at parse time.
-7. `ensure … catch`, `run … catch`, and `run … recover` argument ordering: all arguments inside parentheses before `catch`/`recover`.
-8. Shell redirection (`>`, `|`, `&`) after `run`/`ensure` is rejected — use a script.
-9. **Type crossing:** `string` and `script` are non-interchangeable primitive types (see [Types](#types)). `prompt` rejects script names; `run` rejects string consts; assigning a script to a `const` or interpolating a script name with `${…}` is rejected. Each crossing produces an actionable `E_VALIDATE` message.
-10. **Explicit nested managed calls:** Bare call-like forms in argument position (`run foo(bar())`, `run foo(rule_bar())`) are rejected — add the missing `run` or `ensure` keyword. Bare inline script calls in arguments (`run foo(\`echo aaa\`())`) are also rejected — add `run`. Valid forms: `run foo(run bar())`, `run foo(ensure rule_bar())`, `run foo(run \`echo aaa\`())`.
-11. **`for iter in source`:** `source` must name a variable already in scope (`const`, capture, or parameter) — unknown names are `E_VALIDATE`.
-
-## Build Artifacts {#build-artifacts}
-
-`jaiph run` and `jaiph test` do **not** transpile workflows to shell. The CLI calls `buildScripts()`, which emits only per-`script` executable files under `scripts/`. Workflows, rules, prompts, channels, and control flow are interpreted by `NodeWorkflowRuntime` from the AST.
-
-Each `script name = …` becomes `scripts/<name>` with `chmod +x`: shebang (from fence lang tag, manual `#!`, or default `#!/usr/bin/env bash`) plus the body. Inline scripts (`` run `body`(args) `` or `` run ```lang...body...```(args) ``) are emitted as `scripts/__inline_<hash>` with deterministic hash-based names. At runtime, script subprocesses inherit the **workflow runner environment** (host `process.env` plus Jaiph variables — see [Script Isolation](#script-isolation)), not an emptied shell environment.
+| Code | Triggers |
+|---|---|
+| `E_PARSE` | Duplicate config; duplicate top-level names in the unified namespace; invalid keys/values; `$(…)` in orchestration strings; Jaiph `${identifier}` interpolation in single-line backtick script bodies; `prompt … returns` without `const` capture; `name = prompt …` / non-`const` capture; bare `ref(args)` on `const` RHS (use `run` / `ensure` / `prompt`); top-level `local`; invalid send RHS; trailing shell redirection after `run` / `ensure`; arguments after `catch` / `recover`; bare `catch` / `recover` without binding; nested inline captures; removed `wait` keyword; invalid parameter names; missing `{` on definition line. |
+| `E_SCHEMA` | Invalid `returns` schema — empty, non-flat, unsupported type. |
+| `E_VALIDATE` | Unknown rule / workflow / script; duplicate import alias; inline shell in rules; `ensure` on non-rule; `run` to workflow inside rule; `run async` in rule; forbidden Jaiph usage inside `$(…)`; dot notation on non-prompt variable or invalid field name; bare identifier argument referencing an unknown variable; `${ident}` referencing an unknown variable in orchestration strings; arity mismatch; shell redirection (`>`, `>>`, `|`, `&`) inside unquoted call-argument text; bare nested managed calls; bare nested inline-script calls; type crossings (`prompt` on a script, `run` on a string, `const x = scriptName`, `${scriptName}`). |
+| `E_IMPORT_NOT_FOUND` | Import target does not exist (module or script). |
+
+### Validation rules
+
+1. At most one `config` block per file and per workflow. Workflow `config` must precede steps. Workflow `config` allows only `agent.*` / `run.*`.
+2. Config values are type-checked. `agent.backend` must be `cursor`, `claude`, or `codex`.
+3. Import aliases must be unique. Import targets must exist.
+4. Unified per-module namespace: channels, rules, workflows, scripts, script-import aliases, and top-level `const` share one namespace. Duplicate top-level names fail at parse time (`E_PARSE`); duplicate import aliases fail in validation (`E_VALIDATE`).
+5. `ensure` targets a rule. `run` in a workflow targets a workflow or script; `run` in a rule targets a script only. Same rules apply to `return run` and `return ensure`.
+6. Channel references in `send` must resolve to declared channels. Route targets must be workflows with exactly three parameters. Inline routes in workflow bodies are `E_PARSE`.
+7. `catch` / `recover` argument ordering — all call args appear before `catch` / `recover`.
+8. Shell redirection (`>`, `>>`, `|`, `&`) on `run` / `ensure` is rejected — trailing operators are `E_PARSE`; operators in unquoted call-argument text are `E_VALIDATE`.
+9. Type crossings produce specific `E_VALIDATE` messages (see [Types](#types)).
+10. Nested managed calls require explicit `run` / `ensure` keywords. Bare nested forms are `E_VALIDATE`.
+11. `for iter in source` — `source` must name an in-scope variable.
+
+## Build artifacts
+
+`jaiph run` and `jaiph test` do not transpile workflows to shell. `buildScripts` emits only per-`script` executable files under `scripts/`:
+
+| Source form | Emitted artifact |
+|---|---|
+| `script name = \`…\`` (single-line) | `scripts/<name>` with `#!/usr/bin/env bash` (or the fence-tag / manual shebang). |
+| `script name = \`\`\`<tag>…\`\`\`` (fenced) | `scripts/<name>` with `#!/usr/bin/env <tag>` or the manual `#!` line. |
+| `` run `body`(args) `` / `` run ```lang body```(args) `` | `scripts/__inline_<12-hex>` with the deterministic name from `inlineScriptName`. |
+| `import script "path" as name` | No emission; the runtime resolves the existing file at runtime (shebangs preserved). |
 
-## Runtime Execution
+Workflows, rules, prompts, channels, and control flow are interpreted by `NodeWorkflowRuntime` from the AST. There is no workflow-level shell emission. Script subprocesses inherit the runner's `process.env` plus Jaiph metadata.
 
-At runtime, the Node workflow runtime interprets the AST directly:
+## Related
 
-- **Config:** Precedence chain: environment → workflow-level → module-level → defaults.
-- **Script subprocess environment:** Script steps receive the same **`scope.env`** as the interpreter (runner `process.env` plus Jaiph metadata and run paths). Module **`const`** bindings are **not** auto-exported — pass values via arguments or host exports.
-- **Prompt + schema:** JSON extraction and schema validation via the JS kernel. Exit codes: 0=ok, 1=parse error, 2=missing field, 3=type mismatch.
-- **ensure/run … catch:** On failure, the recovery body runs **once**. There is no retry loop. Requires explicit bindings: `catch (failure) { … }`. The binding gets the merged stdout+stderr from the failed execution.
-- **run … recover:** Repair-and-retry loop. On failure, the binding gets merged stdout+stderr, the repair body runs, and the target is retried. Loop stops on success or when `run.recover_limit` (default 10) is exhausted. Requires explicit bindings: `recover(err) { … }`.
-- **Recursion safety:** There is a hard recursion depth limit of 256. Exceeding it produces a runtime error.
-- **Assignment capture:** Rules and workflows use explicit `return "…"`. Scripts use stdout.
-- **`run async`:** Returns a `Handle<T>` value. Handle-based concurrency with implicit resolution on first non-passthrough read and implicit join of unresolved handles at workflow exit. `recover` and `catch` composition supported. Failures aggregated at join.
-- **Channels:** `send` enqueues messages on the active workflow context; after that workflow’s steps complete successfully, the runtime drains the queue and invokes route targets. A send from a nested workflow targets the **nearest ancestor** context that defines routes for that channel. Each route target must declare exactly 3 parameters; the runtime binds message, channel, and sender to the declared names.
+- [Language](language.md) — step semantics and runtime behaviour.
+- [CLI — `jaiph format`](cli.md#jaiph-format) — formatter rules and idempotence.
+- [Configuration](configuration.md) — config-key semantics referenced by the grammar.
diff --git a/docs/hooks.md b/docs/hooks.md
index 82fe6adc..0e8a98b9 100644
--- a/docs/hooks.md
+++ b/docs/hooks.md
@@ -1,152 +1,99 @@
 ---
-title: Hooks
-permalink: /hooks
+title: Add a hook
+permalink: /how-to/hooks
+diataxis: how-to
 redirect_from:
+  - /hooks
   - /hooks.md
 ---
 
-# Hooks
+# Add a hook
 
-Workflow automation often needs **side effects** outside the workflow itself: notifications, structured logging, webhooks, or CI integration. Hard-coding those into `.jh` makes modules noisy and hard to reuse. **Hooks** are a separate mechanism: optional shell commands the **CLI** runs at fixed workflow/step lifecycle points. You declare them in `hooks.json` (global or per-project); they are not part of the Jaiph language and do not run inside `NodeWorkflowRuntime`.
+This recipe wires a shell command to a workflow lifecycle event so the CLI runs it when the event fires. Hooks are observation/notification side effects (HTTP webhooks, log appenders, CI integration) — they are not part of the workflow language.
 
-The CLI parses the same **`__JAIPH_EVENT__`** JSON lines on the runner’s **stderr** that drive the progress tree. For each supported lifecycle event, it forwards a JSON **snapshot** to your commands on **stdin**. Channels, inbox files, and dispatch stay in the runtime — hooks only observe the stream and act on the host. See [Architecture — Runtime vs CLI responsibilities](architecture.md#runtime-vs-cli-responsibilities), [Architecture — Channels and hooks in context](architecture.md#channels-and-hooks-in-context), and [Architecture — Contracts](architecture.md#contracts).
+Hooks run **on the host CLI** even when the workflow runs inside Docker. The CLI dispatches them at lifecycle points — step events from parsed `__JAIPH_EVENT__` lines on the runner's stderr, plus `workflow_start` before the runner spawns and `workflow_end` after it exits — with a JSON payload on stdin per invocation.
 
-## When hooks run
+## Prerequisites
 
-Hooks run only for interactive **`jaiph run`** (including the shorthand **`jaiph <file.jh>`**, which uses the same `runWorkflow` path as **`jaiph run`**). The entry file must be a **non-test** `.jh` file (`src/cli/index.ts` routes `*.test.jh` to `jaiph test`).
+- An entry `.jh` file you can run with `jaiph run` or `jaiph <file.jh>` (hooks do **not** fire for `jaiph test`, `jaiph compile`, `jaiph format`, `jaiph init`, `jaiph install`, `jaiph use`, or `jaiph run --raw`).
+- `sh`, plus whatever tool the hook command needs (`jq`, `curl`, etc.).
 
-Hooks do **not** run for `jaiph test`, `jaiph compile`, `jaiph format`, `jaiph init`, `jaiph install`, `jaiph use`, or other commands. **`jaiph run --raw`** skips hooks (and the banner, progress tree, and failure footer) so stderr stays a clean `__JAIPH_EVENT__` stream — used when embedding Jaiph or when the host wraps a container. See [CLI — `jaiph run`](cli.md#jaiph-run).
+## 1. Create the hooks file
 
-For local runs, hooks use the same machine as the workflow. For **Docker-backed** runs, hook commands still execute on the **host** CLI process, not inside the container. See [Sandboxing — Runtime behavior](sandboxing.md#runtime-behavior).
-
-## Config locations and precedence
+Hooks come from one of two locations. Project hooks override global hooks **per event** (lists are not merged): if the project file defines commands for an event, only those run; omit an event to keep the global commands for that event.
 
 | Scope | Path |
-|-------|------|
+|---|---|
 | Global | `~/.jaiph/hooks.json` |
-| Project-local | `<workspace>/.jaiph/hooks.json` |
-
-Both files are optional. `<workspace>` is resolved the same way as `JAIPH_WORKSPACE` for `jaiph run`: walk up from the entry `.jh` file’s directory, with guards for temp directories and nested sandboxes. Full rules: [CLI — Environment variables](cli.md#environment-variables).
-
-**Precedence is per event:** if the project file defines at least one non-empty command for an event, **only** those commands run and global commands for that event are ignored (lists are not merged). If the project file omits an event or only has empty / skipped entries for it, global commands apply for that event. Changing `step_end` in the project file does not affect how `workflow_start` is resolved.
-
-Unsupported keys in the JSON object are ignored — `parseHookConfig` in `src/cli/run/hooks.ts` only reads the four supported event names.
+| Project | `<workspace>/.jaiph/hooks.json` |
 
-There is no explicit “disable hooks” flag. To silence a global hook for one project, override that event with a no-op, e.g. `"workflow_end": ["true"]`.
+Both files are optional. Invalid JSON logs `jaiph hooks: …` on stderr and is skipped. Create the one you want:
 
-## Schema
+```bash
+mkdir -p .jaiph
+cat > .jaiph/hooks.json <<'EOF'
+{
+  "step_end": [
+    "jq -c '{event,step_kind,step_name,status,elapsed_ms}' >> \"$HOME/.jaiph/step-events.jsonl\""
+  ]
+}
+EOF
+```
 
-Each file must be a single JSON **object** at the root (not an array) mapping **event names** to **arrays of shell commands**:
+## 2. Map events to commands
 
-- Keys must be supported event names (see [Supported events](#supported-events)).
-- Values must be arrays. A non-array value for a known key is skipped for that event.
-- Elements must be non-empty strings (one shell command each). Empty strings and non-string elements are skipped. If every element is skipped, that event is not defined in the normalized config, so the other file’s commands can apply (see [Config locations and precedence](#config-locations-and-precedence)).
+The schema is a JSON object mapping event names to **arrays** of shell commands. The supported events are `workflow_start`, `workflow_end`, `step_start`, `step_end`:
 
 ```json
 {
   "workflow_start": ["echo 'run started'"],
-  "workflow_end": ["curl -s -X POST https://example.com/jaiph/end -d @-"],
-  "step_start": [],
-  "step_end": ["jq -c . >> \"$HOME/.jaiph/step-events.jsonl\""]
+  "step_end":       ["jq -c . >> /tmp/jaiph-steps.jsonl"],
+  "workflow_end":   ["curl -s -X POST https://example.com/jaiph/end -d @-"]
 }
 ```
 
-An empty array normalizes to “no commands from this file for this event,” so resolution falls back to the other config file when the project file does not override that event.
+Each command runs as `sh -c '<command>'` with the JSON payload written to **stdin**. Stdin can only be read once per process; if you need the payload twice, buffer it:
 
-## Supported events
-
-| Event | When it fires |
-|-------|---------------|
-| `workflow_start` | After **`buildScripts`** completes (parse, **`validateReferences`**, script extraction to `scripts/`) on the CLI host, and **before** the workflow runner subprocess is spawned. The interactive **banner** has already been printed (and, when Docker sandboxing is enabled, **`prepareImage`** has already run) — see `runWorkflow` in `src/cli/commands/run.ts`. Does not fire if compilation fails earlier (`buildScripts` throws before `emitter.emit("workflow_start", …)`). |
-| `workflow_end` | At the start of **`reportResult`** in `src/cli/commands/run.ts`: after the runner exits (any status) and stderr has been drained, **before** the CLI prints PASS/FAIL. |
-| `step_start` | When the CLI parses a `STEP_START` **`__JAIPH_EVENT__`** line on the runner’s stderr (same stream as the progress tree). Includes nested steps. The root **`workflow default`** step still emits `STEP_START`; the TTY subscriber skips **drawing** that start row (`data.isRoot` in `registerTTYSubscriber`, `src/cli/run/stderr-handler.ts`). |
-| `step_end` | When the CLI parses a matching `STEP_END` line on that stream. The TTY subscriber also skips drawing the root step’s completion row (`data.isRoot`). |
+```bash
+p=$(cat); echo "$p" | jq -r .status; echo "$p" | jq -r .run_path
+```
 
-Step `kind` values come from the runtime event payload (`workflow`, `rule`, `script`, `prompt`). See [CLI — Run progress and tree output](cli.md#run-progress-and-tree-output).
+Hook stdout is discarded; hook stderr is copied to the CLI's stderr. Hook failures never change the workflow exit code — the CLI logs `jaiph hooks: …` lines and continues.
 
-## Payload
+## 3. Run the workflow
 
-Each command receives one JSON object on **stdin** (UTF-8). Parse with `jq`, `python3 -c`, or your tool of choice. Stdin can only be read once per process; buffer it in a variable if you need the payload multiple times (see [Examples](#examples)).
+```bash
+jaiph run ./flow.jh
+```
 
-### Fields
+Each registered hook fires when the CLI dispatches its event. Step hooks follow a matching `__JAIPH_EVENT__` line on the runner's stderr; `workflow_start` and `workflow_end` are emitted by the CLI itself. For every hook the CLI writes the JSON payload to stdin and does not wait — commands can overlap in wall-clock time. Lifecycle order is still `workflow_start` → `step_*` → `workflow_end`; within one event, commands spawn in config order but may finish in any order.
 
-| Field | Present in | Description |
-|-------|------------|-------------|
-| `event` | all | `workflow_start`, `workflow_end`, `step_start`, or `step_end`. |
-| `workflow_id` | all | Runtime `run_id` from each `STEP_*` line. Empty on `workflow_start`. For `workflow_end`, the CLI reuses the first non-empty `run_id` it buffered while parsing stderr (`workflowRunId` in `RunState`, `src/cli/run/stderr-handler.ts`); it stays empty if the runner never emitted one. `step_start` / `step_end` echo the `run_id` from that event. |
-| `timestamp` | all | ISO 8601 string. For `step_*`, the event’s `ts` when non-empty; otherwise the CLI synthesizes one at hook time. `workflow_start` and `workflow_end` timestamps come from the CLI when those hooks fire. |
-| `run_path` | all | Absolute path to the `.jh` entry file. |
-| `workspace` | all | Workspace root directory (same rules as [Config locations](#config-locations-and-precedence)). |
-| `step_id` | `step_*` | Step id for progress and captures; from the event’s `id`, or a synthesized `legacy:<n>:<func>` value when the runtime left `id` empty so starts and ends still pair (`resolveEventId` in `src/cli/run/stderr-handler.ts`). |
-| `step_kind` | `step_*` | `workflow`, `rule`, `script`, or `prompt`. |
-| `step_name` | `step_*` | Step name (e.g. `default`, `scan_passes`). |
-| `status` | `*_end` | **Step:** exit status from the `STEP_END` event (0 success, non-zero failure; missing / null status becomes `1` in the hook payload via `?? 1`). **Workflow:** the CLI’s resolved outcome — **`0` success or `1` failure** (not the raw child exit code): non-zero subprocess exit or `hasFatalRuntimeStderr` yields `1` (`reportResult` in `src/cli/commands/run.ts`). |
-| `elapsed_ms` | `*_end` | **`workflow_end`:** wall-clock ms from when the CLI recorded `startedAt` (start of the main `try` in `runWorkflow`, after the scratch/target directory exists — so **after** module metadata is read and `outDir` exists, and **including** banner, **`buildScripts`**, the full runner lifetime, and stderr drain) until the hook runs. **`step_end`:** duration from the `STEP_END` event, or `0` if missing. |
-| `run_dir` | `workflow_end` | Absolute run log directory from runner metadata (or Docker discovery). Omitted if unavailable. |
-| `summary_file` | `workflow_end` | Absolute path to `run_summary.jsonl` when metadata provides it. See [CLI — Run summary](cli.md#run-summary-jsonl). |
-| `out_file` | `step_end` | Stdout capture path from the `STEP_END` event. The hook omits this JSON key when the parsed event has an empty `out_file` string (`registerHooksSubscriber` in `src/cli/run/hooks.ts`). Current runtimes normally emit paths for every completed step; files may still be empty. |
-| `err_file` | `step_end` | Stderr capture path; same omission rule as `out_file`. |
+## Verification
 
-### Payload by event
+Tail your hook's output target after a run:
 
-- **`workflow_start`** — `event`, `workflow_id` (empty string), `timestamp`, `run_path`, `workspace`.
-- **`step_start`** — `event`, `workflow_id`, `timestamp`, `run_path`, `workspace`, `step_id`, `step_kind`, `step_name`.
-- **`step_end`** — same base as `step_start`, plus `status`, `elapsed_ms`, and optionally `out_file` / `err_file`.
-- **`workflow_end`** — `event`, `workflow_id`, `status` (0 or 1), `elapsed_ms`, `timestamp`, `run_path`, `workspace`, and optionally `run_dir` / `summary_file`.
+```bash
+tail -n 5 "$HOME/.jaiph/step-events.jsonl"
+```
 
-Example payload (`step_end`):
+A successful step_end record looks like:
 
 ```json
-{
-  "event": "step_end",
-  "workflow_id": "abc-123",
-  "step_id": "run:1:1",
-  "step_kind": "workflow",
-  "step_name": "default",
-  "status": 0,
-  "timestamp": "2026-03-11T12:00:00.000Z",
-  "elapsed_ms": 1500,
-  "run_path": "/repo/flows/ci.jh",
-  "workspace": "/repo",
-  "out_file": "/repo/.jaiph/runs/2026-03-11/12-00-00-ci/000001-ci__step.out",
-  "err_file": "/repo/.jaiph/runs/2026-03-11/12-00-00-ci/000001-ci__step.err"
-}
+{"event":"step_end","step_kind":"workflow","step_name":"default","status":0,"elapsed_ms":1500}
 ```
 
-Shape definitions in repo: **`HookPayload`** / **`HookEventName`** in `src/types.ts`.
+The jq filter above drops several fields. A full `step_end` payload also includes `workflow_id`, `step_id`, `timestamp`, `run_path`, and `workspace`, and may include `out_file` / `err_file` when log captures exist.
 
-## Behavior
+## Disable a global hook for one project
 
-- **Shell:** Each command runs as `sh -c '<command>'` (POSIX `sh` on the **`PATH`** of the `jaiph run` process).
-- **Concurrency:** Every command for one event is spawned in a loop **without** waiting for the previous process to exit, so hook commands for the same event overlap in wall time. The CLI also **does not wait** for hook processes between lifecycle stages: a `workflow_end` hook may start while `step_end` hooks spawned earlier are still running. Causal order is only **when spawns happen**: `workflow_start` → step hooks as stderr lines are processed → `workflow_end` before PASS/FAIL.
-- **Best-effort:** Hook failures never change the CLI exit code. Non-zero exits or spawn errors log `jaiph hooks: …` lines on stderr; the workflow result is unchanged.
-- **I/O:** Hook stdout is discarded. Hook stderr is copied to the CLI’s stderr. The JSON payload is written with `stdin.end(payloadJson, "utf8")` per process; if a hook exits before reading stdin, delivery is best-effort and may log an error.
-- **Environment:** Hooks receive a shallow copy of `process.env` at hook spawn time.
-- **Working directory:** The child’s cwd is **not** reset by the hook runner — it inherits the **`jaiph run` process cwd** (often where you launched the CLI), not necessarily `workspace`. Use the `workspace` field from stdin for project-root paths.
-
-**Invalid or missing config:** Missing files are skipped silently. A file that exists but fails `JSON.parse` or is not a JSON object produces a stderr warning and is ignored. Bad per-event values are skipped without rejecting the rest of the file (`parseHookConfig` in `src/cli/run/hooks.ts`).
-
-## Examples
-
-**Global `~/.jaiph/hooks.json` — POST the workflow-end payload to an HTTP endpoint** (replace the URL with yours):
-
-```json
-{
-  "workflow_end": ["curl -s -X POST https://example.com/jaiph/end -d @-"]
-}
-```
-
-**Project `.jaiph/hooks.json` — append a one-line JSON record per finished step, and log each workflow end under the workspace:**
+There is no explicit "disable" flag. An empty array does not override global hooks. Override the event in the project file with a no-op instead:
 
 ```json
-{
-  "step_end": ["jq -c '{event,step_kind,step_name,status,elapsed_ms}' >> \"$HOME/.jaiph/step-events.jsonl\""],
-  "workflow_end": ["p=$(cat); echo \"$p\" | jq -c '{event,status,run_dir,summary_file}' >> \"$(echo \"$p\" | jq -r .workspace)/.jaiph/workflow-ends.jsonl\""]
-}
+{ "workflow_end": ["true"] }
 ```
 
-Stdin is one-shot per process. The `workflow_end` command stores the payload in `p` so it can feed multiple `jq` invocations. The `step_end` line reads stdin once inside a single `jq` pipeline.
-
-The `step_end` example uses `$HOME` so it does not depend on the shell cwd. The `workflow_end` line resolves the log path via the payload’s `workspace` field.
+## Related
 
-**Project overrides global:** If global defines `workflow_end: ["global-notify.sh"]` and the project defines `workflow_end: ["project-notify.sh"]`, only `project-notify.sh` runs.
+- [Architecture — Channels and hooks in context](architecture.md#channels-and-hooks-in-context) — where hooks sit relative to runtime semantics.
+- [Architecture — Runtime vs CLI responsibilities](architecture.md#runtime-vs-cli-responsibilities) — why hooks run on the host even for Docker runs.
+- [Run a workflow in a Docker sandbox](/how-to/sandbox-run) — Docker runs still hit host hooks.
diff --git a/docs/inbox.md b/docs/inbox.md
index 6875d5eb..f79edfa0 100644
--- a/docs/inbox.md
+++ b/docs/inbox.md
@@ -1,358 +1,96 @@
 ---
 title: Inbox & Dispatch
 permalink: /inbox
+diataxis: explanation
 redirect_from:
   - /inbox.md
 ---
 
-# Inbox & Dispatch
+# Inbox & Dispatch — the design
 
-## Overview
+Workflows often need to hand work off to other workflows without wiring direct calls between them. The sender knows it has produced a finding; it should not have to know which workflows want to react to that finding, or in what order. Jaiph addresses this with **channels** — a small, in-process message-passing model that lives inside the same workflow runtime as everything else.
 
-Many pipelines split work across stages: one part of the system produces a
-payload and another reacts later. Without standing up a message broker, a
-common pattern is an **in-process queue**: producers enqueue messages, and the
-runtime drains that queue at predictable boundaries so receivers run in order.
+This page explains the *model*: how channels behave, why the design is shaped the way it is, and how the pieces fit together. For the surface syntax see the [Language](language.md) and [Grammar](grammar.md) references; for the runtime implementation see [Architecture — Channels and hooks in context](architecture.md#channels-and-hooks-in-context).
 
-**Jaiph’s channels** follow that pattern at workflow granularity. You declare a
-`channel` at module scope, optionally list workflow targets after `->`, and use
-`<-` inside a workflow to enqueue a **string** payload. Routing on the
-`channel … ->` line is **static** (parsed into the AST); nothing “fires” at
-parse time. Delivery happens later: after a workflow’s steps finish — including
-waiting out any **`run async`** handles joined at workflow exit — the runtime
-drains that workflow frame’s queue and **`run`s** each route target in order.
+## What problem channels solve
 
-Under the hood, `NodeWorkflowRuntime` keeps queues and route maps **in memory**
-(see [Architecture — Channels and hooks in context](architecture.md#channels-and-hooks-in-context)).
-**`run_summary.jsonl`** records **`INBOX_ENQUEUE`** on every send (metadata only;
-see [Trigger contract](#trigger-contract)). **`inbox/NNN-<channel>.txt`** files
-are optional **audit** copies of the payload for **routed** sends only; routing
-does not read them back — no filesystem watchers or inbox polling. Which stack
-frame owns routes, and how sends bubble to an ancestor frame, is spelled out in
-[Who registers routes and who drains](#who-registers-routes-and-who-drains).
+Two patterns recur in real workflows:
 
-## At a glance
+- **Late binding** — a workflow produces something (a finding, a summary, a verdict) and another workflow should react to it, but the producer should not be coupled to the consumer's name or signature.
+- **Fan-out without a broker** — multiple subscribers should hear the same event. Standing up a message broker for an in-process workflow runner is heavy and turns durable orchestration into a distributed-systems problem.
 
-```jh
-channel findings -> analyst
-
-workflow researcher() {
-  findings <- "## analysis results"
-}
+Channels give workflows a publish/subscribe surface without leaving the process. The producer declares "this is a finding"; the channel declaration ties findings to one or more listeners; the runtime delivers them.
 
-workflow analyst(message, chan, sender) {
-  log "Received: ${message}"
-}
-
-workflow default() {
-  run researcher()
-}
-```
+## Drain-driven, not file-watched
 
-`researcher` sends data to the `findings` channel. The `channel findings -> analyst`
-declaration routes `findings` messages to `analyst`, which receives the message,
-channel name, and sender bound to its declared parameters `message`, `chan`, and
-`sender` (see [Trigger contract](#trigger-contract)).
+The most important property of the inbox model is that **delivery is drain-driven**. Sends do not "fire" routes the moment the `<-` line executes. Instead, each workflow frame owns an in-memory queue; a `send` enqueues on the nearest stack frame that declares routes for the channel (or on the sender's frame when none do — see [Routed vs unrouted sends](#routed-vs-unrouted-sends)). The runtime drains **that frame's** queue only **after that frame's step list finishes** — including the implicit join of any `run async` handles created in that step list ([Spec: Async Handles](spec-async-handles.md)). Only then does the runtime invoke each route target, sequentially, in declaration order.
 
-## Design principles
+This is intentional:
 
-- **Drain-driven delivery, not a filesystem mailbox.** Messages are drained from an
-  in-memory queue **after each workflow finishes its steps** (including the implicit
-  join for `run async`). `inbox/*.txt` is an optional audit copy for routed sends —
-  routing does **not** read from disk — no `inotifywait`, `fswatch`, or polling loops.
-- **Sequential dispatch.** For each queued message, route targets run **in list
-  order** (declaration order on the `channel` line), strictly **one after
-  another**. Older Jaiph releases exposed parallel inbox dispatch via config /
-  environment variables; that mode is **removed** — `run.inbox_parallel` is an
-  unknown config key and **`JAIPH_INBOX_PARALLEL` has no effect** on ordering.
-- **Inbox is scoped per run.** **`inbox/*.txt`** persists **routed** payloads under that UTC run directory (**[Architecture — Durable artifact layout](architecture.md#durable-artifact-layout)**); there is no repo-wide mailbox outside **`.jaiph/runs`**.
-- **Channels are compile-checked.** Unknown channels, bad route targets, and
-  invalid `send` RHS forms are `E_PARSE` / `E_VALIDATE` from
-  `validateReferences` in the build path; **`buildRuntimeGraph()`** only parses
-  modules and does not repeat that pass (see [Architecture — Summary](architecture.md#summary)).
+- There is **no `inotifywait`, no `fswatch`, no polling loop**. The `inbox/NNN-<channel>.txt` files under the run directory are an audit copy of routed sends, not a delivery mechanism — routing does not read them back.
+- Producers run to completion before any consumer starts. A workflow that emits five findings does not get partly interrupted by a route target firing mid-step list.
+- Delivery is deterministic. For a given send order, the dispatch order is fixed.
 
-## Syntax
+The trade-off is that channels are **not** a low-latency notification primitive. They are an end-of-step-list handoff. For tighter coordination, use a direct `run` call.
 
-### Channel declarations: `channel <name> [-> <workflow>, ...]`
+## Routes belong on the channel, not on workflows
 
-Declare channels at top level, one per line. Optionally declare inline routes
-with `->`:
+A channel declaration carries its targets inline:
 
 ```jh
-channel findings -> analyst
-channel report
-channel events -> handler_a, handler_b
-
-workflow default() { ... }
+channel findings -> analyst, reviewer
 ```
 
-Every channel used by send (`<-`) must be defined in the current module or
-imported from another module (e.g. `shared.findings`). Undefined channels fail
-validation with:
-
-- `Channel "<name>" is not defined`
-
-### Send operator: `<channel_ref> <- <rhs>`
+Routes are top-level static data on `ChannelDef`, not statements inside a workflow body. The design choice has two consequences worth understanding:
 
-The channel reference is always on the left side of the `<-` operator. Valid
-channel forms:
+1. **One canonical subscription list per channel.** The compiler can validate every target up front: targets must be workflows (rules and scripts are rejected), they must declare exactly three parameters, and unknown names fail with `E_VALIDATE` at compile time, not at dispatch time.
+2. **Routes are visible at the module boundary.** A reader can see "who listens on `findings`" without scanning workflow bodies for ad-hoc wiring. Routing intent lives next to the channel it describes.
 
-- local channel: `findings`
-- imported channel: `shared.findings` — checked against the import at compile time; **dispatch** still matches **`routes.has()`** with the **literal** token (see [Module scope](#who-registers-routes-and-who-drains))
+The runtime registers routes only on the **entry** workflow frame when that workflow starts: it reads `channel … ->` declarations from that workflow's module. Nested `run` frames always keep an empty map, so sends from callees walk the workflow stack outward to the orchestrator frame that registered the channel.
 
-The send step resolves the **string** payload from the **RHS**, bumps **`inboxSeq`**, and appends an **`InboxMsg`** to the queue on the workflow context selected by walking **from the sender outward** until **`ctx.routes.has(sendChannel)`** — **`sendChannel`** is the exact text left of **`<-`**. If nothing matches, enqueue on the sender’s context (**`routed === false`**; no **`inbox/*.txt`** row). If a match exists (**`routed === true`**), create **`inbox/`** when needed and write **`NNN-<sendChannel>.txt`** sharing the same **`inbox_seq`** as JSONL.
+A `channel <name>` line without `->` still defines the name for `send` validation but never enters the route map — sends on a bare channel are still queued (and `INBOX_ENQUEUE` is still recorded for the timeline), they just have no consumer.
 
-**`INBOX_ENQUEUE`** is always written (`channel`, **`sender`**, **`inbox_seq`**, **`ts`**, **`run_id`**, **`event_version`**) and **does not** embed the payload body (`node-workflow-runtime.ts`).
+## Sequential dispatch is the only mode
 
-Valid RHS forms:
+For each queued message, route targets run **strictly in declaration order, one at a time**. The next message is not processed until every target for the current message has completed. There is no opt-in parallel mode; older builds exposed one and it has been removed.
 
-| RHS form | Example | Behavior |
-|---|---|---|
-| Double-quoted literal | `findings <- "## results"` | Interpolated string |
-| Triple-quoted block | `findings <- """line1\n  ${x}"""` | Multiline string; margin rules match other `"""` steps (see [Grammar](grammar.md#send--channel-messages)) |
-| Variable expansion | `findings <- ${var}` or `$name` | Value of the variable |
-| `run` capture | `findings <- run build_msg()` | Return value or trimmed stdout of the workflow/script |
+The reason is failure semantics. With sequential dispatch:
 
-The RHS does **not** accept raw shell commands or bare workflow/rule/script
-names (use a string, `$` / `${…}`, or `run ref(…)` — see
-[Grammar — `send`](grammar.md#send--channel-messages) and
-[Grammar — `channel` routing](grammar.md#channel-routing)).
+- A target's failure is the failure of that delivery. Subsequent targets for the same message are skipped (fail-fast).
+- Cascading sends from inside a route target enqueue on the orchestrator frame's queue and are drained in the same pass, so a chain of sends produces a deterministic timeline.
+- There is no need for users to reason about which side effects of two parallel handlers happened first.
 
-```jh
-channel findings
-
-workflow researcher() {
-  findings <- "## findings"
-}
-```
+A single frame's drain pass is bounded (default **1000** messages; override with `JAIPH_INBOX_MAX_DISPATCH`) so circular send loops abort with `E_INBOX_DISPATCH_LIMIT` instead of running forever.
 
-An explicit RHS is always required — bare `channel <-` (without a value) is invalid.
-
-The `<-` operator is only recognized when it appears outside of quoted strings
-on the surrounding line so channel names and literals are not misread as send
-syntax.
-
-Send and route syntax, plus compile-time checks, are summarized under
-[Grammar — `send`](grammar.md#send--channel-messages) and
-[Grammar — `channel` routing](grammar.md#channel-routing); the EBNF and
-validation list live at the end of [Grammar](grammar.md#validation-rules).
-
-### Route declaration: `channel <name> -> <workflow>`
-
-Routes are declared **inline on channel declarations** at the top level, not
-inside workflow bodies. When a message arrives on that channel, the runtime calls
-each listed **workflow** that must declare exactly 3 parameters. The runtime
-binds the dispatch values (message, channel, sender) to whatever names the
-target declares.
-
-Targets must be **workflows** (local or imported as `alias.name`). **Rules**
-and **scripts** are not valid route targets — the compiler uses workflow-only
-reference checks, so a bad target is **`E_VALIDATE`** with messages such as
-`unknown local workflow reference "…"`, `imported workflow "…" does not exist`,
-`rule "…" must be called with ensure`, or `script "…" cannot be called with run`
-(see [Grammar — `channel` routing](grammar.md#channel-routing) for a short
-version of the same rules). A name that is not a valid
-`alias.name` / `name` pattern fails at parse time as **`E_PARSE`**
-`invalid workflow reference in channel route: "…"`. The wrong **parameter
-count** on a resolved workflow is
-`E_VALIDATE: inbox route target "…" must declare exactly 3 parameters (message, channel, sender), but declares N`.
+When concurrency matters, the right tool is `run async` inside a target body, not parallel dispatch across targets.
 
-```jh
-channel findings -> analyst
-channel summary -> reviewer
+## Routed vs unrouted sends
 
-workflow default() {
-  run researcher()
-}
-```
+The same `<-` operator behaves slightly differently depending on whether any frame on the workflow stack has the channel in its route map:
 
-**Multiple targets on one declaration** are comma-separated — they share one
-route and dispatch in **declaration order**, sequentially:
+- **Routed** — some frame on the workflow stack has the bare channel name in its route map (an imported `alias.` prefix is stripped before lookup). The runtime walks outward from the sender until it finds that frame, enqueues the payload on **its** queue, and writes `inbox/NNN-<channel>.txt` under the run directory as an audit copy.
+- **Unrouted** — no frame on the stack has the channel in its route map. The message is still queued on the sender's own frame, and `INBOX_ENQUEUE` is still appended to `run_summary.jsonl`, but no audit file is written and the sender's drain pass skips it (no targets to `run`).
 
-```jh
-channel findings -> analyst, reviewer
-```
+Unrouted sends are intentionally a silent drop, not an error. This lets optional subscribers be just that: a workflow can publish on `metrics` even if no one is listening today, and tomorrow a subscriber can be wired up without touching the producer. If a missing handler should be a hard failure, the right place to assert it is in a test or a `rule` check, not in the channel runtime.
 
-Route declarations are static routing rules stored on `ChannelDef`, not on
-workflow definitions or steps. The compiler validates that all target workflow
-references exist and declare exactly 3 parameters.
+## The trigger contract
 
-A **`channel <name>`** line **without** **`->`** still defines **`name`** for **`send`**
-validation, but the runtime **never** adds **`name`** to **`ctx.routes`** — only
-channels with **at least one** **`->`** target populate the route map
-(**`node-workflow-runtime.ts`** skips bare channels when building **`routes`**).
-Sends on those names therefore behave like **unrouted** sends (no **`inbox/*.txt`**),
-and **`drainWorkflowQueue`** has nothing to **`run`** for them.
+A receiver workflow is a normal workflow, dispatched with three positional arguments bound to the parameters it declares:
 
-A `->` route inside a workflow body is a **parse error** with guidance:
-`route declarations belong at the top level: channel <name> -> <targets>`.
-
-### Capture + send is a parse error
-
-```jh
-# E_PARSE: capture and send cannot be combined; use separate steps
-name = channel <- cmd
-```
-
-Use two steps instead:
-
-```jh
-const payload = run build_message()
-channel <- "${payload}"
-```
+| Position | Meaning |
+|---|---|
+| 1st parameter | The message payload (the string sent on `<-`) |
+| 2nd parameter | The channel name (bare, e.g. `findings`) |
+| 3rd parameter | The sender — the workflow name that performed the send |
 
-## Inbox layout
+The receiver picks its own parameter names. That is the entire contract: no environment plumbing, no special globals, no implicit context object. Targets that declare a different parameter count are rejected at compile time so receivers cannot drift away from the dispatch shape.
 
-Under the run directory (see [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout)):
+## Why this design, in one paragraph
 
-```
-.jaiph/runs/<YYYY-MM-DD>/<HH-MM-SS>-<source-basename>/inbox/
-  001-findings.txt
-  002-summary.txt
-  003-findings.txt
-  ...
-```
+Channels are a deliberately small idea in Jaiph. They are an in-process, drain-driven, sequentially-dispatched, late-binding handoff between workflows — described once at the top of the module, validated at compile time, and recorded in `run_summary.jsonl` (every send) plus `inbox/` audit files (routed sends only) for after-the-fact inspection. Anything more powerful (concurrency, brokers, retries, dead-letter queues) is intentionally out of scope: those problems belong to other tools, and Jaiph keeps channels small enough to reason about without leaving the runtime.
 
-When present, files are **`NNN-<channel>.txt`** (`NNN` = **three**‑digit **`inboxSeq`**,
-same value as **`inbox_seq`** in **`INBOX_ENQUEUE`**). **`inboxSeq`** is shared across
-every `send` in the process for that run, so numbering matches **enqueue order**, not “per channel”.
-Persisted payloads are exactly the **routed** sends — the orchestration queue is always in memory.
-
-## Runtime dispatch
-
-### Who registers routes and who drains
-
-Every entered workflow gets a **`WorkflowContext`**: `workflowName`, a route **`Map`**,
-and a message queue. **`->` bindings are populated only on “entry” workflows:**
-the interpreter passes **`inheritCallerMetadataScope === false`** for **`jaiph run`’s
-`default`**, for **`runNamedWorkflow`** (used by **`jaiph test`**’s
-**`test_run_workflow`**), and for any other path that starts a workflow the same
-way — so **`routes`** mirror **that callee module’s** top-level **`channel ->`** lines,
-not modules you only **`import`**. Each nested **`run child()`** passes **`inheritCallerMetadataScope === true`**, which keeps **`routes`** as an **empty** **`Map`**
-(see **`node-workflow-runtime.ts`** — routes register only when **not** inheriting the caller metadata scope), so **`send`** walks **up the workflow stack** until **`routes.has(step.channel)`** succeeds (**`step.channel`** is the exact AST token left of **`<-`**).
-After **each** workflow body finishes (implicit **`run async` join included), **`drainWorkflowQueue`** runs for **that** frame’s queue and route table **before** the frame pops — nested exits are usually no-ops, while the **`jaiph run`** root drains work that nested sends enqueued onto it.
-
-**Module scope.** `ctx.routes` **keys** are bare names from **`channel <name>`** in the callee module (**`parseChannelLine`**). Imports allow **`lib.topic <-`** (validator proves **`topic`** exists inside **`lib`**) yet **`routes.has("lib.topic")`** is still **false** for default layouts, because registered keys omit the **`alias.`** prefix (**`step.channel`** is compared verbatim). Prefer **`topic <-`** next to **`channel topic -> …`** in the **entry module** (the workflow started by **`jaiph run`** or **`runNamedWorkflow`**), or **`jaiph run lib.jh`** when **`lib.jh`'s **`channel`** lines should supply the **`->`** bindings.
-
-### Dispatch loop
-
-Implementation: `src/runtime/kernel/node-workflow-runtime.ts` — `send` step
-handling and `drainWorkflowQueue`.
-
-1. On workflow entry, push a `WorkflowContext` (route map, empty queue).
-2. When **`inheritCallerMetadataScope === false`**, copy each **`channel <name> -> …`** from **`graph.modules.get(resolved.filePath)`**’s AST into **`ctx.routes`**; nested **`run`** frames leave **`routes`** empty.
-3. Execute workflow steps top to bottom.
-4. On `<-`: resolve payload; bump `inboxSeq` (`NNN` zero-padded to **3** digits);
-   enqueue on the routed context selected by scanning the stack outward; **`if routed`**
-   write `inbox/NNN-<channel>.txt`; always append **`INBOX_ENQUEUE`**
-   (`channel`, `sender`, **`inbox_seq`**, **`ts`**, **`run_id`**, **`event_version`**) to **`run_summary.jsonl`**.
-5. After all steps (and implicit `run async` joins) complete,
-   `drainWorkflowQueue`:
-   - `while (cursor < queue.length)` — new sends during dispatch append to the
-     same queue and are processed in subsequent iterations.
-   - For each message, look up targets for `channel` on **that** workflow's
-     context. If there is no route, **skip** (silent drop).
-   - If there are targets, invoke each target **sequentially** in target-list
-     order, binding message, channel, and sender to the target's 3 declared
-     parameters (see [Ordering and sequence ids](#ordering-and-sequence-ids)).
-6. Pop the workflow context and return.
-
-There is no `E_DISPATCH_DEPTH` / `JAIPH_INBOX_MAX_DISPATCH_DEPTH` check in
-`NodeWorkflowRuntime`'s drain loop. Avoid unbounded circular sends in orchestration.
-
-### Implementation notes
-
-- Routes (from channel-level `->` declarations) and the pending queue live **in-memory** on **`WorkflowContext`**.
-  Routing consults **`ctx.routes` + `ctx.queue`**; **`inbox/NNN-….txt`** is written **only when** **`if (routed)`** after enqueue — see **`send`** in **`node-workflow-runtime.ts`**.
-- **Sender identity** is the **current workflow name** from the context that
-  performed the send (e.g. `researcher`), stable across modules.
-
-### Ordering and sequence ids
-
-Messages are handled **one at a time** in queue order (FIFO). For each message,
-targets run **strictly in list order** on the `channel` line; the next message is
-not processed until all targets for the current message have finished (success, or
-fail-fast on the first non-zero exit).
-
-- **Sequence ids:** Monotonic per run in the runtime (`inboxSeq`); message
-  filenames use the same padded counter.
-
-## Error semantics
-
-- **Undefined channel reference:** validation error `Channel "<name>" is not defined`.
-- **Dispatched workflow exits non-zero:** the owning workflow fails; the first
-  failing target stops further targets for that message (fail-fast).
-- **No route for a channel:** the **`InboxMsg`** is still queued and **`INBOX_ENQUEUE`**
-  is recorded, but **`inbox/*.txt`** is **not** written and **`drainWorkflowQueue`** has
-  no targets (`routes.get(channel)` empty) → the message is **skipped** with no receivers
-  (silent drop). This is intentional for optional subscribers; declare explicit routes if
-  a missing handler should be an error.
-- **Circular sends:** the in-memory queue can grow without a built-in iteration
-  cap in `NodeWorkflowRuntime`. Avoid circular sends that grow the queue without bound.
-
-## Trigger contract
-
-Routed receivers get three dispatch values bound to their declared parameters:
-
-| Param position | Dispatch value |
-|---|---|
-| 1st declared parameter | Message payload (content sent to the channel) |
-| 2nd declared parameter | Channel name (e.g. `findings`) |
-| 3rd declared parameter | Sender name (the **workflow name** that performed the send) |
-
-Receivers get channel and sender via their declared parameter names —
-no environment-variable plumbing.
-
-- **`run_summary.jsonl`:** **`NodeWorkflowRuntime`** appends **`INBOX_ENQUEUE`** on every **`send`**,
-  then **`INBOX_DISPATCH_START`** / **`INBOX_DISPATCH_COMPLETE`** (with **`elapsed_ms`** and **`status`**)
-  per routed-target invocation (`appendRunSummaryLine`).
-
-  **`INBOX_ENQUEUE`** (current **`NodeWorkflowRuntime`**) records **`type`**, **`ts`**, **`run_id`**,
-  **`channel`**, **`sender`**, **`inbox_seq`**, **`event_version`** — **not** the message body.
-
-  Routed sends also get the full payload on disk as **`inbox/NNN-<channel>.txt`**. Tooling must read
-  that file **or** the receiver’s **`STEP_*` / script captures for the full string; unrouted sends
-  have **only** enqueue metadata in JSONL (plus whatever you log around the **`send`**).
-- **Calling a receiver with explicit args:** the CLI’s `jaiph run` only starts
-  the file’s `default` workflow; extra CLI arguments are passed to `default`
-  (see [CLI — `jaiph run`](cli.md#jaiph-run)). There is no `jaiph run
-  <name> <file> …` form. To hand `(message, channel, sender)` to a workflow
-  such as `analyst` outside of inbox dispatch, use a **`run` step** from another
-  workflow, e.g. `run analyst("…", "findings", "researcher")` (or
-  `test_run_workflow` in `*.test.jh`).
-
-## Progress tree integration
-
-- Channel‑level **`channel … ->`** declarations surface in the CLI’s **static** step-tree
-  view (derived from the module AST alongside concrete steps).
-- Dispatched workflows render like other **`run`** steps (same shape as `workflow analyst (message="…", chan="findings", sender="scanner")` in **`e2e/tests/91_inbox_dispatch.sh`**). Live **`STEP_START` / `STEP_END`** payloads from **`NodeWorkflowRuntime`** do **not** add inbox-specific **`dispatched` metadata** (**`events.ts`** still tolerates **`dispatched: true`** for forward compatibility).
-- Dispatched step output follows the same artifact rules as other managed steps.
-  Use `log` inside the receiver to surface lines in the tree. The runtime
-  embeds stdout in `STEP_END` (`out_content`) with the same JSON escaping
-  rules as other steps.
-- Run artifacts and `run_summary.jsonl` provide a browsable history of past runs
-  (see [CLI — Run artifacts](cli.md#run-artifacts-and-live-output)).
-
-### Example output
-
-The shape matches the **`display_inbox.jh`** fixture inline in the same test file (search for **`display_inbox.jh`** in **`e2e/tests/91_inbox_dispatch.sh`**): `scanner` sends on **`findings`**, **`analyst`** sends on **`report`**, **`default`** routes both:
-
-```
-workflow default
-  ▸ workflow scanner
-  ·   ▸ script emit_findings
-  ·   ✓ script emit_findings (<time>)
-  ✓ workflow scanner (<time>)
-  ▸ workflow analyst (message="Found 3 issues in auth module", chan="findings", sender="scanner")
-  ·   ▸ script emit_summary (1="Found 3 issues in auth module")
-  ·   ✓ script emit_summary (<time>)
-  ✓ workflow analyst (<time>)
-  ▸ workflow reviewer (message="Summary: Found 3 issues in auth ...", chan="report", sender="analyst")
-  ·   ▸ script print_reviewed (1="Summary: Found 3 issues in auth ...")
-  ·   ✓ script print_reviewed (<time>)
-  ✓ workflow reviewer (<time>)
-
-✓ PASS workflow default (<time>)
-```
+## Related
 
-A smaller hand-written module with the same routing idea lives at **`examples/agent_inbox.jh`**.
+- [Architecture — Channels and hooks in context](architecture.md#channels-and-hooks-in-context) — where the in-memory queue and dispatch loop live in the runtime.
+- [Spec: Async Handles](spec-async-handles.md) — the implicit join that runs *before* a workflow's queue drains.
+- [Language](language.md) and [Grammar](grammar.md) — the `channel` / `send` syntax surface.
diff --git a/docs/index.html b/docs/index.html
index 2a2e5b2b..67b51670 100644
--- a/docs/index.html
+++ b/docs/index.html
@@ -33,7 +33,8 @@
                 <img class="jaiph-logo-dark" src="logo-ninja.png" alt="" />
             </a>
             <div class="top-nav-links">
-                <a href="/getting-started" rel="noopener noreferrer">Docs</a>
+                <a href="/tutorials/first-workflow" rel="noopener noreferrer">Tutorial</a>
+                <a href="/how-to/install" rel="noopener noreferrer">How-to</a>
                 <a href="https://github.com/jaiphlang/jaiph" target="_blank" rel="noopener noreferrer">GitHub</a>
                 <a href="https://marketplace.visualstudio.com/items?itemName=jaiph.jaiph-syntax-vscode" target="_blank"
                     class="no-mobile" rel="noopener noreferrer">VSCode</a>
@@ -49,7 +50,8 @@
     <header>
         <h1>J<span class="jaiph-accent">ai</span>ph</h1>
         <div class="hero-cta">
-            <a href="#samples" rel="noopener noreferrer" class="button button-primary">Samples</a>
+            <a href="/tutorials/first-workflow" rel="noopener noreferrer" class="button button-primary">Tutorial</a>
+            <a href="#samples" rel="noopener noreferrer" class="button button-dark">Samples</a>
             <a href="https://github.com/jaiphlang/jaiph" target="_blank" rel="noopener noreferrer"
                 class="button button-dark">GitHub</a>
             <a href="https://marketplace.visualstudio.com/items?itemName=jaiph.jaiph-syntax-vscode" target="_blank"
@@ -77,7 +79,7 @@ <h2>Try it out!</h2>
 
                 <div class="code-tab-panel is-active" data-panel="try-run-sample">
                     <pre><code class="language-bash static-highlight"><span class="code-line">curl -fsSL https://jaiph.org/run | bash -s '</span><span class="code-line"><span class="ralph-keyword">workflow</span> <span class="ralph-definition">default</span>() {</span><span class="code-line">  <span class="ralph-keyword">const</span> <span class="ralph-variable">response</span> <span class="ralph-operator">=</span> <span class="ralph-keyword">prompt</span> <span class="ralph-string">"Say: Hello, I am [model name]!"</span></span><span class="code-line">  <span class="ralph-keyword">log</span> response</span><span class="code-line">}'</span></code></pre>
-                    <p class="small">Installs Jaiph <strong>v0.9.4</strong> to <strong>~/.local/bin</strong> (if not
+                    <p class="small">Installs Jaiph <strong>v0.10.0</strong> to <strong>~/.local/bin</strong> (if not
                         already
                         installed), and runs the sample workflow with <a href="https://cursor.com/docs/cli/installation"
                             target="_blank" rel="noopener noreferrer">Cursor CLI</a> agent backend (the default one).
@@ -89,14 +91,14 @@ <h2>Try it out!</h2>
                 <div class="code-tab-panel" data-panel="try-init-project">
                     <p class="small">Run the script below from the project directory:</p>
                     <pre><code class="language-bash">curl -fsSL https://jaiph.org/init | bash</code></pre>
-                    <p class="small">Installs Jaiph <strong>v0.9.4</strong> to <strong>~/.local/bin</strong> (if not
+                    <p class="small">Installs Jaiph <strong>v0.10.0</strong> to <strong>~/.local/bin</strong> (if not
                         already installed), and runs <code>jaiph init</code> to initialize the Jaiph workspace in the
                         current directory.</p>
                 </div>
 
                 <div class="code-tab-panel" data-panel="try-install-only">
                     <pre><code class="language-bash">curl -fsSL https://jaiph.org/install | bash</code></pre>
-                    <p class="small">The installer will install the version <strong>0.9.4</strong> of Jaiph to
+                    <p class="small">The installer will install the version <strong>0.10.0</strong> of Jaiph to
                         <strong>~/.local/bin</strong>. To switch versions, use <code>jaiph use nightly</code>
                         or <code>jaiph use &lt;version&gt;</code> to switch.
                     </p>
@@ -344,7 +346,7 @@ <h2 id="samples">Samples</h2>
 - Artifacts: none
 - Next steps: replace with a real report when you add automated reporting</code></pre>
                     <p>For one-shot failure handling without retry, use <code>catch</code> instead. See
-                        <a href="/language#recover--repair-and-retry-loop">Language — recover</a>.
+                        <a href="/reference/language#catch-and-recover">Language — catch and recover</a>.
                     </p>
                 </div>
 
@@ -467,9 +469,9 @@ <h3>Language</h3>
                     <code>script</code>, <code>ensure</code>, and <code>prompt</code> in one executable flow so checks
                     and AI steps stay in the same pipeline. This way you can enforce structure over non-deterministic
                     agent responses.
-                    See <a href="grammar">Grammar</a> and <a href="getting-started">Getting started</a>
-                    (<a href="/getting-started" target="_blank"
-                        rel="noopener noreferrer">jaiph.org/getting-started</a>).
+                    See <a href="grammar">Grammar</a> and <a href="/tutorials/first-workflow">Your first workflow</a>
+                    (<a href="/tutorials/first-workflow" target="_blank"
+                        rel="noopener noreferrer">jaiph.org/tutorials/first-workflow</a>).
                 </p>
                 <p><strong>Embed and run scripts</strong> in the language of your choice. Define them with fence lang
                     tags providing the runtime: <code>```node</code>, <code>```python3</code>, <code>```ruby</code>,
@@ -503,7 +505,7 @@ <h3>Runtime</h3>
                 </p>
                 <p><strong>Hooks.</strong> Attach shell automation to workflow and step lifecycle events via
                     <code>~/.jaiph/hooks.json</code> or <code>&lt;project&gt;/.jaiph/hooks.json</code>. See <a
-                        href="hooks">Hooks</a>.
+                        href="/how-to/hooks">Add a hook</a>.
                 </p>
                 <p><strong>Custom agent backends.</strong> Point <code>agent.command</code> to any
                     executable — a shell script, a Python wrapper, or your own CLI tool — and Jaiph will
@@ -512,7 +514,7 @@ <h3>Runtime</h3>
                 <p><strong>Artifacts library.</strong> Publish files from inside the sandbox to a host-readable
                     location with the built-in <code>jaiphlang/artifacts</code> library (<code>artifacts.save</code>).
                     Works identically in Docker and on the host.
-                    See <a href="libraries#jaiphlangartifacts--publishing-files-out-of-the-sandbox">Libraries</a>.
+                    See <a href="/how-to/artifacts">Save artifacts</a>.
                 </p>
                 <p><strong>Configuration.</strong> Control behavior with <code>config { ... }</code> blocks
                     at the module level or inside individual workflows for per-workflow overrides, plus environment
@@ -521,7 +523,7 @@ <h3>Runtime</h3>
                 </p>
                 <p><strong>Testing Jaiph workflows.</strong> Test workflows with executable <code>*.test.jh</code>
                     suites, mocks, and assertions to cover deterministic and agent-assisted paths. See <a
-                        href="testing">Testing</a>.</p>
+                        href="/how-to/testing">Write &amp; run tests</a>.</p>
                 <p><strong>Formatting.</strong> <code>jaiph format</code> rewrites <code>.jh</code> files to a canonical
                     style &mdash; consistent whitespace and indentation. See <a href="cli#jaiph-format">CLI
                         reference</a>.</p>
@@ -530,7 +532,12 @@ <h3>Samples</h3>
                 <p>Jaiph source code is built mostly with real Jaiph workflows. The
                     <a
                         href="https://github.com/jaiphlang/jaiph/blob/main/.jaiph/docs_parity.jh">.jaiph/docs_parity.jh</a>
-                    workflow runs documentation maintenance checks, changelog updates, and cross-doc consistency guards.
+                    workflow runs documentation maintenance checks, changelog updates, and cross-doc consistency guards;
+                    its three prompts instruct the agent to read and follow a vendored
+                    <a href="https://diataxis.fr/">Diátaxis</a> documentation skill at
+                    <code>.jaiph/skills/documentation-writer/SKILL.md</code> (sourced from
+                    <a href="https://github.com/github/awesome-copilot">github/awesome-copilot</a>) before writing any
+                    docs, so runs stay offline-safe and reproducible.
                     The <a href="https://github.com/jaiphlang/jaiph/blob/main/.jaiph/engineer.jh">.jaiph/engineer.jh</a>
                     workflow implements a queue-driven engineering loop that picks work, implements changes, verifies
                     CI, and updates queue state.
@@ -570,7 +577,7 @@ <h3>Jaiph workflows</h3>
                         raw shell lines are rejected; use <code>script</code> and <code>run</code> for bash.
                         <code>workflow</code> mixes managed steps with optional <strong>inline shell</strong> lines when
                         they do not parse as Jaiph keywords (prefer <code>script</code> + <code>run</code> for
-                        non-trivial shell). See <a href="grammar#language-concepts">Grammar — Language concepts</a>.
+                        non-trivial shell). See <a href="grammar#workflow-body-statements">Grammar — Workflow body statements</a>.
                         <code>script</code> holds bash (or any
                         language via a fence lang tag like <code>```node</code>, <code>```python3</code>, or a custom
                         shebang) invoked with <code>run</code>. Rules and workflows <strong>require parentheses</strong>
@@ -632,7 +639,7 @@ <h3>Jaiph workflows</h3>
                         <code>const x = run helper(arg)</code>,
                         not
                         <code>const x = helper(arg)</code> (compile error with a correction hint). See
-                        <a href="grammar#immutable-bindings">Immutable bindings</a> and
+                        <a href="language#const-bind-a-value">Language — const</a> and
                         <a href="grammar#step-output-contract">Step output contract</a>.
                     </dd>
 
@@ -666,12 +673,14 @@ <h3>Jaiph workflows</h3>
                         is retried automatically. Stops on success or when the retry limit is exhausted
                         (default 10, configurable via <code>run.recover_limit</code>). <code>recover</code>
                         requires explicit bindings. Workflows only. See
-                        <a href="language#recover--repair-and-retry-loop">Language</a>.
+                        <a href="language#catch-and-recover">Language — catch and recover</a>.
                     </dd>
 
                     <dt><code>match var { "lit" =&gt; … ⏎ /re/ =&gt; … ⏎ _ =&gt; … }</code></dt>
                     <dd>Pattern match on a string value. The subject is a bare identifier (no
-                        <code>$</code> or <code>${}</code>). Arms are tested top-to-bottom; first match wins.
+                        <code>$</code> or <code>${}</code>), or <code>IDENT.IDENT</code> reading a field from a
+                        typed prompt capture (<code>match r.verdict { … }</code>). <code>if</code> accepts the
+                        same dot-subject form. Arms are tested top-to-bottom; first match wins.
                         Patterns: string literal (exact), regex, or <code>_</code> wildcard.
                         Arms are newline-delimited — commas between or after arms are rejected.
                         Usable as a statement, expression (<code>const x = match var { … }</code>),
@@ -743,8 +752,8 @@ <h3>Jaiph tests</h3>
     </div>
 
     <div class="footer">
-        <p class="footer-links"><a href="/getting-started">Getting started</a>
-            &middot; <a href="https://jaiph.org/getting-started" target="_blank" rel="noopener noreferrer">jaiph.org/getting-started</a>
+        <p class="footer-links"><a href="/tutorials/first-workflow">Tutorial</a>
+            &middot; <a href="/how-to/install">How-to</a>
             &middot; <a href="https://github.com/jaiphlang/jaiph" target="_blank" rel="noopener noreferrer">GitHub</a>
             &middot; <a href="https://marketplace.visualstudio.com/items?itemName=jaiph.jaiph-syntax-vscode"
                 target="_blank" rel="noopener noreferrer">VSCode</a>
diff --git a/docs/install b/docs/install
index 8c43b126..cd692382 100755
--- a/docs/install
+++ b/docs/install
@@ -18,109 +18,150 @@ else
   NC='\033[0m'
 fi
 
-print_step() {
-  echo -e "${DIM}▸ ${1}${NC}"
-}
-
-print_success() {
-  echo -e "${GREEN}✓ ${1}${NC}"
-}
-
-print_warning() {
-  echo -e "${YELLOW}! ${1}${NC}"
-}
-
-print_error() {
-  echo -e "${RED}✗ ${1}${NC}"
-}
+print_step()    { echo -e "${DIM}▸ ${1}${NC}"; }
+print_success() { echo -e "${GREEN}✓ ${1}${NC}"; }
+print_warning() { echo -e "${YELLOW}! ${1}${NC}"; }
+print_error()   { echo -e "${RED}✗ ${1}${NC}"; }
 
 require_cmd() {
-  local cmd="$1"
-  if ! command -v "$cmd" >/dev/null 2>&1; then
-    print_error "Missing required command: $cmd"
+  if ! command -v "$1" >/dev/null 2>&1; then
+    print_error "Missing required command: $1"
     exit 1
   fi
 }
 
-# When installing from a local path, use it (from env JAIPH_REPO_URL or from first arg) and copy instead of clone.
+# Local-source mode: JAIPH_REPO_URL env or first arg is a local directory
+# containing a package.json. Both env and arg are accepted so callers can
+# supply the repo path either way (docs/install-from-local.sh uses both).
 JAIPH_FROM_LOCAL=
 if [ -n "${JAIPH_REPO_URL+x}" ] && [ -d "${JAIPH_REPO_URL}" ] && [ -f "${JAIPH_REPO_URL}/package.json" ]; then
   JAIPH_FROM_LOCAL=1
   JAIPH_REPO_URL="$(cd "${JAIPH_REPO_URL}" && pwd)"
-  REPO_URL="${JAIPH_REPO_URL}"
 elif [ -n "${1+x}" ] && [ -d "${1}" ] && [ -f "${1}/package.json" ]; then
-  # First argument is a local repo path (e.g. from install-from-local.sh)
   JAIPH_FROM_LOCAL=1
-  REPO_URL="$(cd "${1}" && pwd)"
-  JAIPH_REPO_URL="${REPO_URL}"
-fi
-REPO_URL="${REPO_URL:-${JAIPH_REPO_URL:-https://github.com/jaiphlang/jaiph.git}}"
-# Version/ref: first argument only when not a local path, or JAIPH_REPO_REF env, or default tag v0.9.4.
-if [ -n "${JAIPH_FROM_LOCAL}" ]; then
-  REPO_REF="${JAIPH_REPO_REF:-v0.9.4}"
-else
-  REPO_REF="${1:-${JAIPH_REPO_REF:-v0.9.4}}"
+  JAIPH_REPO_URL="$(cd "${1}" && pwd)"
 fi
+
 BIN_DIR="${JAIPH_BIN_DIR:-$HOME/.local/bin}"
-LIB_DIR="${JAIPH_LIB_DIR:-${BIN_DIR}/.jaiph}"
 TARGET="${BIN_DIR}/jaiph"
-SKILL_TARGET="${LIB_DIR}/jaiph-skill.md"
 
 echo ""
 echo -e "${BOLD}Jaiph installer${NC}"
 echo ""
 
-if [ -z "${JAIPH_FROM_LOCAL}" ]; then
-  require_cmd git
-fi
-require_cmd node
-require_cmd npm
+if [ -n "${JAIPH_FROM_LOCAL}" ]; then
+  # Build the standalone binary from the local checkout. Parity with the
+  # release-asset path: a single self-contained executable, no shim, no
+  # LIB_DIR runtime tree.
+  require_cmd npm
+  require_cmd bun
 
-print_step "Creating bin directory at ${BIN_DIR}..."
-mkdir -p "${BIN_DIR}"
+  print_step "Using local source at ${JAIPH_REPO_URL}"
 
-tmp_dir="$(mktemp -d)"
-cleanup() {
-  rm -rf "${tmp_dir}"
-}
-trap cleanup EXIT
+  tmp_dir="$(mktemp -d)"
+  trap 'rm -rf "${tmp_dir}"' EXIT
 
-if [ -n "${JAIPH_FROM_LOCAL}" ]; then
-  print_step "Using local source at ${REPO_URL}"
   print_step "Copying (includes uncommitted changes)..."
-  cp -R "${REPO_URL}" "${tmp_dir}/src"
-  rm -rf "${tmp_dir}/src/.git"
-  rm -rf "${tmp_dir}/src/node_modules"
-else
-  print_step "Cloning ${REPO_URL} (${REPO_REF})..."
-  git clone --depth 1 --branch "${REPO_REF}" "${REPO_URL}" "${tmp_dir}/src" >/dev/null 2>&1
-fi
+  cp -R "${JAIPH_REPO_URL}" "${tmp_dir}/src"
+  rm -rf "${tmp_dir}/src/.git" "${tmp_dir}/src/node_modules"
 
-JAIPH_VERSION="$(node -p "require(process.argv[1]).version" "${tmp_dir}/src/package.json")"
+  print_step "Installing dependencies..."
+  (cd "${tmp_dir}/src" && npm install >/dev/null 2>&1)
 
-print_step "Installing dependencies..."
-npm --prefix "${tmp_dir}/src" install >/dev/null 2>&1
+  print_step "Building standalone binary..."
+  (cd "${tmp_dir}/src" && npm run build:standalone >/dev/null 2>&1)
 
-print_step "Building CLI..."
-npm --prefix "${tmp_dir}/src" run build >/dev/null 2>&1
+  if [ ! -f "${tmp_dir}/src/dist/jaiph" ]; then
+    print_error "Build did not produce dist/jaiph"
+    exit 1
+  fi
 
-print_step "Installing runtime to ${LIB_DIR}..."
-rm -rf "${LIB_DIR}"
-mkdir -p "${LIB_DIR}"
-cp -R "${tmp_dir}/src/dist/src" "${LIB_DIR}/src"
-cp "${tmp_dir}/src/package.json" "${LIB_DIR}/package.json"
-cp "${tmp_dir}/src/docs/jaiph-skill.md" "${SKILL_TARGET}"
+  print_step "Installing binary to ${TARGET}..."
+  mkdir -p "${BIN_DIR}"
+  cp "${tmp_dir}/src/dist/jaiph" "${TARGET}"
+  chmod 755 "${TARGET}"
 
-print_step "Installing binary to ${TARGET}..."
-cat > "${TARGET}" <<EOF
-#!/usr/bin/env bash
-set -euo pipefail
-exec node "${LIB_DIR}/src/cli.js" "\$@"
-EOF
-chmod 755 "${TARGET}"
+  JAIPH_VERSION="$("${TARGET}" --version 2>/dev/null || echo "jaiph (local)")"
+  echo ""
+  print_success "Installed ${JAIPH_VERSION} to ${TARGET}"
+else
+  # Download a pre-built per-platform binary from the GitHub Release for the
+  # resolved ref. Asset names are fixed by docs/contributing.md → "Release
+  # asset naming contract".
+  require_cmd curl
+
+  if command -v sha256sum >/dev/null 2>&1; then
+    sha256_check() { sha256sum "$1" | awk '{print $1}'; }
+  elif command -v shasum >/dev/null 2>&1; then
+    sha256_check() { shasum -a 256 "$1" | awk '{print $1}'; }
+  else
+    print_error "Missing required command: sha256sum or shasum"
+    exit 1
+  fi
 
-echo ""
-print_success "Installed jaiph ${JAIPH_VERSION} to ${TARGET}"
+  uname_s="$(uname -s)"
+  uname_m="$(uname -m)"
+  case "${uname_s}" in
+    Darwin) os="darwin" ;;
+    Linux)  os="linux" ;;
+    *)
+      print_error "Unsupported platform: ${uname_s} ${uname_m}"
+      echo "Build from source per https://jaiph.org/contributing#installing-from-source"
+      exit 1
+      ;;
+  esac
+  case "${uname_m}" in
+    arm64|aarch64) arch="arm64" ;;
+    x86_64|x64)    arch="x64" ;;
+    *)
+      print_error "Unsupported platform: ${uname_s} ${uname_m}"
+      echo "Build from source per https://jaiph.org/contributing#installing-from-source"
+      exit 1
+      ;;
+  esac
+
+  REPO_REF="${1:-${JAIPH_REPO_REF:-v0.10.0}}"
+  BIN_NAME="jaiph-${os}-${arch}"
+  BASE_URL="${JAIPH_RELEASE_BASE_URL:-https://github.com/jaiphlang/jaiph/releases/download/${REPO_REF}}"
+
+  tmp_dir="$(mktemp -d)"
+  trap 'rm -rf "${tmp_dir}"' EXIT
+
+  print_step "Downloading ${BIN_NAME} (${REPO_REF})..."
+  if ! curl -fsSL -o "${tmp_dir}/${BIN_NAME}" "${BASE_URL}/${BIN_NAME}"; then
+    print_error "Failed to download ${BASE_URL}/${BIN_NAME}"
+    exit 1
+  fi
+
+  print_step "Downloading SHA256SUMS..."
+  if ! curl -fsSL -o "${tmp_dir}/SHA256SUMS" "${BASE_URL}/SHA256SUMS"; then
+    print_error "Failed to download ${BASE_URL}/SHA256SUMS"
+    exit 1
+  fi
+
+  print_step "Verifying checksum..."
+  expected_sum="$(awk -v name="${BIN_NAME}" '$2 == name || $2 == "*"name { print $1 }' "${tmp_dir}/SHA256SUMS")"
+  if [ -z "${expected_sum}" ]; then
+    print_error "No checksum entry for ${BIN_NAME} in SHA256SUMS"
+    exit 1
+  fi
+  actual_sum="$(sha256_check "${tmp_dir}/${BIN_NAME}")"
+  if [ "${expected_sum}" != "${actual_sum}" ]; then
+    print_error "Checksum mismatch for ${BIN_NAME}"
+    echo "  expected: ${expected_sum}"
+    echo "  got:      ${actual_sum}"
+    exit 1
+  fi
+
+  print_step "Installing binary to ${TARGET}..."
+  mkdir -p "${BIN_DIR}"
+  cp "${tmp_dir}/${BIN_NAME}" "${TARGET}"
+  chmod 755 "${TARGET}"
+
+  JAIPH_VERSION="$("${TARGET}" --version 2>/dev/null || echo "jaiph (${REPO_REF})")"
+  echo ""
+  print_success "Installed ${JAIPH_VERSION} to ${TARGET}"
+fi
 
 if [[ ":${PATH}:" == *":${BIN_DIR}:"* ]]; then
   print_success "${BIN_DIR} is already on PATH"
diff --git a/docs/install-from-local.sh b/docs/install-from-local.sh
index 6b88cc27..be85b64f 100755
--- a/docs/install-from-local.sh
+++ b/docs/install-from-local.sh
@@ -1,6 +1,9 @@
 #!/usr/bin/env bash
-# Install Jaiph from a local clone (no network clone). Uses the same logic as
-# docs/install with JAIPH_REPO_URL set to the local repo root.
+# Install Jaiph from a local clone (no network download). Builds the
+# standalone binary from the repo with `npm install` + `npm run build:standalone`
+# (requires bun) and installs it to ${JAIPH_BIN_DIR:-$HOME/.local/bin}/jaiph.
+# Same single-binary artifact as the release-asset path in docs/install; only
+# the origin of the binary differs (compiled locally vs. downloaded).
 #
 # Usage:
 #   ./docs/install-from-local.sh           # install from repo containing this script
diff --git a/docs/jaiph-skill.md b/docs/jaiph-skill.md
index 81ee9346..2019adb3 100644
--- a/docs/jaiph-skill.md
+++ b/docs/jaiph-skill.md
@@ -1,331 +1,446 @@
 ---
 title: Agent Skill
 permalink: /jaiph-skill
+diataxis: contributor
 redirect_from:
   - /jaiph-skill.md
 ---
 
-# Jaiph Bootstrap Skill (for Agents)
+# Jaiph Skill (for Agents)
 
-**Why this page exists.** Agentic work needs the same things human teams need: a clear sequence of steps, explicit checks, and a record of what ran. Jaiph is a small workflow language for that: **workflows** sequence orchestration, **rules** express checks, **`script`** holds real shell, and the runtime logs steps and writes run artifacts. The payoff is behavior that is easier to repeat, verify, and debug than ad-hoc shell snippets alone.
+You are an agent. A user has asked you to automate a repetitive task — a delivery pipeline, a review loop, a recurring check, a queue of work items. This document teaches you to author **Jaiph workflows** that do that. Read it fully before writing any `.jh` file; Jaiph looks like shell plus YAML but is neither, and most authoring mistakes come from guessing syntax instead of following the rules below.
 
-## Overview
+## What Jaiph is
 
-This page is an **agent skill**: it tells an AI assistant how to **author** Jaiph workflows (`.jh` files) and what a sensible `.jaiph/` layout looks like. It is not a full language specification — use [Getting started](getting-started.md) as the documentation map, [Grammar](grammar.md) for syntax and validation details, [Configuration](configuration.md) for `config` keys, [Inbox & Dispatch](inbox.md) for channels, and [Sandboxing](sandboxing.md) for rule design vs optional Docker isolation.
+Jaiph is a small workflow language. A `.jh` file declares:
 
-**Jaiph** is a small language for agentic workflows: **orchestration** (rules, prompts, managed calls) and **shell in `script` definitions**. The **Node workflow runtime** (`NodeWorkflowRuntime`) interprets the parsed AST in process — there is no separate transpiled workflow shell on the execution path ([Architecture](architecture.md)). Before `jaiph run` or `jaiph test`, **`buildScripts()`** takes a single **entry** `.jh` path (the workflow file, or the `*.test.jh` file for tests), runs **compile-time validation** (`validateReferences` inside **`emitScriptsForModule`**), and writes extracted **`script`** files under `scripts/` for that module and every file reachable from it via transitive **`import`** — not the whole workspace unless those files are imported. **`jaiph compile`** runs the same **`validateReferences`** checks by parsing each module in the computed closure **without** **`buildScripts`**, script emission, or the runner ([Architecture](architecture.md)). The runner’s **`buildRuntimeGraph()`** then loads the graph with **parse-only** imports (it does not re-run `validateReferences`).
+| Construct | What it is | How it runs |
+|---|---|---|
+| `workflow` | A named sequence of steps — the orchestration layer | Interpreted in-process by the runtime |
+| `rule` | A non-mutating check (preconditions, verifications) | Interpreted in-process; called with `ensure` |
+| `script` | Real shell (or Python, Node, …) — the only place for shell code | Spawned as a subprocess; called with `run` |
+| `prompt` | A task delegated to an AI agent (Cursor / Claude / Codex backend) | Backend CLI or API call; you capture the answer |
+| `channel` | A message queue with declared workflow listeners | Drained after the sending workflow finishes |
 
-**Contracts (CLI vs runtime):** **Live:** `__JAIPH_EVENT__` JSON lines on **stderr only** (CLI progress and **hooks** — hooks are **CLI-only**, driven by that stream). **Durable:** `.jaiph/runs/...` and **`run_summary.jsonl`**. Channels are enforced at compile time and executed in the runtime (in-memory queue + inbox files under the run dir); they are not hooks.
+Everything is **strings**. Every step is logged. Every run leaves durable artifacts under `.jaiph/runs/` (per-step `.out`/`.err` files and an append-only `run_summary.jsonl`). That is the payoff over ad-hoc shell: repeatable, inspectable, testable automation.
 
-The **JS kernel** (`src/runtime/kernel/`) handles **prompt** execution, **managed script subprocesses**, **inbox** queues and dispatch, and **event/summary emission**. **Rule** bodies run in-process; user **`script`** bodies run as separate OS processes (bash by default, polyglot via fence lang tags like `` ```node ``, `` ```python3 `` or a leading `#!` shebang in the body).
+**Source of truth:** when this document and the compiler disagree, the compiler wins. Full references: [Grammar](grammar.md), [CLI](cli.md), [Configuration](configuration.md), [Write & run tests](testing.md), [Inbox & dispatch](inbox.md), [Sandboxing](sandboxing.md).
 
-**Test lane:** `jaiph test` runs **`*.test.jh`** in-process (`node-test-runner.ts`): for each file it calls **`buildScripts(testFile, …)`** (same helper as `jaiph run`, with the **test file as the entry** so its import closure is validated and scripts are emitted), then **`buildRuntimeGraph(testFile)` once per file**, mocks, and assertions — same `NodeWorkflowRuntime` as `jaiph run`. The runtime enables **`suppressLiveEvents`** for those workflow runs so **`__JAIPH_EVENT__`** lines are not written to **stderr** (keeping `node --test` output readable); **`run_summary.jsonl`** under the run directory is still updated where the emitter records workflow traffic ([Architecture](architecture.md)).
+## Smallest working example
 
-**After `jaiph init`**, a repository gets `.jaiph/bootstrap.jh` (a triple-quoted prompt that tells the agent to read `.jaiph/SKILL.md`) and a copy of this file. The bootstrap prompt asks the agent to scaffold workflows under `.jaiph/` and to end with a clear `WHAT CHANGED` + `WHY` summary. The expected outcome is a **minimal workflow set** for safe feature work: preflight checks, an implementation workflow, verification, and a `workflow default` entrypoint that wires them together (with an optional human-or-agent “review” step when you use a task queue). Docker-backed runs use the official `ghcr.io/jaiphlang/jaiph-runtime` image by default; see [Sandboxing](sandboxing.md) to override with `runtime.docker_image` or `JAIPH_DOCKER_IMAGE`.
-
-**Concepts:**
-
-- **Rules** — Structured checks: `ensure` (other **rules** only), `run` (**scripts** only — not workflows), `const`, `match`, `if`, `for … in …` (line iteration over a string binding), `fail`, `log`/`logerr`, `return "…"` / `return run script()` / `return ensure rule()`, `ensure … catch`, `run … catch`, `run … recover`. No raw shell lines, `prompt`, inbox send/route, or `run async`. Under `jaiph run`, rule bodies are executed **in-process** by the Node runtime; when a rule runs a **script**, that script is a normal managed subprocess (same as scripts from workflows) — see [Sandboxing](sandboxing.md).
-- **Workflows** — Named sequences of **managed** Jaiph steps (`ensure`, `run`, `prompt`, `const`, `fail`, `return`, `log`/`logerr`, inbox **send**, `match`, `if`, `for … in …`, `run async`, `ensure`/`run` with `catch` or `recover`, …) plus optional **inline shell** lines: a line that does not parse as a managed step is treated as bash stored in a `shell` AST node (validated like other shell text). Prefer top-level **`script`** definitions and `run` for multi-line or reusable shell. Route declarations (`->`) belong on top-level `channel` lines, never inside a workflow body (a `->` in a body is `E_PARSE`).
-- **Scripts** — Top-level **`script`** definitions are **bash (or shebang interpreter) source**, not Jaiph orchestration. Defined with `` script name = `body` `` (single-line backtick) or `` script name = ```[lang] ... ``` `` (fenced block). Double-quoted string bodies (`script name = "body"`) and bare identifier bodies (`script name = varName`) are **removed** — both produce parse errors with guidance to use backtick delimiters. The compiler treats all script bodies as **opaque text**: it does not parse lines as Jaiph steps, reject keywords, strip quotes, or validate cross-script calls. This means embedded `node -e` heredocs, inline Python, `const` assignments in JS, and any other valid shell construct compile without interference. Jaiph interpolation (`${...}`) is **forbidden** in **single-line backtick** script bodies — use `$1`, `$2` positional arguments to pass data from orchestration to scripts. In **fenced** (triple-backtick) blocks, `${...}` is passed through to the shell as standard parameter expansion (`${VAR}`, `${VAR:-default}`, etc.). A single-backtick body containing a newline is a hard parse error — use a fenced block for multi-line scripts. Use `return N` / `return $?` for exit status and **stdout** (`echo` / `printf`) for string data to callers. From a **workflow** or **rule**, call with **`run fn()`**. Can be exported (`export script name = ...`) for use by importing modules. Cannot be used with `ensure`, are not valid inbox route targets, and must not be invoked through `$(...)` or as a bare shell step. **Polyglot scripts:** use a fence lang tag (`` ```<tag> ``) to select an interpreter — the tag maps directly to `#!/usr/bin/env <tag>`. Any tag is valid (no hardcoded allowlist). For example: `` ```node ``, `` ```python3 ``, `` ```ruby ``, `` ```lua ``. Alternatively, if no fence tag is present, the first non-empty body line may start with `#!` (e.g. `#!/usr/bin/env lua`), which becomes the script's shebang and the body is emitted verbatim (you cannot combine a fence tag with a manual shebang — that is an error). Without either, `#!/usr/bin/env bash` is used and the emitter applies only lightweight bash-specific transforms (`return` normalization, `local`/`export`/`readonly` spacing, import alias resolution). Scripts are extracted to a `scripts/` directory under the run output tree (`jaiph run --target <dir>` sets that tree; without `--target` the CLI uses a temporary directory) and executed via **`JAIPH_SCRIPTS`**. **Inline scripts:** For trivial one-off commands, use `` run `body`(args) `` or `` run ```lang...body...```(args) `` directly in a workflow or rule step instead of declaring a named `script` definition. The body (single backtick for one-liners or triple backtick for multi-line) comes before the parentheses; optional comma-separated arguments go inside the parentheses: `` run `echo $1`("hello") ``. Fenced blocks support lang tags for polyglot inline scripts: `` run ```python3 ... ```() ``. Capture forms: `` const x = run `echo val`() `` and `` const x = run ```...```() ``. The old `run script() "body"` form is **removed** — use the backtick forms instead. Inline scripts use deterministic hash-based artifact names (`__inline_<hash>`) and run with the same isolation as named scripts. `run async` with inline scripts is not supported.
-- **Channels** — Top-level `channel <name> [-> workflow, ...]` declarations with optional inline routing; **send** uses `channel_ref <- …`. Routes are declared on the channel declaration, not inside workflow bodies (see [Inbox & Dispatch](inbox.md)). Channel names share the per-module namespace with rules, workflows, scripts, and module-scoped `local` / `const` variables.
+```jaiph
+script list_todos = `grep -rn "TODO" src/ || true`
+script worktree_clean = `test -z "$(git status --porcelain)"`
 
-Step semantics (`ensure`, `run`, `prompt`, `catch`, `recover`, `match`, `if`, `for`, `log`, `fail`, `return`, `send`, `run async`) are detailed in the **Steps** section below.
+rule git_clean() {
+  run worktree_clean() catch (err) {
+    fail "working tree is not clean"
+  }
+}
 
-**Audience:** Agents that produce or edit `.jh` files.
+workflow default(task) {
+  ensure git_clean()
+  const todos = run list_todos()
+  prompt """
+  Address the following request: ${task}
+  Known TODOs in the codebase:
+  ${todos}
+  """
+  log "done"
+}
+```
 
----
+Run it: `jaiph run ./flow.jh "clean up the auth module"`. The CLI executes `workflow default` and binds `"clean up the auth module"` to the `task` parameter. **Every runnable file must define `workflow default`.**
 
-## Safe delivery loop (any repository)
+## Your authoring loop
 
-Use this loop whenever you add or change Jaiph workflows so failures surface before work is handed back. When the repo defines a **`workflow default` entrypoint** (often `.jaiph/main.jh`) that wires preflight → implementation → verification, use **`jaiph run`** on that file for end-to-end delivery after the narrower checks below pass.
+Follow this sequence every time you create or edit `.jh` files. Do not skip the compile step — it catches almost every mistake described in this document, with file:line:col positions.
 
-1. **Preflight** — Run the project’s readiness checks if they exist (often `jaiph run .jaiph/readiness.jh` or a named preflight workflow). When the repo ships native tests (`*.test.jh`), run `jaiph test` before large edits when practical.
-2. **Implement** — Edit `.jh` modules using only constructs described in [Grammar](grammar.md); keep managed-call rules (`ensure` for rules, `run` for workflows and scripts); put multi-line or reusable bash in **`script`** definitions (rules **never** allow raw shell lines — use `run` to a script; workflows may use optional inline shell where the grammar allows, but prefer `script` + `run` for anything non-trivial — see [Grammar — Language concepts](grammar.md#language-concepts)).
-3. **Format** — Run `jaiph format <file.jh ...>` on all authored or modified `.jh` files before committing. This normalizes whitespace, indentation, and top-level ordering (imports, config, and channels hoisted to the top; everything else kept in source order). Use `jaiph format --check <file.jh ...>` to verify formatting without writing (non-zero exit on drift — useful in CI).
-4. **Compile check** — Run `jaiph compile <file-or-dir>` on the paths you touched (or `jaiph compile --json …` in automation). Same `validateReferences` checks as before a run, without executing workflows or writing `scripts/` ([Architecture](architecture.md)). With a **directory** argument, only non-test `*.jh` files are used as entrypoints (`*.test.jh` is skipped); pass a test file path explicitly to validate it.
-5. **Verify** — Run `jaiph test` (whole workspace or a focused path) and any verification workflow the repo defines (commonly `jaiph run .jaiph/verification.jh`). Fix failures you introduce.
-6. **Inspect (optional)** — Browse `.jaiph/runs` directly when you need raw step logs or `run_summary.jsonl` instead of only the terminal tree.
+1. **Write** the `.jh` files (syntax below).
+2. **Format:** `jaiph format <files…>` — canonical whitespace and top-level ordering.
+3. **Compile:** `jaiph compile [--json] [--workspace <dir>] <file-or-dir>` — parses and validates the whole import closure without running anything. Reports **all** errors at once as `path:line:col CODE message`. Use `--json` for machine-readable output. Directory arguments skip `*.test.jh`; pass test files explicitly. `--workspace` sets the library root for `jaiph install` paths when auto-detect is wrong.
+4. **Test:** `jaiph test` — runs every `*.test.jh` it finds; zero matches in discovery mode exit 0 with a notice, so this call is always safe to make.
+5. **Run:** `jaiph run <file.jh> [args…]` for the end-to-end check.
 
-**CLI commands:**
+CLI quick reference:
 
 | Command | Purpose |
 |---|---|
-| `jaiph run [--target <dir>] [--raw] <file.jh> [--] [args...]` | Execute `workflow default` in the given file (`--raw`: no banner/tree/hooks; used for embedding and Docker inner runs) |
-| `jaiph test [path]` | Run `*.test.jh` test files (workspace, directory, or single file) |
-| `jaiph format [--check] [--indent <n>] <file.jh ...>` | Reformat `.jh` files (or verify formatting without writing) |
-| `jaiph compile [--json] [--workspace <dir>] <.jh files or dirs…>` | Parse and `validateReferences` only (no script emission, no run) |
-| `jaiph init [workspace]` | Scaffold `.jaiph/` with bootstrap workflow and skill file |
-| `jaiph install [--force] [<url[@version]> …]` | Clone libraries into `.jaiph/libs/` or restore from `.jaiph/libs.lock` |
-| `jaiph use <version\|nightly>` | Reinstall Jaiph at a specific version or nightly |
+| `jaiph run [--target <dir>] [--raw] <file.jh> [--] [args…]` | Execute `workflow default`; args bind to its named parameters |
+| `jaiph test [path]` | Run `*.test.jh` files (workspace, dir, or single file) |
+| `jaiph compile [--json] [--workspace <dir>] <paths…>` | Validate only — no execution, no side effects |
+| `jaiph format [--check] <file.jh …>` | Reformat (or verify formatting in CI) |
+| `jaiph init [workspace]` | Scaffold `.jaiph/` (bootstrap workflow + this skill file) |
+| `jaiph install [<name[@version]> \| <url[@version]>…]` | Install libraries into `.jaiph/libs/` (bare names resolve via `JAIPH_REGISTRY`, else `https://jaiph.org/registry`; URL form is unchanged) |
 
-**File shorthand:** `jaiph ./file.jh` auto-routes — `*.test.jh` files run as tests, other `*.jh` files run as workflows.
+Shorthand: `jaiph ./file.jh` routes by extension (`*.test.jh` → test, other `.jh` → run). A `#!/usr/bin/env jaiph` shebang makes a `.jh` file directly executable.
 
-Full flags and environment variables: [CLI Reference](cli.md).
+**Sandboxing:** by default, interactive `jaiph run` executes the workflow inside a Docker container (`ghcr.io/jaiphlang/jaiph-runtime`). Set `JAIPH_UNSAFE=true` or pass `--unsafe` to run directly on the host, or set `JAIPH_DOCKER_ENABLED=true/false` to force either mode. `jaiph test` always runs on the host (no Docker).
 
----
+## Core rules you must internalize
 
-## When to Use This Guide
+These six rules prevent 90% of compile errors:
 
-Use this guide when generating or updating `.jaiph/*.jh` workflows for a repository after `jaiph init`.
+1. **Parentheses everywhere.** Definitions and call sites both require `()`, even with zero arguments: `workflow default() { … }`, `run setup()`, `ensure check()`. Bare `run setup` is a parse error.
+2. **All captures use `const`, and all bindings are immutable.** `const x = run foo()` — never `x = run foo()`, never rebind `x` later, never shadow a parameter with a `const` of the same name.
+3. **Call keyword must match callee type.** `ensure` → rules only. `run` → workflows and scripts (inside a workflow); scripts **only** (inside a rule). Mixing them is `E_VALIDATE`.
+4. **Shell lives in scripts.** Rules reject raw shell lines entirely. Workflows technically allow inline shell lines, but you should not write them — use a named `script` or an inline script (`` run `cmd`() ``). Shell operators next to managed calls (`run foo() | grep x`, `run foo() > file`, `run foo() &`) are parse errors.
+5. **Interpolation is `${name}` only.** No `$name` in orchestration strings, no `$(…)`, no `${var:-default}`, no `${var//x/y}`. Those shell forms are valid *inside script bodies* only.
+6. **Arguments are not forwarded implicitly.** If `workflow default(task)` calls `run implement()`, the implement workflow does not see `task`. Pass it: `run implement(task)`.
 
-## Source of Truth
+## Syntax reference
 
-When this skill conflicts with the compiler or runtime, follow the implementation. For language rules and validation codes, [Grammar](grammar.md) is the detailed reference. Published docs: [jaiph.org](https://jaiph.org).
+### File layout
 
-`jaiph init` writes this skill to `.jaiph/SKILL.md` when the installer resolves a skill file: if **`JAIPH_SKILL_PATH`** is set, it is used **only when that path exists on disk**; otherwise the CLI searches install-relative locations and `docs/jaiph-skill.md` from the current working directory ([CLI Reference](cli.md)). If no file is found, init skips `SKILL.md` — set **`JAIPH_SKILL_PATH`** to an existing markdown file (for example `docs/jaiph-skill.md` in a checkout) and run `jaiph init` again.
+Top-level forms, in conventional order (`jaiph format` hoists `import`, `config`, and `channel` to the top):
 
-Ignore any outdated Markdown that contradicts the above.
+```jaiph
+import "helpers.jh" as helpers          # module import (relative; .jh appended if omitted)
+import script "./tool.py" as tool       # external script file, callable with run tool(args)
+config { agent.backend = "claude" }     # optional, at most one per file
+channel findings -> analyst             # channels + optional routes, top level only
+const VERSION = "1.0"                   # module-scoped immutable string
+script build = `npm run build`          # shell definitions
+rule tests_pass() { run run_tests() }   # checks
+workflow default() { … }                # orchestration; default = the entrypoint
+```
 
-## What to Produce
+Channels, rules, workflows, scripts, script-import aliases, and module `const` share **one namespace per module** — duplicate top-level names are `E_PARSE`; duplicate import aliases are `E_VALIDATE`. Comments are full-line `#` only.
 
-A **minimal workflow set** under `.jaiph/` that matches the delivery loop above:
+**Imports:** paths resolve relative to the importing file; if not found and the path contains `/`, it falls back to `<workspace>/.jaiph/libs/<lib>/<path>.jh` (installed via `jaiph install`). Reference imported symbols as `alias.name`. If a module uses `export` on any declaration, only exported names are visible to importers; with zero `export`s, everything is public.
 
-1. **Sandbox baseline (optional)** — If the repo uses Docker sandboxing, confirm `runtime.docker_image` / `JAIPH_DOCKER_IMAGE` match the tooling the team needs; the default is `ghcr.io/jaiphlang/jaiph-runtime` (see [Sandboxing](sandboxing.md)).
-2. **Preflight** — Rules and `ensure` for repo state and required tools (e.g. clean git, required binaries). Expose a small workflow (e.g. `workflow default` in `readiness.jh`) that runs these checks.
-3. **Review (optional)** — A workflow that reviews queued tasks before development starts (any filename, e.g. `ba_review.jh`). An agent prompt evaluates the next task for clarity, consistency, conflicts, and feasibility, then either marks it as ready or exits with questions. The implementation workflow gates on this marker so unreviewed tasks cannot proceed. This repository’s `.jaiph/architect_review.jh` is one concrete example; it uses `QUEUE.md` as the task queue.
-4. **Implementation** — A workflow that drives coding changes (typically via `prompt`), e.g. `workflow implement` in `main.jh`. When using a task queue, the implementation workflow should check that the first task is marked as ready (e.g. via a `<!-- dev-ready -->` marker) before proceeding.
-5. **Verification** — Rules and a `workflow default` for lint/test/build (e.g. `verification.jh`). Complement this with repo-native `*.test.jh` suites run by `jaiph test` where appropriate.
-6. **Entrypoint** — A single `workflow default` (e.g. in `.jaiph/main.jh`) that runs: preflight → (optional) review → implementation → verification. This is what `jaiph run .jaiph/main.jh "..."` executes.
+### Strings and interpolation
 
-Prefer composable modules over one large file.
+- `"single line"` — double quotes only; single quotes are parse errors. Escapes: `\"`, `\\`, `\n`, `\t`.
+- `"""…"""` — multiline. Opening `"""` ends its line; closing `"""` is on its own line.
+- A double-quoted string spanning multiple lines is rejected — use `"""`.
 
-## Language Rules You Must Respect
+Inside any orchestration string:
+
+| Form | Meaning |
+|---|---|
+| `${name}` | Value of a `const`, capture, or parameter in scope (unknown names are compile errors) |
+| `${name.field}` | Field of a typed-prompt capture (compile-checked against the schema) |
+| `${run ref(args)}` / `${ensure ref(args)}` | Inline managed call; its output is spliced in. No nesting. |
+| `${JAIPH_WORKSPACE}` etc. | Falls back to process environment when no workflow variable matches |
+
+### Scripts — the shell layer
+
+````jaiph
+# single-line: backticks. NO Jaiph ${name} here — pass data as $1, $2 arguments.
+script count_lines = `wc -l < "$1"`
+
+# multi-line: fenced block. Bash ${…} passes through to the shell untouched.
+script deploy = ```
+set -euo pipefail
+echo "deploying ${TARGET_ENV:-staging}"
+./deploy.sh "$1"
+```
+
+# polyglot: fence tag → #!/usr/bin/env <tag>. Any tag works.
+script parse_json = ```python3
+import json, sys
+print(json.load(open(sys.argv[1]))["version"])
+```
+````
 
-- **Imports:** `import "path.jh" as alias`. Path must be double-quoted. Path is relative to the importing file first; if no file is found and the path contains `/`, the resolver falls back to project-scoped libraries under `<workspace>/.jaiph/libs/` (e.g. `import "queue-lib/queue" as queue` resolves to `.jaiph/libs/queue-lib/queue.jh`). If the path has no extension, the compiler appends `.jh`. Install libraries with `jaiph install <url[@version]>`. **Script imports:** `import script "./helper.py" as helper` imports an external script file and binds it as a local script symbol — callable with `run helper(args)` exactly like an inline `script` definition. The path resolves relative to the importing file. Shebangs in the imported file are preserved. Missing targets fail with `E_IMPORT_NOT_FOUND`.
-- **Definitions:** `channel name` (inbox endpoint); `rule name() { ... }` or `rule name(params) { ... }`, `workflow name() { ... }` or `workflow name(params) { ... }`, `` script name = `body` `` or `` script name = ```[lang] ... ``` ``. **Parentheses are required on all rule and workflow definitions** — even when parameterless (e.g. `workflow default() { ... }`, `rule check() { ... }`). Omitting `()` before `{` is a parse error with a fix hint. Named parameters go inside the parentheses — e.g. `workflow implement(task, role) { ... }`, `rule gate(path) { ... }`. At runtime, named params are the only way to access arguments. The compiler validates call-site arity when the callee declares params. Named scripts require a name at the definition site; for anonymous one-off commands use inline scripts: `` run `echo ok`() `` or `` run ```...```(args) ``. Optional `export` before `rule`, `workflow`, or `script` marks it as public (see [Grammar](grammar.md)). Optional `config { ... }` at the top of a file sets agent, run, and runtime options. An optional `config { ... }` block can also appear inside a `workflow { ... }` body (before any steps) to override module-level settings for that workflow only — only `agent.*` and `run.*` keys are allowed; `runtime.*` and `module.*` yield `E_PARSE` (see [Configuration](configuration.md#workflow-level-config)). Config values can be quoted strings, booleans (`true`/`false`), bare integers, or bracket-delimited arrays of strings (see [Grammar](grammar.md) and [Configuration](configuration.md)).
-- **Module-scoped variables:** `local name = value` or `const name = value` (same value forms). Prefer **`const`** for new files. Values can be single-line `"..."` strings, triple-quoted `"""..."""` multiline strings, or bare tokens. A double-quoted string that spans multiple lines is rejected — use `"""..."""` instead. Accessible as `${name}` inside orchestration strings in the same module. Names share the unified namespace with channels, rules, workflows, and scripts — duplicates are `E_PARSE`. Not exportable; module-scoped only.
-- **Steps:**
-  - **ensure** — `ensure ref()` or `ensure ref(args…)` runs a rule (local or `alias.rule_name`). **Parentheses are required on every call site**, including zero-argument calls (`ensure check()`, not bare `ensure check`). Arguments are comma-separated inside `()`. **Bare identifier arguments** are supported and preferred (when valid): `ensure check(status)` is equivalent to `ensure check("${status}")` — the identifier must reference a known variable (`const`, capture, or named parameter); unknown names fail with `E_VALIDATE`. **Standalone `"${identifier}"` in call arguments is rejected** — use the bare form instead. Quoted strings with extra text (e.g. `"prefix_${name}"`) stay valid. Jaiph keywords cannot be used as bare identifiers. Optionally `ensure ref(…) catch (<name>) <body>`: the recovery body runs **once** on failure (no built-in retry on `ensure` — use `run … recover` for loops). The binding receives merged stdout+stderr from the failed rule. Full output also lives in **`.out` / `.err`** artifacts. Works in workflows and rules.
-  - **run** — `run ref()` or `run ref(args…)` runs a workflow or script (local or `alias.name`). Same **required `()` on every call site** as `ensure`, including zero args (`run setup()`). In a **workflow**, the target may be another workflow or a script; in a **rule**, the target must be a **script** only (`E_VALIDATE` if you name a workflow). **`run` does not forward CLI positional args implicitly** — the entry workflow binds them into named params and must pass values explicitly into callees. **Bare identifier arguments** follow the same rules as `ensure` when applicable. **Nested managed calls inside argument lists must use keywords:** `run foo(run bar())`, `run foo(ensure check())`; bare `run foo(bar())`/`run foo(\`...\`())` forms are rejected. Optionally `catch (<name>)` (runs once on failure, mutually exclusive with `recover`) or `recover (<name>)` (repair-and-retry loop; attempt cap is **`run.recover_limit`** from the **file’s top-level** `config { … }`, default **10** — the runtime does not apply this setting from a workflow’s inner `config` block). **`catch` / `recover` on `run`** are allowed in workflows and rules (rules: callee must remain a script). Also **inline scripts**: `` run `body`(args) `` or `` run ```lang...body...```(args) `` — see Scripts above.
-  - **log** — `log "message"` writes the expanded message to **stdout** and emits a **`LOG`** event; the CLI shows it in the progress tree at the current depth. Double-quoted string; `${identifier}` interpolation works at runtime. For multiline messages, use triple quotes: `log """..."""`. **Bare identifier form:** `log foo` (no quotes) expands to `log "${foo}"` — the variable's value is logged. Works with `const`, capture, and named parameters. **Inline capture interpolation** is also supported: `${run ref([args])}` and `${ensure ref([args])}` execute a managed call and inline the result (e.g. `log "Got: ${run greet()}"`). Nested inline captures are rejected. **`LOG`** events and `run_summary.jsonl` store the **same** message string (JSON-escaped for the payload). No spinner, no timing — a static annotation. See [CLI Reference](cli.md) for tree formatting. Useful for marking workflow phases (e.g. `log "Starting analysis phase"`).
-  - **logerr** — `logerr "message"` is identical to `log` except the message goes to **stderr** and the event type is **`LOGERR`**. In the progress tree, `logerr` lines use a red `!` instead of the dim `ℹ` used by `log`. Same quoting, interpolation, bare identifier, and triple-quote rules as `log` (e.g. `logerr err_msg`, `logerr """..."""`).
-  - **Send** — After `<-`, use a **double-quoted literal**, **triple-quoted block** (`channel <- """..."""`), **`${var}`**, or **`run ref([args])`**. An explicit RHS is always required — bare `channel <-` (without a value) is invalid. Raw shell on the RHS is rejected — use `const x = run helper()` then `channel <- "${x}"`, or `channel <- run fmt_fn()`. Combining capture and send (`name = channel <- …`) is `E_PARSE`. See [Inbox & Dispatch](inbox.md).
-  - **Route** — Routes are declared **at the top level** on channel declarations: `channel name -> workflow_ref` or `channel name -> wf1, wf2`. A `->` inside a workflow body is a **parse error** with guidance to move it to the channel declaration. When a message arrives on the channel, the runtime calls each listed **workflow** (local or `alias.workflow`), binding the dispatch values (message, channel, sender) to the target's 3 declared parameters. Route targets must declare exactly 3 parameters. Scripts and rules are not valid route targets. The dispatch queue drains after the orchestrator completes. **`NodeWorkflowRuntime` does not cap dispatch iterations** — avoid circular sends that grow the queue without bound. See [Inbox & Dispatch](inbox.md).
-  - **Bindings and capture** — `const name = …` (the `const` keyword is required for all captures). All bindings are **immutable**: a name bound by a parameter, `const`, capture, or `script` cannot be rebound in the same scope — the compiler rejects it with `E_VALIDATE: cannot rebind immutable name "…"`. For **`ensure`** / **`run` to a workflow or rule**, capture is the callee’s explicit **`return "…"`**. For **`run` to a script**, capture follows **stdout** from the script body. **`prompt`** capture is the agent answer. **`const`** RHS cannot use `$(...)` or disallowed `${...}` forms — use a **`script`** and `const x = run helper(…)`. **`const`** must not use a **bare** `ref(args…)` call shape: use **`const x = run ref(args…)`** (or **`ensure`** for rules), not **`const x = ref(args…)`** — the compiler fails with **`E_PARSE`** and suggests the **`run`** form. Do not put Jaiph symbols inside `$(...)` — use `ensure` / `run`. See [Grammar](grammar.md#immutable-bindings) and [Grammar](grammar.md#step-output-contract).
-  - **return** — `return "value"` / `return "${var}"` / `return """..."""` sets the managed return value. Also supports **direct managed calls**: `return run ref()` or `return run ref(args)` and `return ensure ref()` or `return ensure ref(args)` — these execute the target and use its result as the return value, equivalent to `const x = run ref(args)` then `return "${x}"`. Parentheses are required on all call sites.
-  - **fail** — `fail "reason"` or `fail """..."""` aborts with stderr message and non-zero exit (workflows; fails the rule when used inside a rule).
-  - **run async** — `run async ref([args...])` starts a workflow or script concurrently and returns a **`Handle<T>`**. Capture is supported: `const h = run async ref()`. The handle resolves on first non-passthrough read (string interpolation, passing as arg to `run`, comparison, conditional, match subject). Passthrough (initial capture, re-assignment) does not force resolution. Unresolved handles are implicitly joined at workflow exit. `recover` (retry loop) and `catch` (single-shot) composition work with `run async`: `run async foo() recover(err) { … }`. Workflows only — rejected in rules.
-  - **match** — `match var { "literal" => …, /regex/ => …, _ => … }` pattern-matches on a string value. The subject is always a bare identifier (no `$` or `${}`). Arms are tested top-to-bottom; the first match wins. Patterns: double-quoted string literal (exact match), `/regex/` (regex match), or `_` (wildcard — exactly one required). Usable as a statement, as an expression (`const x = match var { … }`), or with `return` (`return match var { … }`). Using `$var` or `${var}` as the match subject is a parse error. Allowed in both workflows and rules. See [Grammar](grammar.md#match).
-  - **if** — `if var == "value" { … }` or `if var =~ /pattern/ { … }`. Subject is a bare identifier. Operators: `==` (exact string equality), `!=` (inequality), `=~` (regex match), `!~` (regex non-match). Operand is a `"string"` for `==`/`!=` or `/regex/` for `=~`/`!~`. Body is a brace block of valid workflow/rule steps. No `else` branch — use `match` for exhaustive value branching. `if` is a statement (no value production; cannot use with `const` or `return`). Allowed in both workflows and rules.
-  - **for** — `for iterVar in sourceVar { … }` runs the body once per **line** of the string bound to `sourceVar` (newline-separated text, e.g. from `const`/`prompt`/`run` capture). Each iteration binds `iterVar` to one line (trimming rules match the runtime’s line split — a trailing empty line after a final newline is not an extra iteration). Allowed in workflows and rules. See [Grammar](grammar.md) for the formal production.
-- **Prompts:** Three body forms: (1) **single-line string** `prompt "..."` — double-quoted, single line only; (2) **identifier** `prompt myVar` — uses the value of an existing binding; (3) **triple-quoted block** `prompt """ ... """` — for multiline text, opening `"""` on the same line as `prompt`. Triple backticks (`` ``` ``) in prompt context are rejected with guidance — they are reserved for scripts. Multiline double-quoted strings are rejected — use a triple-quoted block instead. All forms support `${identifier}` interpolation (`${varName}`, `${paramName}`). **Inline capture interpolation** is also supported: `${run ref([args])}` and `${ensure ref([args])}` inside the prompt string or triple-quoted body (e.g. `prompt "Fix: ${ensure get_diagnostics()}"`). Nested inline captures are rejected. Bare `$varName` is not valid in orchestration strings. `$(...)` and `${var:-fallback}` are rejected. Capture: `const name = prompt "..."`, `const x = prompt myVar`, `const y = prompt """ ... """`. Optional **typed prompt:** `const name = prompt "..." returns "{ field: type, ... }"` or `const name = prompt myVar returns "..."` (flat schema; types `string`, `number`, `boolean`) validates the agent's JSON and sets `${name}` plus per-field variables accessible via **dot notation** — `${name.field}`. Dot notation is validated at compile time: the variable must be a typed prompt capture and the field must exist in the schema. **Orchestration bindings are strings:** typed fields are coerced with `String()` after JSON validation, so e.g. a numeric field is still the text `"42"` in scope. See [Grammar](grammar.md).
+Script semantics:
 
-**Quick reference examples:**
+- Bodies are **opaque** to the compiler — full shell/Python/whatever, heredocs included. The one check: do not call Jaiph symbols (`run`, `ensure`, workflow names) from inside a script body or `$(…)`.
+- **Capture = stdout.** `const v = run parse_json("pkg.json")` binds the script's stdout. Use `echo`/`printf` to return data; use exit codes (`return N` / `exit N`) for pass/fail.
+- **Arguments arrive as `$1`, `$2`, …** Module `const` values and workflow bindings are *not* exported into the subprocess environment — pass them explicitly as arguments.
+- Alternatively a manual `#!` shebang as the first body line selects the interpreter (mutually exclusive with a fence tag).
+- A newline inside a single-backtick body is a parse error — use a fenced block.
+
+**Inline scripts** for one-off commands — body before the parens, args inside:
+
+````jaiph
+run `mkdir -p "$1"`("out/reports")
+const now = run `date +%s`()
+const stats = run ```python3
+import sys; print(len(sys.argv[1]))
+```(input_text)
+````
+
+Inline scripts work in `run`, `const … = run`, `return run`, and `log run` positions. They cannot be used with `run async`. A `run` step whose body is an inline script accepts the same optional `catch (name) <body>` / `recover (name) <body>` suffix as a named-ref `run` step (same semantics — `catch` runs once, `recover` retries up to `run.recover_limit`, mutually exclusive). The other inline-script positions (`const … = run`, `return run`, `log run`) do not take those suffixes — wrap in a standalone `run` step.
+
+### Workflow steps
 
 ```jaiph
-# catch — one-shot failure handling
-ensure ci_passes() catch (failure) {
-  prompt "CI failed — fix the code."
-  run deploy(env)
+workflow release(version) {
+  ensure git_clean()                        # run a rule
+  const notes = run gen_notes(version)      # run a script/workflow, capture
+  run publish(version, notes)               # args: bare identifiers for variables
+  log "published ${version}"                # info line in the progress tree (stdout)
+  logerr "warning: slow registry"           # red ! line (stderr)
+  alerts <- "released ${version}"           # send to a channel
+  return notes                              # set this workflow's return value
 }
+```
 
-# recover — repair-and-retry loop (retries until success or limit)
-run deploy(env) recover(err) {
-  log "Deploy failed: ${err}"
-  run auto_repair(env)
-}
+- **Call arguments:** quoted literals (`"main"`), bare identifiers for in-scope variables (`version` — preferred style), quoted interpolation when the whole argument is one variable (`"${version}"` — also accepted when `version` is in scope), or explicit nested calls (`run outer(run inner())`, `run outer(ensure check())`). Bare call shapes like `run outer(inner())` are rejected. Strings mixing text and interpolation (`"v${version}"`) are fine.
+- **Arity is checked** when the callee declares parameters: `run greet("a","b")` against `workflow greet(name)` is `E_VALIDATE`.
+- **`fail "reason"`** aborts with a non-zero exit. **`return`** accepts `"string"`, `"""…"""`, a bare identifier, `run ref()` / `ensure ref()`, an inline script, or a `match` expression.
+- **`log` / `logerr`** accept `"string"`, `"""…"""`, a bare identifier (`log status` ≡ `log "${status}"`), or `log run \`cmd\`()`.
 
-# match — value branching (statement and expression forms)
-const label = match status {
-  "ok" => "success"
-  /err/ => "something went wrong"
-  _ => "unknown"
-}
+### Rules — checks only
 
-# if — conditional guard (no else; use match for exhaustive branching)
-if env == "" {
-  fail "env was not provided"
-}
-if mode =~ /^debug/ {
-  log "Debug mode enabled"
+```jaiph
+rule branch_is(expected) {
+  run `test "$(git branch --show-current)" = "$1"`(expected)
 }
 
-# for — iterate over lines of a string variable
-const paths = """
-docs/a.md
-docs/b.md
-"""
-for path in paths {
-  log "${path}"
+rule preconditions() {
+  ensure branch_is("main")
+  ensure git_clean()
 }
+```
 
-# typed prompt — structured JSON with dot-notation field access
-const result = prompt "Analyze this code" returns "{ type: string, risk: string }"
-log "Type: ${result.type}, Risk: ${result.risk}"
+Allowed in rule bodies: `ensure`, `run` (**scripts only**), `const`, `if`, `match`, `for`, `log`/`logerr`, `fail`, `return`, `catch`/`recover` suffixes. **Not allowed:** `prompt`, channel sends, `run async`, `run` to a workflow, raw shell lines. A rule passes when it exits 0. Treat rules as read-only: do mutations in workflows and scripts.
 
-# const capture — from run, ensure, prompt
-const tag = run get_version()
-const ok = ensure validate(tag)
-const answer = prompt "Summarize the changes"
+### Prompts — delegating to an agent
 
-# inline scripts — one-off commands without a named script definition
-run `echo $1`("hello")
-const ts = run `date +%s`()
-```
+```jaiph
+prompt "Summarize the diff in one paragraph"          # fire and forget
+const answer = prompt "Summarize the diff"            # capture the agent's answer
 
-Conventions:
+const body = "Review this plan: ${plan}"
+prompt body                                           # identifier form
 
-- `jaiph run <file.jh>` executes `workflow default` in that file. The file must define a `workflow default` (the runtime checks for it and exits with an error if missing).
-- Inside a workflow, reach other workflows/scripts with **`run ref()`**. Free-form bash can appear as **inline shell** lines when the grammar allows; prefer **`script`** + **`run`** for anything non-trivial. Never use `fn args` or `$(fn …)` as a substitute for **`run`**.
-- Inside a rule, use `ensure` for **rules** and `run` for **scripts only** — not `prompt`, `send`, or `run async`.
-- Treat rules as non-mutating checks; perform filesystem or agent mutations in **workflows**. Script steps from rules use the same managed subprocess path as workflows. Details: [Sandboxing](sandboxing.md).
-- **Parallelism:** `run async ref([args...])` for managed async with implicit join. For concurrent **bash**, use `&` and the shell builtin `wait` inside a **`script`** and call it with `run`. Do not call Jaiph internals from background subprocesses unless you understand how isolation and logging interact with the runtime.
-- **Shell conditions:** Express conditionals with `run` to a **script** and handle failure with `catch`, or use `if` / `match` for value branching. Short-circuit brace groups remain valid **inside `script`** bodies: `cmd || { ... }`.
-- **No shell redirection around managed calls:** `run foo() > file`, `run foo() | cmd`, `run foo() &` are all `E_PARSE` errors — shell operators (`>`, `>>`, `|`, `&`) are not supported adjacent to `run` or `ensure` steps. Move shell pipelines and redirections into a **`script`** block and call it with `run`.
-- **Script reuse:** Prefer `import script "./tool.py" as tool` (or a sibling `.jh` module) instead of maintaining ad-hoc bash outside the compiler. Avoid informal workspace-level shared-bash directories that bypass the module graph.
-- **Unified namespace:** Channels, rules, workflows, scripts, script import aliases, and module-scoped `local`/`const` share a single namespace per module (`E_PARSE` on collision).
-- **Calling conventions (compiler-enforced):** `ensure` must target a rule — using it on a workflow or script is `E_VALIDATE`. `run` in a **workflow** must target a workflow or script; `run` in a **rule** must target a **script** only. **Type crossing:** `string` and `script` are distinct primitive types — `prompt` rejects script names, `run` rejects string consts, assigning a script to a `const` or interpolating `${scriptName}` are all `E_VALIDATE`. See [Grammar — Types](grammar.md#types). Jaiph symbols must not appear inside `$(...)` in bash contexts the compiler still scans (principally **`script`** bodies). Script bodies cannot contain `run`, `ensure`, `config`, nested definitions, routes, or Jaiph `fail` / `const` / `log` / `logerr` / `return "…"`.
+const review = prompt """
+You are reviewing a release plan.
+Approve only if all checks below are addressed.
+Plan:
+${plan}
+"""
+```
 
-## Authoring Heuristics
+**Typed prompts** force structured JSON output and give you field access:
 
-- Keep workflows short and explicit.
-- Put expensive checks after fast checks.
-- Include clear prompts with concrete acceptance criteria.
-- Reuse rules via `ensure`; reuse workflows and scripts via `run`.
-- **Always run `jaiph format` on `.jh` files you create or modify before committing.** This ensures canonical whitespace, indentation, and top-level ordering. In CI, use `jaiph format --check` to gate on formatting.
-- Use only syntax described in [jaiph.org](https://jaiph.org) and [Grammar](grammar.md). For advanced constructs (e.g. `config` block, `export`, prompt capture), see the grammar. For testing workflows, see [Testing](testing.md) (`expect_contain`, `expect_not_contain`, `expect_equal`, mocks).
+```jaiph
+const r = prompt "Assess this change" returns "{ verdict: string, risk: string }"
+log "verdict=${r.verdict} risk=${r.risk}"
+# if/match accept dot subjects on typed prompt captures — no rebind needed
+if r.verdict == "reject" {
+  fail "rejected: ${r.risk}"
+}
+```
+
+- Schema is **flat**, types `string` | `number` | `boolean` only. Capture (`const r =`) is **required** with `returns`.
+- The runtime extracts and validates JSON from the agent's reply; on schema mismatch the step fails. All fields are stored as **strings** (a `number` field holds the text `"42"`).
+- For a `"""` prompt, `returns "…"` goes on the closing-`"""` line or the line immediately after.
+- Triple **backticks** inside prompt context are rejected — they are script delimiters. Use indentation or quotes for code in prompt text.
 
-## Writing Tests
+Backend is configured, not per-prompt: `agent.backend` = `cursor` (default) | `claude` | `codex`, plus `agent.default_model`, via `config { … }` or `JAIPH_AGENT_*` env vars (env wins). On the **cursor** backend only, `agent.command` can point at a custom executable (prompt on stdin, answer on stdout); `claude` and `codex` ignore `agent.command`.
 
-Test files use the `*.test.jh` suffix and contain `test "name" { ... }` blocks. They import the workflows under test and use mocks to replace live agent/script behavior. The test runner uses the same `NodeWorkflowRuntime` as `jaiph run`. See [Testing](testing.md) for the full reference.
+**Write prompts like task briefs:** state the goal, the constraints, the acceptance criteria, and what to output. Interpolate concrete context (`${task}`, `${diff}`, captured file contents) rather than asking the agent to go find it.
 
-**Running:** `jaiph test` (all `*.test.jh` in workspace), `jaiph test <dir>` (recursive), or `jaiph test <file.test.jh>` (single file).
+### Failure handling: `catch` and `recover`
 
-**Available mocks:**
+```jaiph
+# catch — runs ONCE on failure, then continues
+run deploy(env) catch (err) {
+  logerr "deploy failed: ${err}"
+  run rollback(env)
+}
 
-- `mock prompt "fixed response"` — queues a fixed response for the next `prompt` call (multiple queue in order).
-- `mock prompt responseVar` — uses the string already bound as `responseVar` (e.g. a `const` earlier in the block) as the next response.
-- `mock prompt { /pattern/ => "response", _ => "default" }` — content-based dispatch.
-- `mock workflow alias.name() { return "stubbed" }` — replaces a workflow body.
-- `mock rule alias.name() { return "ok" }` — replaces a rule body.
-- `mock script alias.name() { … }` — replaces a script body with **shell lines** between the braces (same line as `{` is not enough; put the shell on the following lines, then `}` on its own line).
+# recover — repair-and-RETRY loop: run target → on failure run body → retry target
+run tests() recover (err) {
+  prompt "Tests failed. Fix the code. Failure output: ${err}"
+}
+```
 
-**Assertions:**
+- The binding (`err`) receives the merged stdout+stderr of the failed execution. Exactly one binding, always in parentheses — bare `catch {` is a parse error.
+- `catch` works on `ensure` and `run`; `recover` works on `run` (and `run async`) only. They are mutually exclusive on one step.
+- `recover` retries until success or `run.recover_limit` (default **10**; workflow-level config overrides module-level).
+- A common pattern: a `catch` whose body is the "else branch" — note `return` inside a catch body returns from the **enclosing workflow**.
 
-- `expect_contain var "expected substring"`
-- `expect_not_contain var "unwanted text"`
-- `expect_equal var "exact expected value"`
+`recover` + `prompt` is Jaiph's signature loop for repetitive agent work: *check → if broken, ask agent to fix → re-check*, fully unattended.
 
-**Minimal example:**
+### Control flow: `if`, `match`, `for`
 
 ```jaiph
-import "main.jh" as app
+if status == "ok" { log "healthy" }       # operators: == != =~ !~
+if msg =~ /ERROR|FATAL/ { fail "bad" }    # =~ / !~ take /regex/
 
-test "happy path produces greeting" {
-  mock prompt "hello from mock"
-  const out = run app.default("task")
-  expect_contain out "hello from mock"
+const label = match status {              # statement, expression, or return form
+  "ok" => "success"
+  /^warn/ => "warning"
+  _ => "unknown"
 }
 
-test "handles failure gracefully" {
-  mock prompt "error"
-  const out = run app.default("bad input") allow_failure
-  expect_contain out "error"
+for path in paths {                       # iterates LINES of the string `paths`
+  run process(path)
 }
 ```
 
-`allow_failure` on a `run` step (with or without `const … =`) prevents a non-zero workflow exit from failing the test — useful for testing error paths. For **`mock script`**, put shell lines on lines after the opening `{`, then close with `}` on its own line (see [Testing](testing.md)).
+- Subjects for `if` and `match` are bare identifiers (`if status == …`, `match status {`) or `IDENT.IDENT` reading a field from a typed prompt capture (`if r.verdict == "ok"`, `match r.verdict { … }`). `$status` / `${status}` as subject is still a parse error. Dot subjects on a non-typed-capture variable, or a field not in the prompt's `returns` schema, get the same `E_VALIDATE` errors as `${var.field}` interpolation. `for` iterators stay bare identifiers (`for x in lines`).
+- `if` supports an optional `else` branch — `} else {` must be on **the same line** as the closing `}` of the `if` body. **No `else if` chaining**: nest an `if` inside the `else` block, or use `match` for multi-way branching.
+- `match`: arms are newline-separated (no commas), first match wins, exactly one `_` arm required. Arm bodies: string, `"""…"""`, in-scope identifier, `${var}`, `fail "…"`, `run ref()`, `ensure ref()`. **Not** allowed in arms: `return` (write `return match x { … }`), `log`/`logerr`, inline scripts — capture the match result into a `const` and act on it after.
+- `for` splits the source string on newlines (a trailing final newline does not produce an empty iteration). There is no numeric/while loop — iterate lines, use `recover`, or use recursive workflows (depth limit 256).
 
-## Suggested Starter Layout
+### Channels — fan-out between workflows
 
-- `.jaiph/bootstrap.jh` — Created by `jaiph init`; contains a single triple-quoted prompt (`prompt """ ... """`) that points the agent at `.jaiph/SKILL.md` (a copy of this guide).
-- `.jaiph/readiness.jh` — Preflight: rules and `workflow default` that runs readiness checks.
-- `.jaiph/ba_review.jh` (or any name you choose) — (Optional) Pre-implementation review: reads tasks from a queue file, sends one to an agent for review, and marks it dev-ready or exits with questions. This repository uses `.jaiph/architect_review.jh` with `QUEUE.md`.
-- `.jaiph/verification.jh` — Verification: rules and `workflow default` for lint/test/build.
-- `.jaiph/main.jh` — Imports readiness, optional review, and verification; defines implementation workflow and `workflow default` that orchestrates preflight → (optional) review → implementation → verification.
+```jaiph
+channel findings -> analyst, reviewer     # routes declared at TOP LEVEL only
 
-Optional: `.jaiph/implementation.jh` if you prefer the implementation workflow in a separate module; otherwise keep it in `main.jh`.
+workflow scanner() {
+  findings <- "Found 3 issues in auth"    # RHS: "literal", """block""", ${var}, or run ref()
+}
 
-## Final Output Requirement
+workflow analyst(message, chan, sender) { # route targets declare EXACTLY 3 params
+  log "from ${sender}: ${message}"
+}
 
-After scaffolding workflows, print the exact commands the developer should run. The primary command runs the default entrypoint (typically preflight, then implementation, then verification — plus any optional review step you added). Point users to the canonical skill URL for agents: <https://raw.githubusercontent.com/jaiphlang/jaiph/refs/heads/main/docs/jaiph-skill.md>.
+workflow default() {
+  run scanner()                           # dispatch happens AFTER steps finish
+}
+```
 
-Include a compile check and, when the repository has native tests (`*.test.jh`), `jaiph test` (see [Testing](testing.md)); skip `jaiph test` if there are no test files, since discovery mode exits with an error when nothing matches.
+Sends enqueue in memory; the queue drains after the owning workflow's steps complete, calling each target sequentially. A `->` inside a workflow body is a parse error. Sends on a channel with no route are silently dropped. Each workflow frame may drain at most **1000** messages before the runtime aborts the owning workflow with `E_INBOX_DISPATCH_LIMIT` (naming the channel that hit the cap); override via `JAIPH_INBOX_MAX_DISPATCH=<positive int>` only if the high volume is intentional. Routed payloads are persisted under the run dir as `inbox/NNN-<channel>.txt`.
 
-```bash
-jaiph format .jaiph/*.jh
-jaiph compile .jaiph
-# Omit the next line when the repo has no *.test.jh files (workspace discovery exits 1 with "no *.test.jh files found").
-jaiph test
-jaiph run .jaiph/main.jh "implement feature X"
-# Or run verification only:
-jaiph run .jaiph/verification.jh
+### Concurrency: `run async`
+
+```jaiph
+workflow default() {
+  const a = run async lint()             # returns a handle immediately
+  const b = run async unit_tests()
+  log "lint: ${a}"                       # first real read blocks + resolves
+  log "tests: ${b}"
+}                                        # unread handles are joined when this step list finishes
 ```
 
-Arguments after the file path are passed to `workflow default` as named parameters (when declared) and as `$1`, `$2` in script bodies.
+Workflows only (rejected in rules); not combinable with inline scripts. `catch`/`recover` compose with `run async`. Unread handles are joined at the end of the **current step list** (the workflow body, an `if`/`else` branch, or a `catch`/`recover` body) before control continues — channel drains run only after the entry workflow's top-level list finishes. For concurrent *shell*, use `&` + `wait` inside one script body instead.
 
-## Minimal Sample (Agent Reference)
+### Config
 
-Use this as a shape to adapt. Paths and prompts should match the target repository. All three files live under `.jaiph/`. Imports in `main.jh` are relative to that file (e.g. `"readiness.jh"` resolves to `.jaiph/readiness.jh`). When you run `jaiph run .jaiph/main.jh "implement feature X"`, the default workflow receives `"implement feature X"` as `${task}` (named parameter). Note that `run` does not forward args implicitly, so the default workflow passes `task` as a bare identifier to `run implement(task)` so the implement workflow's prompt can use `${task}`.
+```jaiph
+config {
+  agent.backend = "claude"               # cursor | claude | codex
+  agent.default_model = "claude-sonnet-4-6"
+  run.recover_limit = 5                  # workflow-level config also honored
+  run.logs_dir = ".jaiph/runs"
+}
+```
 
-**File: .jaiph/readiness.jh**
+Precedence: **environment > workflow-level config > module-level config > defaults**. A workflow body may open with its own `config { … }` (before any steps; `agent.*`/`run.*` keys only) to override the model or backend for just that workflow. Docker on/off is env-only (`JAIPH_UNSAFE`, `JAIPH_DOCKER_ENABLED`); image/network/timeout come from `runtime.*` keys or `JAIPH_DOCKER_*`.
 
-```jaiph
-script git_is_clean = `test -z "$(git status --porcelain)"`
+## Compile errors you will see, and the fix
 
-rule git_clean() {
-  run git_is_clean() catch (err) {
-    fail "git working tree is not clean"
-  }
-}
+| Error (abridged) | Fix |
+|---|---|
+| `E_PARSE` missing `()` on definition/call | Add parentheses: `workflow default()`, `run setup()` |
+| `E_PARSE` assignment without `const` | `const x = run foo()` |
+| `E_VALIDATE` cannot rebind immutable name | Rename the new binding — nothing is reassignable |
+| `E_VALIDATE` `ensure` on non-rule / `run` on rule | Match keyword to callee: rules→`ensure`, scripts/workflows→`run` |
+| `E_VALIDATE` `run` to workflow inside rule | Rules may `run` scripts only; restructure or move to a workflow |
+| `E_VALIDATE` inline shell forbidden in rules | Wrap the shell in a `script` (named or inline) and `run` it |
+| `E_PARSE` `${…}` in single-backtick script | Use `$1`/`$2` args, or switch to a fenced ``` block |
+| `E_VALIDATE` unknown identifier / unknown `${name}` | Declare it (`const`/param) before use; check spelling |
+| `E_VALIDATE` nested call must be explicit | `run f(run g())`, not `run f(g())` |
+| `E_VALIDATE` duplicate import alias | Use a unique `as` name for each `import` |
+| `E_VALIDATE` arity mismatch | Match the callee's declared parameter count |
+| `E_PARSE` redirection after managed call | Move pipes/redirects into a script body |
+| `E_VALIDATE` scripts are not values/promptable | Scripts aren't strings: don't `const x = scriptName`, `${scriptName}`, or `prompt scriptName` |
+| `E_PARSE` `->` inside workflow body | Move the route to the top-level `channel` line |
+| `E_PARSE` `prompt … returns` without capture | `const x = prompt … returns "…"` |
+| `E_SCHEMA` invalid returns schema | Flat `{ field: string|number|boolean }` only |
+| `E_IMPORT_NOT_FOUND` | Fix the path (relative to the importing file) or `jaiph install` the library |
+
+## Runtime model (what happens when it runs)
+
+- `jaiph run file.jh args…` validates the import closure, emits script bodies as executable files, then interprets `workflow default` with the args bound to its named parameters. Scripts additionally see positional args as `$1`, `$2`.
+- **Run directory:** `.jaiph/runs/<UTC-date>/<UTC-time>-<file>/` with numbered `NNNNNN-<step>.out`/`.err` per step (written incrementally — `tail -f` works) and `run_summary.jsonl`, one JSON event per line (`WORKFLOW_START/END`, `STEP_START/END`, `LOG`, `INBOX_*`, `PROMPT_*`). When debugging a failed run, read the failure footer the CLI prints, then the referenced `.err`/`.out` files.
+- **Return value:** if `default` returns a string, the CLI prints it to stdout after the PASS line.
+- **Capture sources:** workflow/rule → its explicit `return` value; script → stdout; prompt → the agent's answer.
+- Step environment: scripts inherit the runner's environment plus `JAIPH_WORKSPACE`, `JAIPH_SCRIPTS`, `JAIPH_RUN_DIR`, `JAIPH_ARTIFACTS_DIR`, etc. Workflow variables are **not** auto-exported — pass them as arguments.
+
+## Testing your workflows
+
+Test files are `*.test.jh` next to your modules, run with `jaiph test`. They execute the same interpreter with prompts and bodies mocked — no live LLM calls.
 
-script require_git_node_npm = ```
-command -v git
-command -v node
-command -v npm
-```
+```jaiph
+import "main.jh" as app
 
-rule required_tools() {
-  run require_git_node_npm()
+test "happy path" {
+  mock prompt "LGTM — implemented"
+  const out = run app.default("add logging")
+  expect_contain out "LGTM"
 }
 
-workflow default() {
-  ensure required_tools()
-  ensure git_clean()
+test "failure path is handled" {
+  mock prompt { /fix/ => "fixed", _ => "noop" }   # content-based dispatch
+  mock script app.run_tests() {
+    exit 1
+  }
+  const out = run app.default("x") allow_failure   # non-zero exit doesn't fail the test
+  expect_contain out "rollback"
 }
 ```
 
-**File: .jaiph/verification.jh**
+- Mocks: `mock prompt "…"` (queued, one per prompt call), `mock prompt { /re/ => "…", _ => "…" }`, `mock workflow ref() { … }`, `mock rule ref() { … }`, `mock script ref() { shell lines }`. All mock refs need `()`.
+- Assertions: `expect_contain`, `expect_not_contain`, `expect_equal` — `expect_* <captureVar> "literal"` or a test-block `const` name.
+- For typed prompts, the mock text must be one line of valid JSON matching the schema.
+- Mixing queued `mock prompt "…"` / `mock prompt <const>` and a `mock prompt { … }` block in one test is rejected at compile time (`E_VALIDATE`: `cannot mix "mock prompt { … }" with queued "mock prompt …" in one test block; choose one style`). Use one style per block; separate tests in the same file may use different styles.
 
-```jaiph
-script npm_test_ci = `npm test`
+Write at least one test per workflow you author when the repo uses tests; mock every prompt so the suite is deterministic.
 
-rule unit_tests_pass() {
-  run npm_test_ci()
-}
+## Patterns for repetitive tasks
 
-script run_build = `npm run build`
+**Gate → do → verify** (the standard delivery shape):
 
-rule build_passes() {
-  run run_build()
+```jaiph
+workflow default(task) {
+  ensure preconditions()          # fast checks first
+  run implement(task)             # prompt-driven work
+  run verify() recover (err) {    # verification with self-repair
+    prompt "Verification failed — fix it. Output: ${err}"
+  }
 }
+```
+
+**Process a queue of items** (line-oriented `for`):
 
+```jaiph
 workflow default() {
-  ensure unit_tests_pass()
-  ensure build_passes()
+  const items = run `ls inbox/*.md 2>/dev/null || true`()
+  for item in items {
+    run handle(item)
+  }
 }
 ```
 
-**File: .jaiph/main.jh**
+**Review-then-act with a typed verdict:**
 
 ```jaiph
-import "readiness.jh" as readiness
-import "verification.jh" as verification
+workflow triage(item) {
+  const r = prompt "Is this ready to implement? Item: ${item}" returns "{ verdict: string, reason: string }"
+  const outcome = match r.verdict {
+    "ready" => run implement(item)
+    _ => "skipped: ${r.reason}"
+  }
+  log outcome
+}
+```
 
-workflow implement(task) {
-  prompt """
-Implement the requested feature or fix with minimal, reviewable changes.
-Keep edits consistent with existing architecture and style.
-Add or update tests for behavior changes.
+**Pipeline stages via channels** when later stages should react to earlier ones without direct calls (see the channel section above).
 
-User asks for: ${task}
-"""
-}
+## What to produce in a repository
 
-workflow default(task) {
-  run readiness.default()
-  run implement(task)
-  run verification.default()
-}
+When asked to scaffold Jaiph automation (e.g. after `jaiph init`), build a small composable set under `.jaiph/`:
+
+- `.jaiph/readiness.jh` — preflight rules (required tools, clean git) + `workflow default` running them.
+- `.jaiph/verification.jh` — lint/test/build rules + `workflow default`.
+- `.jaiph/main.jh` — imports both, defines the prompt-driven `implement` workflow, and a `workflow default(task)` wiring **preflight → implement → verification**.
+- Optional: a review workflow gating a task queue, `*.test.jh` tests for the workflows.
+
+Keep workflows short; put expensive checks after cheap ones; pass data explicitly. Always finish with format + compile:
+
+```bash
+jaiph format .jaiph/*.jh
+jaiph compile .jaiph
+jaiph test                       # safe even when no *.test.jh exists yet
+jaiph run .jaiph/main.jh "implement feature X"
 ```
+
+End your scaffolding response by printing those exact commands for the user, plus a short **WHAT CHANGED** / **WHY** summary. Canonical agent-readable copy of this skill: <https://raw.githubusercontent.com/jaiphlang/jaiph/refs/heads/main/docs/jaiph-skill.md>.
diff --git a/docs/language.md b/docs/language.md
index 8d6c789d..86c29270 100644
--- a/docs/language.md
+++ b/docs/language.md
@@ -1,788 +1,411 @@
 ---
 title: Language
-permalink: /language
+permalink: /reference/language
+diataxis: reference
 redirect_from:
+  - /language
   - /language.md
 ---
 
 # Language
 
-Workflow systems usually need two layers: a **host language** that sequences work, handles failures, and talks to tools, and **task code** (shell, Python, and so on) that does the mechanical steps. Jaiph’s `.jh` modules are that host layer: they wire prompts, scripts, validation **rules**, and **channels** into pipelines you can run from the CLI or CI.
+This page is the per-step reference: every `WorkflowStepDef` variant and every `Expr` kind the runtime executes, with the visible contract. For the formal grammar (EBNF, lexical rules, validation catalog) see [Grammar](grammar.md). For the conceptual model — why the language is shaped this way — see [Why Jaiph](why-jaiph.md).
 
-Under the hood, the **TypeScript CLI** parses modules, runs **`validateReferences`** while emitting script files (`emitScriptsForModule` / `buildScripts`), then starts a **Node workflow runtime** that walks the same AST in process — there is no separate workflow shell. The **`jaiph compile`** command walks the same import closure with **`validateReferences`** only — it **does not** emit `scripts/`, **invoke** **`buildRuntimeGraph`**, or spawn the workflow runner (`src/cli/commands/compile.ts`). The runtime’s **`buildRuntimeGraph`** pass loads imports with the parser only; compile-time checks live in the transpile path, not in the graph loader. For repository layout, event contracts, and diagrams, see [Architecture](architecture.md).
+The runtime is `NodeWorkflowRuntime` (`src/runtime/kernel/node-workflow-runtime.ts`). Step dispatch is driven by `WorkflowStepDef.type` (8 variants). Value evaluation goes through one private `evaluateExpr` over `Expr.kind` (8 variants); see [Architecture — AST / Types](architecture.md#core-components).
 
-This page is the practical reference for language primitives — syntax, steps, and runtime behavior at the author’s eye level. For lexical/syntax tables and edge-case grammar, see [Grammar](grammar.md). Test files (`*.test.jh`) are a dialect documented in [Testing](testing.md).
+## Value types
 
-## Strings
-
-Strings are the general-purpose value type. They can be interpolated, passed as arguments, assigned to `const` bindings, and sent to an agent via `prompt`.
-
-**Single-line** — double-quoted:
-
-```jaiph
-const greeting = "Hello, ${name}."
-prompt "Review the code for issues"
-```
-
-**Multiline** — triple-quoted (`"""…"""`):
-
-```jaiph
-const instructions = """
-You are a code reviewer.
-Analyze the following: ${input}
-Be concise.
-"""
-prompt instructions
-```
-
-Triple-quoted strings preserve internal newlines and support `${…}` interpolation. Leading/trailing blank lines adjacent to the `"""` delimiters are trimmed.
-
-Single-quoted strings are parse errors. Use `\"` for literal double quotes inside strings, `\\` for literal backslashes.
-
-## Scripts
-
-Scripts are executable definitions — shell (or polyglot) code that runs as an isolated subprocess. They are invoked with `run` and cannot be interpolated, assigned to variables, or used as prompt bodies. The compiler enforces this at every call site.
-
-**Single-line** — backtick:
-
-```jaiph
-script greet = `echo "Hello, $1"`
-```
-
-Backtick scripts do not support `${…}` Jaiph interpolation — the compiler rejects it to prevent ambiguity with shell expansion. Use positional arguments (`$1`, `$2`, …).
-
-**Multiline** — fenced block:
-
-<pre><code>script setup_env = ```
-export BASE_DIR=$(pwd)
-mkdir -p "$BASE_DIR/output"
-echo "Environment initialized"
-```
-</code></pre>
-
-Fenced scripts support `${…}` — it passes through to the shell as standard shell parameter expansion.
-
-**Polyglot** — use a fence lang tag to select the interpreter:
-
-<pre><code>script analyze = ```python3
-import sys
-print(f"Analyzing {sys.argv[1]}")
-```
-</code></pre>
-
-The tag maps to `#!/usr/bin/env <tag>`. Any tag is valid. Alternatively, use a manual `#!` shebang as the first line. Combining both is an error. If the body has **neither** a fence lang tag nor a leading `#!` line, emitted scripts default to `#!/usr/bin/env bash`.
-
-Strings and scripts are structurally distinct and non-interchangeable — using one where the other is expected produces a compile-time error.
-
-## Module Structure
-
-A `.jh` file is a module. Modules contain top-level declarations in any order: imports, config, channels, constants, rules, scripts, and workflows. `jaiph format` hoists imports, config, and channels to the top but preserves the relative order of everything else.
-
-### Imports and Exports
-
-`import` loads another module; `export` marks a declaration as public. All three definition types support export: `export workflow`, `export rule`, and `export script`.
-
-```jaiph
-import "tools/security.jh" as security
-import "bootstrap.jh" as bootstrap
-
-export script build_docs = `mkdocs build`
-
-export workflow default() {
-  ensure security.scan_passes()
-  run bootstrap.nodejs()
-}
-```
-
-Imported symbols use dot notation: `alias.name`. The `.jh` extension is appended automatically if omitted. Import aliases must be unique within a module.
-
-#### Script Imports
-
-`import script` loads an external script file and binds it to a local script symbol. The imported file is treated as raw script source (not as a Jaiph module) — shebangs are preserved and used to select the interpreter. The bound name works exactly like a locally declared `script`: callable with `run`, capturable with `const`, and subject to the same isolation rules.
-
-```jaiph
-import script "./queue.py" as queue
-
-workflow default() {
-  const result = run queue("get")
-  log result
-}
-```
-
-The path is resolved relative to the importing `.jh` file's directory (not the process CWD). The path must be double-quoted. Missing targets fail at compile time with `E_IMPORT_NOT_FOUND`.
-
-This is useful when a script body is large enough that embedding it inline couples DSL structure and script implementation too tightly, or when you want normal editor/tooling support (syntax highlighting, linting) on the script file.
-
-#### Export Visibility
-
-If a module contains at least one `export` declaration, it has an **explicit API surface**: only exported names can be referenced through the import alias. Referencing a symbol that exists in the module but is not exported produces a compile-time error:
-
-```
-E_VALIDATE: "private_rule" is not exported from module "lib"
-```
-
-Modules with **zero** `export` declarations retain legacy behavior — every top-level rule, script, and workflow is implicitly public. This means existing projects that don't use `export` continue to work without changes.
-
-The check applies uniformly to all qualified-reference positions: `run`, `ensure`, channel route targets, `send` RHS, and test mocks.
-
-### Library Imports
-
-Import paths resolve relative to the importing file first. If no file is found and the path contains a `/`, the resolver falls back to project-scoped libraries under `.jaiph/libs/`:
-
-```jaiph
-import "queue-lib/queue" as queue   # resolves to .jaiph/libs/queue-lib/queue.jh
-```
-
-The path is split as `<lib-name>/<path-inside-lib>`. Libraries are installed with `jaiph install` — see [CLI — jaiph install](cli.md#jaiph-install). Missing library imports fail at compile time with `E_IMPORT_NOT_FOUND`.
-
-### Top-Level `const`
-
-Module-scoped variables accessible as `${name}` inside that module's rules and workflows.
-
-```jaiph
-const REPO = "my-project"
-const MAX_RETRIES = 3
-const GREETING = """
-Hello,
-world
-"""
-```
-
-Values can be double-quoted strings (single-line), triple-quoted strings (multiline `"""..."""`), or a **bare** right-hand side: everything after `=` on that line becomes the stored string verbatim (including tokens that look like numbers, for example `const N = 42` keeps **`"42"`** as text for `${N}` — there is no separate numeric type).
-
-Declaration order matters — `${name}` only expands variables already bound above. Module constants are **not** passed to script subprocesses; use arguments or shared libraries instead.
-
-### Channels
-
-Named message queues for inter-workflow communication. Declared at the top level, one per line.
-
-```jaiph
-channel alerts
-channel findings -> analyst
-channel events -> handler_a, handler_b
-```
-
-Routes (`->`) declare which workflows receive messages sent to the channel. See [Inbox & Dispatch](inbox.md) for dispatch semantics.
-
-### Config
-
-Optional `config { … }` block. At **module** level only the keys allowed in **`src/parse/metadata.ts`** are accepted (`agent.*`, `run.*`, `runtime.*`, `module.*` — each assignment is validated for type). For example **`agent.backend`** must be **`cursor`**, **`claude`**, or **`codex`**. A **workflow** may contain **at most one** nested `config { … }`, it must appear **before** the first step, and only **`agent.*`** and **`run.*`** are allowed there — `runtime.*` and `module.*` are rejected with `E_PARSE`.
-
-```jaiph
-config {
-  agent.default_model = "claude-sonnet-4-6"
-  agent.backend = "claude"
-  run.debug = true
-}
-```
-
-See [Configuration](configuration.md) for key semantics and precedence rules.
-
-## Definitions
-
-### Workflows
-
-Named sequences of orchestration steps. Workflows can call other workflows, scripts, prompts, and channels. Parentheses are required on definitions, even when parameterless.
-
-`jaiph run` only executes the workflow named **`default`** in the entry `.jh` file (the runner’s argv hard-codes that name today). Other workflows are reachable from steps inside the module or its imports. See the `jaiph run` sequence in [Architecture](architecture.md).
-
-```jaiph
-workflow default() {
-  ensure check_deps()
-  run setup_env()
-  prompt "Review the code for issues"
-}
-
-workflow deploy(env, version) {
-  log "Deploying ${version} to ${env}"
-  run build(version)
-  run push(env)
-}
-```
-
-Workflows support all step types: `run`, `ensure`, `prompt`, `const`, `log`, `logerr`, `fail`, `return`, `send`, `match`, `if`, `run async`, `catch`, and `recover`.
-
-#### Inline shell lines (workflows only)
-
-Any workflow body line that does **not** parse as a managed Jaiph step is treated as **inline shell**: the text is Jaiph-interpolated, then executed with `sh -c` in the workspace (same working-directory rules as `run` on scripts — see [Script isolation](#script-isolation)). Prefer a top-level `script` and `run name()` for non-trivial shell.
-
-The compiler still inspects shell lines (for example a first word that names a local script or workflow must be written as a managed `run`/`ensure` step, not as bare shell). **`wait`** is not a step — using it is a parse error (`"wait" has been removed from the language`).
-
-**Rules cannot** contain inline shell; unstructured shell there fails validation (`inline shell steps are forbidden in rules; use explicit script blocks`).
-
-### Rules
-
-Named blocks of structured validation steps. Rules are called with `ensure` and are meant for checks and gates.
-
-```jaiph
-rule check_deps() {
-  run verify_lockfile()
-  run check_versions()
-}
-
-rule gate(path) {
-  run check_exists(path)
-  ensure validate_format(path)
-}
-```
-
-Rules are more restricted than workflows: the compiler rejects `prompt`, `send`, and `run async` in rule bodies, and `run` may only target **scripts** (never workflows or other rules via `run` — use `ensure` for rules). Rule bodies also reject `const … = prompt`. Otherwise rule bodies share the same structured step set as workflows for control flow (**`match`**, **`if`**, **`for … in …`**), captures, logging, **`return`**, and failure handling (**`catch`** / **`recover`** on **`run`**). Those restrictions are **static** (see `validateReferences` in `src/transpile/validate.ts`). At runtime, `run` inside a rule still launches a normal managed script subprocess with the same **environment model** as workflow scripts (see [Script isolation](#script-isolation)); scripts can perform side effects — the language simply keeps orchestration-heavy steps out of rules.
-
-`catch` and **`recover`** on **`run`** are allowed in rules the same as in workflows. **`recover` never attaches to `ensure`** — only `run` steps support `recover`.
-
-### Scripts
-
-Executable shell (or polyglot) definitions. Bodies are opaque to the compiler — Jaiph does not parse them as orchestration steps. Scripts are called with `run` and execute as isolated subprocesses. See [Scripts](#scripts) above for syntax (backtick, fenced, polyglot).
-
-## Parameters and Arguments
-
-### Definitions
-
-All workflow and rule definitions require parentheses. Named parameters go inside:
-
-```jaiph
-workflow implement(task, role) {
-  log "Implementing ${task} as ${role}"
-}
-```
+| Type | Operations | Crossings |
+|---|---|---|
+| `string` | `${…}` interpolation, `run` / `ensure` arguments, `const`, `prompt` body, `send` payload, `return`. | Cannot be invoked with `run` (`E_VALIDATE: strings are not executable`). |
+| `script` | Invocable with `run`. | Not interpolatable, not `const`-assignable by name, not a valid `prompt` body. |
 
-Parameter names must be valid identifiers, unique, and not reserved keywords. Inside the body, parameters are accessed as `${paramName}`. Parameters are immutable — they cannot be rebound by `const` or any other declaration in the same scope (see [`const` — Variable Binding](#const--variable-binding) for details).
+Crossings produce specific `E_VALIDATE` messages identifying the violated rule.
 
-### Call Sites
+## Module surface
 
-Arguments are comma-separated inside parentheses:
+| Top-level | Description |
+|---|---|
+| `import "path" as alias` | Loads another module. `.jh` appended automatically. Resolution: relative-first, then library fallback (`<workspace>/.jaiph/libs/<name>/...`). |
+| `import script "path" as name` | Loads an external script file (no `.jh` appended). Path is relative-only. Treated as a `script` symbol. |
+| `export rule` / `export workflow` / `export script` | Marks a definition public. At least one `export` makes module visibility explicit; otherwise all top-level definitions are implicitly public. |
+| `channel name [-> target [, target …]]` | Declares a named queue. Inline routes target workflows with exactly three parameters (message, channel, sender). |
+| `const NAME = value` | Module-scoped immutable string. Values: double-quoted, triple-quoted, or bare token. Stored verbatim. |
+| `config { … }` | Module-level configuration block (`agent.*`, `run.*`, `runtime.*`, `module.*`). See [Configuration](configuration.md). |
+| `rule name([params]) { … }` | Validation rule. Invoked with `ensure`. |
+| `script name = …` | Executable definition. Invoked with `run`. |
+| `workflow name([params]) { … }` | Orchestration entrypoint. Invoked with `run` (or by `jaiph run` for `default`). |
 
-```jaiph
-run setup()
-run deploy("prod", version)
-```
+Visibility rule: when a module has at least one `export`, only exported names are reachable through its alias (`E_VALIDATE: "<name>" is not exported from module "<alias>"`).
 
-**Bare identifier arguments** pass a variable’s value without quoting; the compiler records the identifier so unknown names fail early. You can still pass the same value as a quoted orchestration string (for example `run greet("${name}")` when a literal is required), but **prefer the bare form** when the whole argument is exactly one binding — it reads clearly and matches formatter output.
+The unified per-module namespace covers channels, rules, workflows, scripts, script-import aliases, and top-level `const`. Duplicates are `E_PARSE`.
 
-```jaiph
-const task = run get_next_task()
-run process(task)                    # bare identifier — passes value of task
-run process(task, "extra context")   # mixed bare + quoted literal
-run greet("hello_${name}")           # quoted string with extra text — allowed
-```
-
-### Nested Managed Calls in Arguments
+## Workflow body — step types
 
-Call arguments can contain nested managed calls — but the `run` or `ensure` keyword must be explicit. This is a deliberate language rule: scripts and workflows execute only via `run`, and rules execute only via `ensure`, even when nested inside another call's arguments.
+There are eight `WorkflowStepDef` variants. Every body line that does not match a managed form becomes a `shell` step (workflows only — rules reject unrecognised shell).
 
-**Valid — explicit nested calls:**
-
-```jaiph
-run mkdir_p_simple(run jaiph_tmp_dir())
-run do_work(ensure check_ok())
-run do_work(run `echo aaa`())
-```
-
-The nested call executes first and its result is passed as a single argument to the outer call.
-
-**Invalid — bare call-like forms:**
-
-```jaiph
-# run do_work(bar())          — E_VALIDATE: use "run bar()" or "ensure bar()"
-# run do_work(rule_bar())     — E_VALIDATE: use "ensure rule_bar()"
-# run do_work(`echo aaa`())   — E_VALIDATE: use "run `...`()"
-# const x = bar()             — E_PARSE: use "const x = run bar()"
-```
+| Type | Surface | Description |
+|---|---|---|
+| `exec` | `run` / `ensure` / `prompt` / standalone `match` / inline shell | Side-effecting managed call statement. The discriminator (call / inline_script / prompt / match / shell) lives in `body.kind`. Carries optional `captureName`, `catch`, or `recover`. |
+| `const` | `const NAME = <expr>` | Bind a value expression to a name. |
+| `return` | `return <expr>` | Set the managed return value. |
+| `send` | `channel <- <expr>` | Enqueue a payload on a channel for the current workflow context. |
+| `say` | `log` / `logerr` / `fail` | `level: "log"` / `"logerr"` / `"fail"`. `level: "fail"` aborts with the message. |
+| `if` | `if <subject> <op> <operand> { … } [ else { … } ]` | Conditional block. |
+| `for_lines` | `for <iter> in <source> { … }` | Iterate lines of a string variable. |
+| `trivia` | comments, blank lines | Formatter-only. Skipped by the runtime and validator. |
 
-The explicit capture-then-pass form is also valid:
+## Value expressions — `Expr` kinds
 
-```jaiph
-const x = run bar()
-run foo(x)
-```
+Every value position (`const` RHS, `return`, `send` RHS, `log` / `logerr` / `fail` argument, and `exec` body) carries an `Expr` of one of eight kinds.
 
-### Arity Checking
+| Kind | Source form | Runtime behaviour |
+|---|---|---|
+| `literal` | `"…"`, `"""…"""`, `${var}`, post-dedent triple-quoted body | Interpolated against the current scope; `${run …}` / `${ensure …}` perform inline managed calls. |
+| `call` | `run ref(args)`, `run async ref(args)` | Managed workflow/script call. `async: true` on the `run async` capture position. |
+| `ensure_call` | `ensure ref(args)` | Managed rule call. |
+| `inline_script` | `` `body`(args) `` / `` ```lang...body...```(args) `` | Inline script body emitted as `scripts/__inline_<hash>`. |
+| `prompt` | `prompt body [returns "<schema>"]` | Sends body to the agent backend; JSON-quoted in transport. |
+| `match` | `match <subject> { … }` | Walks arms top-to-bottom; first match wins. |
+| `shell` | Free-form workflow body line; send RHS parse fallback | Workflow: unparsed line becomes an inline-shell `exec` step (rules forbid). Send: non-literal RHS fallback — usually `E_VALIDATE`. |
+| `bare_ref` | A bare symbol on a `send` RHS | Always rejected by the validator; preserved so the error can name the symbol. |
 
-When the callee declares named parameters, the compiler validates argument count:
+## `run` — execute a workflow or script
 
-```jaiph
-workflow greet(name) { log "Hello ${name}" }
+| Position | Allowed target |
+|---|---|
+| `run` in workflow | Workflow or named script. |
+| `run` in rule | Named script only. Workflows / rules are `E_VALIDATE`. |
+| `run async` | Workflows only. Inline scripts not supported. |
+| Inline-script `run` | Allowed in both workflows and rules. |
 
-workflow default() {
-  run greet("Alice")         # OK: 1 arg, 1 param
-  # run greet("A", "B")     — compile error: expects 1 argument
-  # run greet()             — compile error: expects 1 argument
-}
-```
+Capture rules:
 
-## Workflow Steps
+| Callee | Captured value |
+|---|---|
+| Workflow | Explicit `return` value of the callee. |
+| Named script | Trimmed stdout. |
+| Inline script | Trimmed stdout. |
+| Rule (`ensure`) | Explicit `return` value. |
 
-### `run` — Execute a Workflow or Script
+### Inline scripts
 
-Calls a workflow or script (in a workflow) or a script only (in a rule).
+Inline scripts embed a script body in a step without a separate `script` definition. Single backticks for one-liners, triple backticks for multiline or polyglot bodies.
 
 ```jaiph
-run setup_env()
-run lib.build_project(task)
-const output = run transform()
+run `echo hello`()
+const x = run `echo captured`()
+const y = run `date +%s`()
+run `echo $1-$2`("hello", "world")   # => hello-world
 ```
 
-**Capture:** For a workflow, captures the explicit `return` value. For a script or inline script, captures **trimmed** stdout on success (`node-workflow-runtime.ts` treats the emitted stdout string with `.trim()` when producing the capture value).
+| Aspect | Rule |
+|---|---|
+| Backtick form | `${…}` Jaiph interpolation is `E_PARSE`. Use `$1`, `$2`, … |
+| Fenced form | `${…}` passes through to the shell. Optional lang tag selects the interpreter (`` ```python3 `` → `#!/usr/bin/env python3`). |
+| Mixing fence tag + manual shebang | Error. |
+| Default shebang | `#!/usr/bin/env bash` when neither tag nor `#!` line is present. |
+| Emitted name | `scripts/__inline_<12-hex>`; deterministic across runs. |
+| `catch` / `recover` | Allowed on a standalone `run` step with inline-script body. Forbidden on inline scripts in `log` / `logerr` / `return` / `const` RHS. |
+| Subprocess env | Same `scope.env` as named scripts (runner `process.env` plus Jaiph metadata). Module `const` values are not auto-exported — pass via `$1`, `$2`. |
+| `run async` | Not supported. |
 
-### `run async` — Concurrent Execution with Handles
+### `run async` — concurrent execution with handles
 
-`run async ref(args)` starts a workflow or script concurrently and returns a **`Handle<T>`** — a value that resolves to the called function's return value on first non-passthrough read. `T` is the same type the function would return under a synchronous `run`.
+`run async ref(args)` starts the callee concurrently and returns a `Handle<T>` immediately. `T` is the same type a synchronous `run` would return.
 
 ```jaiph
 workflow default() {
-  # Start work without storing a binding — still tracked until this step list ends
   run async lib.task_a()
-
-  # Capture the handle for later use
   const h = run async lib.task_b()
-
-  # Reading the handle forces resolution (blocks until task_b completes)
-  log "${h}"
-}
-```
-
-**Handle resolution:** The handle resolves on first **non-passthrough** read — string interpolation, passing as a bare argument to `run` / `ensure` (rewritten to use `${name}`), comparison / regex tests in **`if`**, **`match`** on the handle variable, **`prompt`** bodies that mention `${h}`, **`send`** payloads that interpolate `${h}`, and similar paths that scan orchestration strings (full table in [Spec: Async Handles](spec-async-handles.md)).
-
-**Passthrough:** `const h = run async foo()` binds the opaque handle token **without awaiting** `foo()` on that line. A bare `run async foo()` also performs no handle read — it still registers the branch for joining.
-
-**Important:** Workflow **`const`** can use a bare identifier RHS (for example `const copy = h`); that desugars to string interpolation **`"${h}"`** in `parse/const-rhs.ts`, which **does** resolve a handle — unlike the initial async capture alone.
-
-**Implicit join:** When the **`executeSteps`** scope that created handles **finishes** (for example end of an `if` body, **`for`** body, or the outer workflow step list), the runtime awaits **every** `run async` handle registered there — including handles that were never read. Nested blocks join **their** handles before control continues outward. Failures aggregate like a synchronous step failure. This preserves backward compatibility with the pre-handle concurrency model while still allowing overlap until a read or a scope boundary forces ordering ([Spec: Async Handles](spec-async-handles.md#implicit-join)).
-
-**`recover` composition:** `recover` works with `run async` to provide retry-loop semantics on the async branch:
-
-```jaiph
-const b1 = run async foo() recover(err) {
-  log "repairing: ${err}"
-  run fix_it()
+  log "${h}"      # forces resolution of h (blocks until task_b finishes)
 }
 ```
 
-The async branch retries `foo()` using the same retry-limit semantics as non-async `recover` (default 10, configurable via `run.recover_limit`). The handle resolves to the eventual success value or the final failure. `catch` also works with `run async` for single-shot recovery (no retry loop).
-
-See [Spec: Async Handles](spec-async-handles.md) for the full value model.
+| Aspect | Behaviour |
+|---|---|
+| Resolution trigger | First non-passthrough read — string interpolation, argument to `run` / `ensure`, comparison in `if` / `match`, prompt body referencing `${h}`, channel `send` payload referencing `${h}`, or `const copy = h` (bare-identifier RHS desugars to `"${h}"`). |
+| Passthrough | Initial capture (`const h = run async foo()`), bare `run async` with no capture name. |
+| Implicit join | When the enclosing `executeSteps` scope exits, all remaining unresolved handles created there are joined. Failures aggregate like a synchronous step. |
+| `recover` / `catch` | Both work with `run async`. `recover` uses the same retry-limit semantics as non-async `recover` (`run.recover_limit`). |
+| Inline scripts | Not supported with `run async`. |
+| Rule scope | `run async` in a rule is `E_VALIDATE`. |
+| Progress display | Each branch is prefixed with subscript digits (₁, ₂, …) at the call site's indent level, in dispatch order. Nested branches get their own numbering scope. |
 
-Constraints: workflow-only (rejected in rules), inline scripts not supported with `run async`.
+See [Spec — Async Handles](spec-async-handles.md) for the full value model.
 
-### `ensure` — Execute a Rule
-
-Runs a rule and succeeds if its exit code is 0.
+## `ensure` — execute a rule
 
 ```jaiph
 ensure check_deps()
-ensure lib.validate(input)
-const result = ensure validator(path)
-```
-
-### `catch` — Failure Recovery
-
-Both `ensure` and `run` support a `catch` clause. On failure, the recovery body runs once. `catch` requires an explicit binding that receives merged stdout+stderr from the failed step.
-
-```jaiph
-# Single-statement recovery
-ensure install_deps() catch (failure) run fix_deps()
-
-# Block recovery
-run deploy(env) catch (err) {
-  log "Deploy failed, rolling back"
-  run rollback(env)
-}
-
-# Retry via recursion
-workflow deploy(env) {
-  ensure ci_passes() catch (failure) {
-    prompt "CI failed — fix the code."
-    run deploy(env)
-  }
+const result = ensure lib.validate(input)
+ensure ci_passes() catch (failure) {
+  log "ci failed: ${failure}"
 }
 ```
 
-Bare `catch` without a binding is a parse error. All call arguments must appear inside parentheses before `catch`.
+Succeeds when the rule's exit code is `0`. The capture binds the rule's explicit `return` value. `ensure` does not accept `recover` — only `catch`.
 
-### `recover` — Repair-and-Retry Loop
+## `catch` and `recover`
 
-`recover` is a first-class retry primitive for `run` steps. Unlike `catch` (which runs the recovery body once), `recover` implements a **loop**: try the target, and if it fails, bind the error, run the repair body, then retry. The loop stops when the target succeeds or when the retry limit is exhausted.
+Both attach to `run` (any form) or to `ensure` (`catch` only). The binding receives the merged stdout+stderr from the failed execution.
+
+| Form | Loop | Allowed on |
+|---|---|---|
+| `catch (name) <body>` | Runs the recovery body once on failure. | `ensure` and `run` (sync and async). |
+| `recover (name) <body>` | Retries the target after each repair body until success or `run.recover_limit` (default `10`). | `run` only (sync and async). |
 
 ```jaiph
-# Single-statement recovery loop
-run deploy() recover(err) run fix_deploy()
+run deploy() catch (err) run rollback()
 
-# Block recovery loop
 run deploy(env) recover(err) {
-  log "Deploy failed: ${err}"
+  log "deploy failed: ${err}"
   run auto_repair(env)
 }
 ```
 
-**Semantics:**
-
-1. Execute the `run` target.
-2. If it succeeds, continue (the `recover` body never runs).
-3. If it fails, bind merged stdout+stderr to the `recover` binding (e.g. `err`), execute the repair body, then go to step 1.
-4. If the retry limit is reached and the target still fails, the step fails with the last error.
-
-**Retry limit:** The default limit is **10** attempts. Override it per-module with the `run.recover_limit` config key:
-
-```jaiph
-config {
-  run.recover_limit = 3
-}
-
-workflow default() {
-  run flaky_step() recover(err) {
-    log "Retrying after: ${err}"
-    run repair()
-  }
-}
-```
-
-**Capture:** When the target eventually succeeds, `const name = run ref() recover(err) { … }` captures the result (same rules as plain `run` — `return` value for workflows, stdout for scripts).
+Validation rules:
 
-**Constraints:**
-- `recover` requires exactly one binding: `recover(name)`. Bare `recover` without bindings is a parse error.
-- All call arguments must appear inside parentheses **before** `recover`.
-- `recover` is only valid on **`run`** steps (`ensure` supports `catch`, not `recover`). It is allowed in both workflow and rule bodies. `recover` also works with `run async` — see [`run async`](#run-async--concurrent-execution-with-handles).
-- `recover` and `catch` are mutually exclusive on the same step — use one or the other.
+| Rule | Behaviour |
+|---|---|
+| Binding required | Exactly one binding. Bare `catch` / `recover` is `E_PARSE`. |
+| Argument placement | All call arguments inside `()` before `catch` / `recover`. |
+| Mutual exclusion | A single `run` step accepts `catch` or `recover` but not both. |
+| Inline-script position | `catch` / `recover` only on standalone `run` steps. Forbidden on inline scripts in `log` / `logerr` / `return` / `const` RHS. |
 
-### `prompt` — Agent Interaction
+## `prompt` — agent interaction
 
 Sends text to the configured agent backend. Three body forms:
 
-**String literal** (single-line):
-
-```jaiph
-prompt "Review the code for security issues"
-const answer = prompt "Summarize the report"
-```
-
-**Identifier reference** (existing binding):
-
-```jaiph
-const text = "Analyze this code"
-prompt text
-```
-
-**Triple-quoted block** (multiline):
-
-```jaiph
-prompt """
-You are a helpful assistant.
-Analyze the following: ${input}
-"""
-```
-
-All three forms work with capture (`const name = prompt …`).
-
-**Typed prompt** — ask the agent for structured JSON with `returns`:
-
-```jaiph
-const result = prompt "Analyze this code" returns "{ type: string, risk: string }"
-log "Type: ${result.type}, Risk: ${result.risk}"
-```
+| Body form | Syntax |
+|---|---|
+| Single-line literal | `prompt "Review the code"` |
+| Identifier | `prompt my_text` (`my_text` must be in scope) |
+| Triple-quoted | `prompt """\nMultiline body with ${vars}\n"""` |
 
-The schema is a flat comma-separated `{ field: type, … }` fragment — only `string`, `number`, and `boolean`; no nested objects or union syntax (`validatePromptReturnsSchema` in `src/transpile/validate-prompt-schema.ts`). Fields are exposed as dot accessors (`${result.type}`); the compiler checks those references against the declared fields.
+| Aspect | Rule |
+|---|---|
+| Capture | `const name = prompt …`. `name = prompt …` is `E_PARSE`. |
+| Typed `returns` | Flat `{ field: type, … }` with `string` / `number` / `boolean`. Stored verbatim as text per-field. |
+| Capture required when `returns` | `prompt … returns "…"` without `const` is `E_PARSE`. |
+| Dot notation | `${result.field}` requires that the base is a typed-prompt capture and the field appears in the schema. |
+| Rule scope | Forbidden — `prompt` and `const … = prompt` are `E_VALIDATE` inside rules. |
+| Transport retry | Transport failures retry on a backoff schedule; deterministic post-processing failures do not. See [Configuration — Prompt retry on transport failure](configuration.md#prompt-retry-on-transport-failure). |
 
-Prompts using `returns` must be captured (`const … = prompt … returns …`). A `returns` prompt without capture is rejected at compile time.
-
-Prompts are not allowed in rules.
-
-### `const` — Variable Binding
-
-Introduces an **immutable** variable in a workflow or rule body.
+## `const` — bind a value
 
 ```jaiph
 const tag = "v1.0"
 const message = """
-  Hello ${name},
-  Welcome to the project.
+  Hello ${name}
 """
 const result = run helper(arg)
 const check = ensure validator(input)
-const answer = prompt "Summarize the report"
+const answer = prompt "Summarize"
 const label = match status {
   "ok" => "success"
   _ => "failure"
 }
 ```
 
-A bare reference like `const x = ref(args)` is rejected — use `const x = run ref(args)`.
-
-**Immutability:** All bindings — parameters, `const` declarations, captures, and `script` names — are immutable within their scope. The compiler rejects:
-
-- Rebinding a parameter name via `const` (e.g. `workflow run(x) { const x = … }`)
-- Duplicate `const` declarations with the same name in the same scope
-- A `script` name that collides with an existing immutable binding
-
-The error names the conflicting binding and its origin:
-
-```
-E_VALIDATE: cannot rebind immutable name "x"; already bound as parameter at file.jh:1
-```
-
-### `log` and `logerr`
-
-`log` writes to stdout; `logerr` writes to stderr (shown with a red `!` marker in the progress tree).
+| RHS form | Notes |
+|---|---|
+| Double-quoted string | Single-line. Multi-line double-quoted is `E_PARSE`. |
+| Triple-quoted block | Multiline; supports `${…}`. |
+| `run` call / `run async` call / `ensure` call | Managed capture. |
+| `prompt` (any body form) | Optional `returns` schema. |
+| `match` expression | Walks arms; first match wins. |
+| Bare `ref(args)` | `E_PARSE` — wrap with `run` / `ensure` / `prompt`. |
+| `$(…)`, `${var:-fallback}`, etc. | `E_PARSE` in `const` RHS. |
 
-```jaiph
-log "Processing ${message}"
-logerr "Warning: ${name} not found"
-log status                   # bare identifier — logs the variable's value
-log """
-  Build started at ${timestamp}
-  Target: ${env}
-"""
-```
+All bindings — parameters, `const`, captures, `script` names — are immutable in their scope. The validator names the conflicting binding and its origin (`E_VALIDATE: cannot rebind immutable name "x"; already bound as parameter at file.jh:1`).
 
-Both accept single-line strings, triple-quoted blocks, bare identifiers, or **managed inline-script calls**:
-
-```jaiph
-log run `echo hello`()
-logerr run `echo $1`("details")
-```
-
-A managed inline-script call executes the script and logs its stdout. The `run` keyword is required — bare inline scripts (`log \`…\`()`) are rejected at compile time.
-
-### `fail`
-
-Aborts the workflow or rule with a message on stderr and non-zero exit.
-
-```jaiph
-fail "Missing required configuration"
-fail """
-  Multiple issues found:
-  - ${issue1}
-  - ${issue2}
-"""
-```
-
-### `return`
-
-Sets the managed return value in rules and workflows.
+## `return` — managed return value
 
 ```jaiph
 return "success"
 return "${result}"
-return response                        # bare identifier — returns the variable's value
-return """
-  Report for ${name}:
-  Status: ${status}
-"""
-```
-
-**Bare identifier** — `return response` is sugar for `return "${response}"`. The identifier must be in scope (`const`, capture, or parameter). Unknown identifiers produce a compile-time `E_VALIDATE` error naming the missing binding.
-
-**Direct managed call** — executes a target and uses its result as the return value:
-
-```jaiph
+return response                  # sugar for return "${response}"
 return run helper()
 return ensure check(input)
-return match status {
-  "ok" => "pass"
-  _ => "fail"
-}
+return match status { "ok" => "pass", _ => "fail" }
 return run `cat report.txt`()
-return run `echo $1`("arg")
 ```
 
-Inline scripts are supported with `return run \`…\`(args)`. The `run` keyword is required — bare inline scripts (`return \`…\`()`) are rejected at compile time.
-
+| Form | Notes |
+|---|---|
+| String / triple-quoted | Verbatim with interpolation. |
+| Bare identifier | Sugar for `return "${ident}"`. Unknown identifier is `E_VALIDATE`. |
+| `return run ref()` / `return ensure ref()` | Managed direct return. Requires `()`. `return run helper` without parens becomes a shell step. |
+| `return run \`…\`(args)` | Inline-script direct return. The `run` keyword is required. |
+| `return match … { … }` | Match expression as the return value. `return` inside an arm body is forbidden. |
+| Position | Only in `rule` and `workflow` bodies. Script bodies use `echo`/`printf`; bare `return 0` / `return $?` in a script are shell exit codes. |
 
-### `send` — Channel Messages
-
-Sends a message to a declared channel using `<-`.
+## `send` — channel message
 
 ```jaiph
 alerts <- "Build started"
 reports <- ${output}
 results <- run build_message(data)
 alerts <- """
-  Build report for ${project}:
-  Status: ${status}
+  Build report for ${project}
 """
 ```
 
-Combining capture and send (`name = channel <- …`) is a parse error.
-
-### `match` — Pattern Matching
+| Rule | Behaviour |
+|---|---|
+| RHS required | Bare `channel <-` is `E_PARSE`. |
+| Allowed RHS | Double-quoted string, triple-quoted block, `${ident}` / `${…}`, `run ref(args)` (with parens). |
+| Bare ref RHS | A bare workflow / rule / script name is `E_VALIDATE`. |
+| Combined capture | `name = channel <- …` is `E_VALIDATE` (`invalid send: channel must be a single name or …`). |
+| Allowed in | Workflows only. Rules forbid `send`. |
+| Dispatch | `send` enqueues on the active workflow context. After that workflow's steps complete successfully, the runtime drains the queue sequentially and runs each route target. Sends from nested workflows bubble to the nearest ancestor context that declares routes for the channel. See [Inbox & Dispatch](inbox.md). |
 
-Pattern match on a string variable. The subject is a bare identifier (no `$` or `${}`). Arms are tested top-to-bottom; first match wins.
+## `log` / `logerr` / `fail`
 
 ```jaiph
-match status {
-  "ok" => "all good"
-  /err/ => "something went wrong"
-  _ => "unknown"
-}
+log "Processing ${message}"
+logerr "Warning: ${name} not found"
+log status                       # bare identifier — same as log "${status}"
+log run `date +%s`()             # inline-script form (run keyword required)
+log """
+  Build started at ${timestamp}
+"""
+fail "Missing configuration"
 ```
 
-Patterns can be string literals (exact equality), regex (`/pattern/`), or `_` (default). Exactly one default arm is required. Arms are **newline-delimited** — commas between or after arms are rejected at parse time (`"commas are not allowed in match arms; use one arm per line"`).
-
-**Arm bodies** — the value expression after `=>`. Allowed: string literals (`"…"` or `"""…"""`), bare in-scope identifiers (`const`, capture, or parameter), `$var`/`${var}` interpolation, `fail "…"`, `run ref(…)`, `ensure ref(…)`. A bare word that is not an in-scope variable is rejected at compile time with `E_VALIDATE` (`unknown identifier "…" in match arm body`) — this catches typos like `_ => true` or `_ => blorp` that would otherwise silently become string literals. The `return` keyword inside an arm body is forbidden — use `return match x { … }` at the outer level. Inline script forms (backtick) are also forbidden in arms; use named scripts.
-
-**Runtime execution** — arm bodies are not merely string values. Each form executes at runtime:
-- `fail "message"` aborts the workflow with a non-zero exit and the given message.
-- `run ref(args)` executes the named script or workflow and captures its return value.
-- `ensure ref(args)` executes the named rule and captures its return value.
-- String literals and variable references evaluate to their string value as before.
+| Statement | Effect |
+|---|---|
+| `log` | Writes to the run's stdout stream. Double-quoted messages store backslash sequences literally; use triple-quoted `log """…"""` for multiline text. |
+| `logerr` | Writes to stderr. Displayed with `!` marker in the progress tree. |
+| `fail` | Aborts the workflow or rule with a stderr message and non-zero exit. |
 
-When a `const` step uses a `match` expression containing `run` or `ensure` arms, the CLI progress tree surfaces the nested script/workflow/rule targets as child steps (e.g. `▸ script safe_name` / `✓ script safe_name`), consistent with top-level `run` steps.
+Bare inline scripts in `log` / `logerr` (`log \`…\`()`) are `E_PARSE` — use `log run \`…\`(args)`.
 
-**Multiline arm bodies** — triple-quoted:
+## `if` — conditional guard
 
 ```jaiph
-match mode {
-  "verbose" => """
-Detailed output enabled.
-All logs will be shown.
-  """
-  _ => "standard"
+if status == "ok" {
+  log "healthy"
+} else {
+  logerr "unhealthy: ${status}"
 }
-```
-
-**Expression form** — works with `const` and `return`:
 
-```jaiph
-const label = match status {
-  "ok" => "success"
-  _ => "failure"
+if message =~ /ERROR/ {
+  logerr "matched error pattern"
 }
 ```
 
-The outer `return` in `return match x { … }` applies to the whole match expression and remains valid.
+| Aspect | Rule |
+|---|---|
+| Subject | Bare identifier or `IDENT.IDENT` (typed-prompt field access). |
+| Operators | `==`, `!=` with double-quoted strings; `=~`, `!~` with `/regex/`. Mixing kinds is `E_PARSE`. |
+| `else` | Optional. `} else {` must be on a single line. `else if` chaining is not supported — nest `if` inside the `else` block or use `match`. |
+| Value production | `if` is a statement. For value branching use `match`. |
+| Async handles | Resolved before the comparison. |
+| Allowed in | Workflows and rules. |
 
-### `if` — Conditional Guard
-
-Simple conditional that executes a block when a string comparison holds. No `else` branch — use `match` for exhaustive value branching.
+## `match` — pattern match
 
 ```jaiph
-if param == "" {
-  fail "param was not provided"
-}
-
-if mode =~ /^debug/ {
-  log "Debug mode enabled"
+match status {
+  "ok" => "all good"
+  /err/ => "something went wrong"
+  _ => "unknown"
 }
 ```
 
-The subject is a bare identifier (no `$` or `${}`). Operators:
+| Aspect | Rule |
+|---|---|
+| Subject | Bare identifier or `IDENT.IDENT`. `$var` / `${var}` is `E_PARSE`. |
+| Patterns | String literal (exact equality), `/regex/`, or `_` (wildcard — exactly one required). |
+| Arm delimiter | Newlines. Commas between arms are `E_PARSE`. |
+| Arm bodies | String literal, triple-quoted block, bare in-scope identifier, `$var` / `${var}`, `fail "…"`, `run ref(…)`, `ensure ref(…)`. |
+| Disallowed in arms | `return` (use `return match … { … }` outside), inline scripts, unknown bare identifiers (`E_VALIDATE: unknown identifier "…" in match arm body; declare it with "const", use a capture, or add a parameter`). |
+| Expression form | Usable with `const x = match …` or `return match …`. |
 
-| Operator | Meaning | Operand type |
-|---|---|---|
-| `==` | exact string equality | `"string"` |
-| `!=` | string inequality | `"string"` |
-| `=~` | regex match | `/pattern/` |
-| `!~` | regex non-match | `/pattern/` |
+When a `const x = match …` step contains arms with `run` / `ensure`, the progress tree surfaces the called targets as child steps of the `const` row.
 
-The body is a brace block containing any valid workflow/rule steps. `if` is a statement — it does not produce a value, so it cannot be used with `const` or `return`.
+## `for` — iterate lines of a string
 
 ```jaiph
-workflow default(env) {
-  if env != "production" {
-    log "Skipping deploy for non-production env"
-    return ""
-  }
-  run deploy()
-}
-```
-
-
-### `for` — Iterate lines of a string
+const paths = """
+docs/a.md
+docs/b.md
+"""
 
-```jaiph
-for line in paths_blob {
-  if line != "" {
-    run process_one(line)
-  }
+for path in paths {
+  log "${path}"
 }
 ```
 
-`for <identifier> in <identifier> { … }` splits the **string value** of the right-hand variable on newlines (`\r\n` is normalized to `\n`). If the string ends with a final newline, the trailing empty segment is **not** iterated (so `"a\nb\n"` yields two lines, not three). **Interior** empty lines are still yielded as empty strings. There is **no** automatic trimming of whitespace; use an `if` guard, `match`, or a script when you need to skip blanks or strip indentation.
+| Aspect | Rule |
+|---|---|
+| Source variable | Must already hold a string (`const`, capture, parameter). Unknown name is `E_VALIDATE`. |
+| Line splitting | Splits on `\n` (normalises `\r\n`). A trailing newline does not yield an empty final line. Interior empty lines are yielded. |
+| Iterator name | Subject to the immutable-binding rules of the surrounding scope. After the loop, the iterator remains bound to the last line. |
+| Allowed in | Workflows and rules. |
 
-The iterator name must not conflict with an existing parameter, `const`, or capture in the same scope. After the loop completes, the iterator variable remains set to the last line visited (same shared scope as other workflow bindings).
+## String interpolation
 
-## Inline Scripts
-
-Embed a shell command directly in a step without a named `script` definition. Single backticks for one-liners, triple backticks for multiline.
-
-```jaiph
-run `echo hello`()
-const x = run `echo captured`()
-const y = run `date +%s`()
-```
-
-Arguments are passed in parentheses after the closing backtick(s) and available as `$1`, `$2`, …:
-
-```jaiph
-run `echo $1-$2`("hello", "world")   # prints: hello-world
-```
-
-**Fenced block form** for multiline or polyglot:
-
-<pre><code>run ```python3
-import sys
-print(f"args: {sys.argv[1:]}")
-```()
-</code></pre>
-
-Inline scripts use the same emission layout (`scripts/__inline_<hash>`) and the same **`NodeWorkflowRuntime` spawn contract** as named scripts (full scope env, cwd from `JAIPH_WORKSPACE` / module path — see [Script isolation](#script-isolation)). `run async` with inline scripts is not supported.
-
-## String Interpolation
-
-Jaiph orchestration strings support `${identifier}` interpolation. Every identifier must reference a binding in scope (`const`, capture, or named parameter). Unknown names are rejected at compile time.
-
-| Form | Description | Where |
+| Form | Status | Where |
 |---|---|---|
-| `${varName}` | Variable reference | All orchestration strings |
-| `${var.field}` | Typed prompt field access | All orchestration strings |
-| `${run ref(args)}` | Inline capture — executes and inlines result | All orchestration strings |
-| `${ensure ref(args)}` | Inline capture — executes rule and inlines result | All orchestration strings |
-| `$1`, `$2` | Positional args (bash convention) | Script bodies — syntax depends on interpreter |
+| `${ident}` | Primary | All orchestration strings. |
+| `${var.field}` | Typed-prompt field access | All orchestration strings. |
+| `${run ref(args)}` | Inline capture — executes and inlines stdout / return value. | All orchestration strings. |
+| `${ensure ref(args)}` | Inline capture — executes a rule and inlines result. | All orchestration strings. |
+| `$ident` (no braces) | `E_PARSE` in orchestration strings. | — |
+| `$1`, `$2`, … | Positional args | `script` bodies only (interpretation depends on the interpreter). |
+| `${var:-fallback}`, `${var%%…}`, `${var//…}`, `${#var}` | `E_PARSE` in orchestration strings and backtick scripts; passes through in fenced scripts. | — |
+| `$(…)` | `E_PARSE` in orchestration strings. | — |
 
-`$varName` (without braces) is rejected — always use `${varName}`. Shell expansions like `${var:-fallback}`, `$(…)`, and `${#var}` are rejected in orchestration strings.
-
-**Inline captures** execute a call directly inside the string:
-
-```jaiph
-log "Got: ${run some_script()}"
-log "Status: ${ensure check_ok()}"
-```
+If an inline capture fails, the enclosing step fails. Nested inline captures (`${run foo(${run bar()})}`) are `E_PARSE` — extract the inner call to a `const`.
 
-If the inline capture fails, the enclosing step fails. Nested inline captures are rejected — extract the inner call to a `const`.
+## Rule scope restrictions
 
-## Script isolation
+Rules accept the same step set as workflows except:
 
-**Emitted script files** do not embed module `const` values or other Jaiph “shims” — the transpiler writes the authored body plus a shebang (see `emitScriptsForModule` / `emit-script.ts`). Anything a script needs from the module must be passed as **positional arguments** (`$1`, `$2`, …), read from paths under `JAIPH_WORKSPACE`, or live in shared script sources (`import script`).
+| Step / form | Rule scope |
+|---|---|
+| `prompt` | Forbidden. |
+| `const … = prompt …` | Forbidden. |
+| `send` (`<-`) | Forbidden. |
+| `run async` | Forbidden. |
+| `run` to a workflow | Forbidden (`run` in rules targets scripts only). |
+| Raw shell lines | Forbidden (every line must be a recognised Jaiph step). |
+| `catch` / `recover` on `run` | Allowed. |
+| `for`, `if`, `match` | Allowed. |
 
-**Subprocess environment (`NodeWorkflowRuntime`):** Managed **script** steps (`run` on a named script, script import, or inline `` `…` `` / fenced body), and **workflow inline shell** lines, all use the same **`scope.env`**: the runner’s `process.env` as adjusted by Jaiph (for example `JAIPH_SCRIPTS`, `JAIPH_WORKSPACE`, `JAIPH_RUN_DIR`, `JAIPH_ARTIFACTS_DIR`, prompt-related `JAIPH_AGENT_*` when set, and keys derived from `config { … }`). It is **not** reset to a small fixed allowlist; anything visible to the workflow runner is visible to child processes unless your deployment strips the parent environment.
+Compile-time enforcement: `validate-step.ts` consults `RULE_SCOPE.allowSteps`.
 
-**Interpolation rules by body form:**
+## Subprocess environment
 
-- **Backtick** (single-line): `${...}` is forbidden — the compiler rejects it to prevent ambiguity with shell expansion. Use `$1`, `$2` positional arguments.
-- **Fenced block** (triple-backtick): `${...}` passes through to the shell as standard shell parameter expansion.
+Managed script steps (`run` to a named script, `import script`, inline scripts) and workflow inline-shell lines all use the same `scope.env`: the runner's `process.env` augmented by Jaiph (`JAIPH_WORKSPACE`, `JAIPH_SCRIPTS`, `JAIPH_RUN_DIR`, `JAIPH_ARTIFACTS_DIR`, `JAIPH_RUN_ID`, `JAIPH_RUN_SUMMARY_FILE`, prompt-related `JAIPH_AGENT_*`, and keys derived from `config { … }`). This is **not** an `env -i`-style wipe — anything the runner sees, the child sees, unless explicitly stripped.
 
-## Step Output Contract
+Module `const` values are **not** automatically exported into script environments. Pass them as positional arguments (`$1`, `$2`, …) or read Jaiph-provided variables.
 
-Every step produces three outputs: status, value, and logs.
+## Step output contract
 
-| Step | Status | Capture value (`x = …`) | Logs |
+| Step | Status | Capture value | Logs |
 |---|---|---|---|
-| `ensure rule` | exit code | explicit `return` value | artifacts |
-| `run workflow` | exit code | explicit `return` value | artifacts |
-| `run script` | exit code | trimmed stdout | artifacts |
-| `run` inline | exit code | trimmed stdout | artifacts |
-| `prompt` | exit code | final assistant answer | artifacts |
-| `log` / `logerr` | always 0 | — | event stream |
-| `fail` | non-zero (abort) | — | stderr |
-| `run async` | aggregated | `Handle<T>` — resolves to return value on read | artifacts |
-| `const` | same as RHS | binds locally | — |
-
-## Lexical Notes
-
-- **Identifiers:** `[A-Za-z_][A-Za-z0-9_]*`
-- **References:** `IDENT` (local) or `IDENT.IDENT` (module-qualified)
-- **Comments:** Full-line `#` comments
-- **Blank lines:** Preserved as visual grouping between steps; consecutive blanks collapsed by `jaiph format`
-- **Shebang:** A `#!` first line of the file is ignored by the parser
-- **String quoting:** `"..."` for single-line, `"""..."""` for multiline. Single-quoted strings are parse errors. Use `\"` for literal double quotes, `\\` for literal backslashes
-- **Unified namespace:** Channels, rules, workflows, scripts, script import aliases, and top-level `const` share one namespace per module
-- **Recursion limit:** Hard depth limit of 256 at runtime
+| `ensure rule` | rule exit code | explicit `return` value | rule artifacts |
+| `run workflow` | workflow exit code | explicit `return` value | workflow artifacts |
+| `run script` (named) | script exit code | trimmed stdout | script `.out` / `.err` |
+| `` run `…`() `` (inline) | script exit code | trimmed stdout | script `.out` / `.err` |
+| `prompt` | prompt exit code | final assistant answer | transcript artifacts |
+| `log` / `logerr` | always 0 | empty | event stream + stdout/stderr |
+| `fail` | non-zero (abort) | empty | stderr |
+| `run async` | aggregated | `Handle<T>` resolving on read | async step artifacts |
+| `const` | same as RHS step | empty (binds local) | n/a |
+
+## Recursion limit
+
+The runtime enforces a hard recursion depth limit of `256` (`MAX_RECURSION_DEPTH` in `src/runtime/kernel/runtime-arg-parser.ts`). Exceeding the limit produces a runtime error. The depth is the active workflow / rule call chain (not script subprocesses). There is no environment variable override.
+
+## Related
+
+- [Grammar](grammar.md) — formal EBNF, lexical rules, validation catalog.
+- [Configuration](configuration.md) — config keys consumed at runtime.
+- [Inbox & Dispatch](inbox.md) — `send` queueing and route execution semantics.
+- [Spec — Async Handles](spec-async-handles.md) — handle resolution and join semantics.
+- [Environment variables](env-vars.md) — variables visible to workflows, rules, and scripts.
diff --git a/docs/libraries.md b/docs/libraries.md
index 4e65e296..673a635f 100644
--- a/docs/libraries.md
+++ b/docs/libraries.md
@@ -1,67 +1,60 @@
 ---
-title: Libraries
-permalink: /libraries
+title: Use & publish a library
+permalink: /how-to/libraries
+diataxis: how-to
 redirect_from:
+  - /libraries
   - /libraries.md
 ---
 
-# Libraries
+# Use & publish a library
 
-## Why workspaces and `.jaiph/libs`
+This recipe installs a reusable Jaiph library into your workspace, imports it from a workflow, and (in the second half) publishes a library of your own.
 
-Workflow authoring usually needs **shared modules**: reusable rules, scripts, and small packaged workflows people can version and reuse across projects.
+A **Jaiph library is a public git repository** containing at least one `.jh` module anywhere in the tree. Imports written as `lib-name/path` resolve to `<workspace>/.jaiph/libs/<lib-name>/<path>.jh` after `jaiph install` clones the library into that directory.
 
-Jaiph avoids a machine-wide library path: resolution is anchored to a **workspace** (detected directory root; see below). Modules you own live next to your entry `.jh`; **third-party clones** conventionally live under **`<workspace>/.jaiph/libs/<name>/`**, wired up by **`jaiph install`**. Imports that look like **`lib-name/rest/of/path`** attach to those directories when relative resolution misses.
+## Prerequisites
 
-This page covers that layout, **`import`** resolution (**`resolveImportPath`** in `src/transpile/resolve.ts`), **`jaiph install`**, and the first-party **`jaiphlang/`** helpers shipped in **this repo** under `.jaiph/libs/jaiphlang/`. Validator behavior crosses into [Architecture — Core components](architecture.md#core-components). Grammar for import/export syntax lives in [Grammar — Imports and Exports](grammar.md#imports-and-exports).
+- Run commands from your project directory. `jaiph install` detects the workspace root from the current directory (walks up for `.jaiph` or `.git`, with temp-directory guards; if no marker is found, the starting directory is used).
+- `git` on `PATH`.
 
-## How imports resolve
+## Part A — Use a library
 
-Resolution runs in **`resolveImportPath`** — order:
+### 1. Install by name or URL
 
-1. **Relative to the importing file** — e.g. `import "./foo"`, `import "../lib/util"`. Paths without a `.jh` suffix get **`.jh`** appended automatically.
-2. **Library fallback** — only if step 1’s candidate path **does not exist on disk**, **`workspaceRoot`** is set, **and** the import string **`contains`** a **`/`**. The first `/` splits **`lib-name`** from **`rest`**, then the compiler looks for **`<workspace>/.jaiph/libs/<lib-name>/<rest>.jh`** (same extension defaulting).
-
-Implications:
+```bash
+# Resolve a registry name (uses JAIPH_REGISTRY, default https://jaiph.org/registry)
+jaiph install jaiphlang
 
-- **Imports without `/`** — e.g. **`import "submod"`** — only relative-to-file lookup is attempted; there is **no** library fallback under `.jaiph/libs/` even if a matching folder name exists.
-- **`jaiph compile`** runs the same **`validateReferences`** check as **`jaiph run`** but does not emit **`scripts/`** or invoke **`buildRuntimeGraph()`** ([Architecture — Summary](architecture.md#summary)).
+# Pin a registry name to a version
+jaiph install mylib@v1.2
 
-**Workspace root:** whatever the invoking CLI path passes into **`emitScriptsForModule`** / **`validateReferences`**:
+# Clone a git URL directly into .jaiph/libs/<name>/
+jaiph install https://github.com/you/queue-lib.git
 
-- **`jaiph run`** and **`jaiph test`** on an explicit **`*.jh` / `*.test.jh`** file use **`detectWorkspaceRoot(dirname(entry))`** (same predicate for both commands).
-- **`jaiph test`** with **no** file argument discovers tests under **`detectWorkspaceRoot(process.cwd())`** (`src/cli/commands/test.ts`).
-- **`jaiph install`** uses **`detectWorkspaceRoot(process.cwd())`**.
-- **`jaiph compile`** uses **`detectWorkspaceRoot(dirname(file))`** per validated module by default, or **`--workspace <dir>`** to pin one root for the whole command (`src/cli/commands/compile.ts`).
+# Pin a branch or tag
+jaiph install https://github.com/you/queue-lib.git@v1.0
+```
 
-Walk-up rules (`.jaiph` / `.git` markers, temp-directory guards) match [CLI — `jaiph install`](cli.md#jaiph-install).
+The argument shape decides the path. A token matching `/^[A-Za-z0-9_-]+(@[A-Za-z0-9._+/-]+)?$/` with no `/` and no `:` is a **registry name** and is resolved through the index. Everything else is parsed as a **git URL** (optional `@<ref>` suffix for branch or tag).
 
-**Export visibility:** if an imported module declares **any** `export`, only those names are valid through the alias; otherwise **every** top-level workflow, rule, and script in that file is reachable ([Architecture — Core components](architecture.md#core-components)). First-party **`jaiphlang/*`** modules typically use explicit `export` lines; **`jaiphlang/git`** is the odd one out (see below).
+Registry names install into `.jaiph/libs/<name>/` using the registry key. Git URLs install into `.jaiph/libs/<derived-name>/`, where `<derived-name>` is the last URL path segment without the `.git` suffix — the import prefix may differ from a registry name for the same repository.
 
-**Limitation:** **`import script "…"`** paths are validated with **`resolveScriptImportPath`**: **only** relative to the importing file’s directory — **no** workspace library fallback (`src/transpile/validate.ts`).
+`jaiph install` shallow-clones (`git clone --depth 1`) each missing library, removes the nested `.git` directory, and writes a `.jaiph/libs.lock` entry recording the resolved URL, optional version, and the 40-char commit captured before `.git` was removed. Existing directories are skipped unless you pass `--force`. Commit the lockfile.
 
-## Installing third-party libraries
+### 2. Restore from the lockfile
 
 ```bash
-# Clone into .jaiph/libs/<name>/ (shallow git clone) and update the lockfile
-jaiph install https://github.com/you/queue-lib.git
-
-# Pin a branch or tag (common shape: …/.git@ref — passed to git clone --branch)
-jaiph install https://github.com/you/queue-lib.git@v1.0
-
-# Restore all libraries from the lockfile (e.g. after git clone or in CI)
 jaiph install
 ```
 
-`jaiph install` writes **`.jaiph/libs.lock`** under the workspace root. Commit the lockfile; add **`.jaiph/libs/`** to `.gitignore` if you do not want vendored clones in version control. If **`.jaiph/libs/<name>/`** already exists, the clone is skipped unless you pass **`--force`** (URL / `@ref` parsing: [CLI — `jaiph install`](cli.md#jaiph-install)).
+With no arguments, `jaiph install` restores every entry in `.jaiph/libs.lock`: it clones any missing library directory (existing directories are skipped unless you pass `--force`). When a lock entry includes a `commit`, the cloned HEAD must match it; on mismatch the directory is removed and the run fails with the locked vs cloned SHAs. Lock entries without `commit` (older lockfiles) restore without that check. The registry is never read on this path.
 
-The clone directory name is **`deriveLibName(url)`** (last path segment, **`.git`** stripped), so imports use that segment as **`lib-name`**.
+### 3. Import from a workflow
 
-## Example: `import` from a clone under `.jaiph/libs/`
+The clone directory name is the import prefix. For `jaiph install jaiphlang`, the lib lives at `.jaiph/libs/jaiphlang/` and imports use the `jaiphlang/` prefix:
 
-After `jaiph install`, paths like **`queue-lib/queue`** resolve like any other library layout. Below assumes **`.jaiph/libs/jaiphlang/`** exists (copy from this repo or install a repo whose root name is **`jaiphlang`**).
-
-```jaiph
+```jh
 import "jaiphlang/queue" as q
 
 workflow default() {
@@ -71,74 +64,82 @@ workflow default() {
 }
 ```
 
-## The `jaiphlang/` standard libraries
+Imports without `/` only attempt relative-to-file lookup; the library fallback is skipped.
+
+### 4. Verify
+
+```bash
+ls .jaiph/libs/jaiphlang/         # cloned files, no nested .git
+cat .jaiph/libs.lock              # one entry per installed library
+jaiph run ./flow.jh               # imports must resolve at compile time
+```
+
+A clone with no `.jh` files anywhere in the tree is rejected with `lib "<name>" contains no .jh modules — not a jaiph library?` and the directory is removed before any lock entry is written.
+
+## Part B — Publish a library
+
+Publishing is git-native — no package registry upload, no build step.
+
+### 1. Lay out the repo
 
-The **`jaiphlang/`** prefix is a **naming convention** for first-party helper modules maintained **in this repository** under **`.jaiph/libs/jaiphlang/`**. They are **not** bundled inside the published npm **`jaiph`** package; copy that tree into your workspace or track it in git so **`import "jaiphlang/…"`** resolves. They use the same **`import` / `export workflow` / `export rule`** pattern as any other library (except **`git`**, see below).
+A library is a git repository of `.jh` modules plus any companion script files those modules reference. Two common shapes:
 
-### `jaiphlang/queue` — `QUEUE.md` task queue
+- **Single-file lib** — `repo-root/queue.jh`, imported as `"queue-lib/queue"` when installed as `queue-lib`.
+- **Multi-module lib** — several `.jh` files (at the repo root or in subdirectories), each imported as `"<install-name>/<path>"` without the `.jh` suffix (for example `"mylib/subdir/helper"` for `subdir/helper.jh`).
 
-Manages a markdown task file **`QUEUE.md`** at **`${JAIPH_WORKSPACE:-.}`** (`queue.jh` + `queue.py`). Sections use **`##`** headers; tags are **`#hashtags`** on the header line (e.g. **`## My task #dev-ready`**). **`python3`** must be on **`PATH`** when steps run the imported **`queue.py`** script.
+Companion scripts (e.g. `queue.py` next to `queue.jh`) must be referenced with **relative paths** — `import script "./queue.py"` — because `import script` has no workspace-libs fallback.
 
-| Symbol | Kind | Description |
-|--------|------|-------------|
-| `get_first_task()` | workflow | Returns the first task block (header + body) via **`queue("get")`**. |
-| `next_task(tag)` | workflow | Returns the first task whose header carries the given tag (tag name without `#`). |
-| `get_task_by_header(header)` | workflow | Returns a task by title; tags stripped for matching. |
-| `get_all_task_headers()` | workflow | Newline-separated task titles (no `##` prefix); calls **`queue("headers")`** with no extra args, so **all** tasks are listed (the Python **`headers`** subcommand accepts an optional tag when run directly from the CLI, but this workflow does not expose that). |
-| `mark_task_dev_ready(header)` | workflow | Adds **`#dev-ready`** to the matching header. |
-| `remove_completed_task(header)` | workflow | Removes the task with that title. |
-| `set_task_description_from_file(header, bodyPath)` | workflow | Replaces body text from a UTF-8 file; header unchanged. |
-| `has_tasks()` | rule | Passes if the queue has at least one task. |
-| `task_is_dev_ready(task)` | rule | Passes if the task text has **`#dev-ready`** on the header line. |
-| `all_dev_ready()` | rule | Passes if every task has **`#dev-ready`**. |
+### 2. Decide the public surface
 
-The module also defines a **`default`** workflow for **direct CLI** use (arguments pass through to the Python helper). Examples:
+Add `export` to the workflows, rules, and scripts you want importers to see:
+
+```jh
+export workflow get_first_task() { … }
+export rule has_tasks() { … }
+```
+
+A module with **zero** `export` lines exposes every top-level rule, workflow, and script through the import alias. Prefer explicit `export` on published libraries so removing a private helper does not break consumers.
+
+### 3. Tag a release
 
 ```bash
-jaiph .jaiph/libs/jaiphlang/queue.jh headers
-jaiph .jaiph/libs/jaiphlang/queue.jh get dev-ready
-jaiph .jaiph/libs/jaiphlang/queue.jh json
+git tag v0.1.0
+git push --tags
 ```
 
-### `jaiphlang/artifacts` — publishing files out of the sandbox
+Consumers pin to that tag with `jaiph install <name>@v0.1.0` or `jaiph install <url>.git@v0.1.0`. The ref is passed straight to `git clone --branch`; the resolved 40-char commit is recorded in `.jaiph/libs.lock` so restore is reproducible even when the tag later moves.
 
-Copies files from the **workspace** (or sandbox overlay) into the run’s **`artifacts/`** tree so they remain on the host after Docker teardown or process exit. The runtime sets **`JAIPH_ARTIFACTS_DIR`** to the writable directory for the current run. See [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout) and [Sandboxing](sandboxing.md) for the read-only workspace contract in Docker.
+### 4. (Optional) List on `jaiph.org/registry`
 
-```jaiph
-import "jaiphlang/artifacts" as artifacts
+To let consumers install by bare name, open a PR against [`jaiphlang/registry`](https://github.com/jaiphlang/registry) adding an entry to `registry.json` under a unique key matching `/^[A-Za-z0-9_-]+$/`:
 
-workflow default() {
-  # Single file:
-  const path = run artifacts.save("./build/output.bin")
-
-  # Or several files at once — newline-separated list of paths:
-  const paths = """
-  a.txt
-  b/nested.txt
-  """
-  const dests = run artifacts.save(paths)
+```json
+{
+  "libs": {
+    "<your-name>": {
+      "url": "https://github.com/<you>/<repo>.git",
+      "description": "<one line>"
+    }
+  }
 }
 ```
 
-**Exported workflow**
+The key is the import prefix consumers will write (`import "<your-name>/…"`). After the PR merges upstream, maintainers of the Jaiph repo run `npm run registry:build`, commit the updated `docs/registry`, and push — GitHub Pages then serves the index at `https://jaiph.org/registry`.
+
+## Verification
 
-| Workflow | Description |
-|----------|-------------|
-| `save(paths)` | **`paths`** is a single file path or a **newline-separated** list of file paths. Blank lines are ignored. Each file is copied to **`${JAIPH_ARTIFACTS_DIR}/…`** preserving relative layout (`./` stripped; absolute sources use **`basename`** only). Returns absolute destination path(s), one per line, in order. Exits with failure if the list is empty after trimming, any path is missing, or **`JAIPH_ARTIFACTS_DIR`** is unset. |
+For a consumer:
 
-### `jaiphlang/git` — git hygiene helpers and an example commit flow
+- `.jaiph/libs/<name>/` exists with the expected `.jh` modules.
+- `jaiph run ./flow.jh` compiles without `E_IMPORT_NOT_FOUND`.
+- `.jaiph/libs.lock` records the resolved URL and commit.
 
-**`git.jh`** defines rules and workflows **without** **`export`** keywords. With **zero** `export` lines, the compiler does **not** hide any top-level names: importers may reference **every** **`rule`** and **`workflow`** in that file. Prefer explicit **`export`** in libraries you publish so only a stable surface is reachable.
+For a publisher:
 
-The module mixes small rules around **`git status`** / **`git rev-parse`** with **`commit(task)`** / **`default(task)`** workflows that drive a **`prompt`** to stage/commit and write **`git format-patch -1 HEAD --stdout`** to a **`*.patch`** path. This file is **opinionated** (default **`config`** block targets the Cursor agent); read **`.jaiph/libs/jaiphlang/git.jh`** before trimming or reusing.
+- A fresh clone of your lib by URL (`jaiph install <url>.git@<tag>`) resolves and runs.
+- Removing an unexported private name does not break consumers when the module uses explicit `export` lines (only exported names are reachable).
 
-| Symbol | Kind | Description |
-|--------|------|-------------|
-| `in_git_repo()` | rule | Passes when **`git rev-parse --is-inside-work-tree`** succeeds (after marking the workspace as a safe directory). |
-| `branch_clean()` | rule | Passes when **`git status --porcelain`** is empty. |
-| `has_changes()` | rule | Passes when there are porcelain changes (fails on a clean tree). |
-| `is_clean()` | rule | Passes when **`in_git_repo()`** **and** **`branch_clean()`** both pass (their **`ensure`** calls are inlined in this rule). |
-| `commit(task)` | workflow | Ensures repo + changes, runs **`prompt`**, writes patch file, returns path. |
-| `default(task)` | workflow | Runs **`commit(task)`** (same **`return`**). |
+## Related
 
-Use **`jaiphlang`** modules as patterns for your own libs: thin **`script`** wrappers, composable **`rule`** constructs, and workflows built on both.
+- [Architecture — Local module graph](architecture.md#local-module-graph) — how `<lib>/<path>` imports resolve through `.jaiph/libs/`.
+- [Save artifacts](/how-to/artifacts) — the `jaiphlang/artifacts` library covered there is one example consumer.
diff --git a/docs/registry b/docs/registry
new file mode 100644
index 00000000..901aff32
--- /dev/null
+++ b/docs/registry
@@ -0,0 +1,8 @@
+{
+  "libs": {
+    "jaiphlang": {
+      "url": "https://github.com/jaiphlang/jaiphlang.git",
+      "description": "Jaiph standard library: artifacts, git, queue"
+    }
+  }
+}
diff --git a/docs/sandbox-run.md b/docs/sandbox-run.md
new file mode 100644
index 00000000..b82e2a5a
--- /dev/null
+++ b/docs/sandbox-run.md
@@ -0,0 +1,93 @@
+---
+title: Run in a Docker sandbox
+permalink: /how-to/sandbox-run
+diataxis: how-to
+---
+
+# Run a workflow in a Docker sandbox
+
+This recipe runs a `.jh` workflow inside the Docker sandbox, picks the right workspace-presentation mode, and bypasses the confirmation prompt in CI.
+
+For the design (what the sandbox protects against, what it does not), see [Sandboxing](sandboxing.md). This page is the enabling procedure only.
+
+## Prerequisites
+
+- Docker installed and `docker info` succeeds on the host.
+- An entry `.jh` file with a `default` workflow.
+- Agent credentials forwarded into the container if the workflow uses `prompt` — see [Authenticate agent backends](/how-to/agent-auth).
+
+## 1. Run with the default sandbox
+
+```bash
+jaiph run ./flow.jh
+```
+
+Docker is **on by default**. The CLI picks the workspace-presentation mode automatically:
+
+- **Overlay mode** when `/dev/fuse` exists on the host (typically Linux). Reads come from the read-only host workspace; writes land in a `fuse-overlayfs` upper layer and are discarded at container exit.
+- **Copy mode** when `/dev/fuse` is missing (typically macOS Docker Desktop), or when `JAIPH_DOCKER_NO_OVERLAY=1` or `JAIPH_DOCKER_NO_OVERLAY=true` is set. The CLI clones the workspace into `.jaiph/runs/.sandbox-<id>/` (or `<runs-root>/.sandbox-<id>/` when `JAIPH_RUNS_DIR` overrides the default) and mounts the clone read-write.
+
+In both modes the host checkout is unmodified after the run. Run artifacts always land under host `.jaiph/runs/` via a separate read-write mount.
+
+## 2. Pick inplace mode for live edits
+
+When you want the run's edits to land **live on the host** (typical for an agent-driven dev loop), opt in to inplace mode:
+
+```bash
+jaiph run --inplace ./flow.jh
+```
+
+or set the environment variable (`1` or `true`):
+
+```bash
+JAIPH_INPLACE=1 jaiph run ./flow.jh
+```
+
+The `--inplace` flag normalizes into `JAIPH_INPLACE=1` for one run only. The container's other protections (`--cap-drop ALL`, `--security-opt no-new-privileges`, env allowlist, mount allowlist) are unchanged — only the workspace-isolation half is removed.
+
+Before launch the CLI prints a warning tailored to your git state (clean tree → `git restore .` recovers; dirty tree → commit/stash first; no repo → no safety net) and waits for `y`. The default answer on empty input or EOF is **no**.
+
+## 3. Skip the inplace confirmation prompt in CI
+
+When stdout is not a TTY (typical in CI), the inplace prompt cannot run interactively. Pass `-y` / `--yes` with `--inplace`, or set `JAIPH_INPLACE_YES=1` or `JAIPH_INPLACE_YES=true`:
+
+```bash
+jaiph run --inplace --yes ./flow.jh
+```
+
+```bash
+JAIPH_INPLACE=1 JAIPH_INPLACE_YES=1 jaiph run ./flow.jh
+```
+
+Without one of these in a non-TTY environment, the run aborts with `E_DOCKER_INPLACE_NO_CONFIRM` before any container is launched.
+
+## 4. Run on the host without a sandbox
+
+```bash
+jaiph run --unsafe ./flow.jh
+```
+
+or:
+
+```bash
+JAIPH_UNSAFE=true jaiph run ./flow.jh
+```
+
+This disables Docker entirely; the workflow runs on the host. Combining `--unsafe` with `--inplace` is rejected with `E_FLAG_CONFLICT` before any container starts (one keeps the sandbox on, the other turns it off).
+
+## Verification
+
+The CLI banner reports the sandbox mode it picked:
+
+- `Docker sandbox, fusefs` — overlay mode.
+- `Docker sandbox, tmp workspace` — copy mode.
+- `Docker sandbox, in-place (live host edits)` — inplace mode.
+- `no sandbox` — `--unsafe` / `JAIPH_UNSAFE=true` is active (Docker disabled).
+
+Run artifacts always land under host `.jaiph/runs/<date>/<time>-<entry>/` regardless of mode. Open `run_summary.jsonl` there to inspect the live `__JAIPH_EVENT__` timeline the CLI also rendered.
+
+## Related
+
+- [Sandboxing](sandboxing.md) — the model: what each mode protects, what it does not.
+- [Authenticate agent backends](/how-to/agent-auth) — getting credentials into the container.
+- [Architecture — Docker runtime helper](architecture.md#core-components) — how the host CLI builds the `docker run` invocation.
diff --git a/docs/sandboxing.md b/docs/sandboxing.md
index 9b9ba3b5..054626f2 100644
--- a/docs/sandboxing.md
+++ b/docs/sandboxing.md
@@ -1,255 +1,92 @@
 ---
 title: Sandboxing
 permalink: /sandboxing
+diataxis: explanation
 redirect_from:
   - /sandboxing.md
 ---
 
-# Sandboxing
+# Sandboxing — the model
 
-Workflows orchestrate **managed scripts** and other steps on the machine where `jaiph run` executes. That power is useful for builds and agents, but it also means a script can read files, call the network, and run arbitrary programs unless you constrain it. Jaiph addresses that at two layers: **language rules** (what may appear in a rule body) and **Docker-backed isolation** for `jaiph run` (on by default via env; see [Enabling Docker](#enabling-docker)). You can rely on rules alone, turn Docker off for host execution, or combine both.
+A Jaiph workflow runs scripts, calls agents, and touches the filesystem on whatever machine `jaiph run` is invoked on. That power is the point — and also the risk: a careless or untrusted script can read files, exfiltrate secrets, and run arbitrary programs unless something constrains it.
 
-At a high level, the **CLI** chooses local vs Docker launch (see `src/runtime/docker.ts`); the **Node workflow runtime** (`NodeWorkflowRuntime` in `src/runtime/kernel/`) interprets the same AST either way. See [Architecture](architecture.md) for how compile validation, the runner child, and durable artifacts fit together.
+Jaiph addresses this at two layers, each doing a different job:
 
-Both local and Docker runs stream `__JAIPH_EVENT__` on **stderr** only; [Hooks](hooks.md) always run on the **host** CLI and read that stream, even when the workflow runs in a container. For `config` syntax, allowed keys, and merge rules, see [Configuration](configuration.md). For the full step-type matrix, see [Grammar](grammar.md).
+- **Rules** — compile-time structural validation of what a `rule` body is allowed to contain.
+- **Docker isolation** — a runtime sandbox for `jaiph run` that runs the same workflow inside a container with a tight resource posture.
 
-## Rules: structured validation, not mutation
+This page explains the *model*: what each layer protects, what it deliberately does not protect, and why the design picks the trade-offs it does. The how-to of enabling or disabling Docker, the full configuration-key list, and the failure-mode codes live in their own how-to and reference pages — this page stays on the conceptual surface.
 
-Rules restrict which step types are allowed in their body — enforced at **compile time** in `validateReferences` (`src/transpile/validate.ts`), not by an OS sandbox. The permitted set matches [Grammar — Language concepts](grammar.md#language-concepts): `ensure` (other rules only), `run` (**scripts** only — not workflows), `const` (script/`ensure` captures, `match` expressions, or bash RHS — never `prompt`), `match`, `if`, `for … in … { … }` (line iteration over a string variable), `fail`, `log` / `logerr`, `return` (strings, identifiers, `return run …` / `return ensure …`, and the managed forms the grammar allows), `ensure … catch`, `run … catch`, and `run … recover`. Inline script steps and managed `log`/`logerr` from inline scripts are allowed where the grammar permits them.
+For the runtime implementation, see [Architecture — Docker runtime helper](architecture.md#core-components).
 
-Disallowed in rules: **raw shell lines** (every line must be a recognized Jaiph step — use a `script` and `run`), `prompt`, inbox **`send`** / routing, and **`run async`**. See the grammar page for the authoritative list and examples.
+## Two layers, two jobs
 
-The runtime executes rules by walking the rule body in-process (same interpreter as workflows; see `executeRule` in `src/runtime/kernel/node-workflow-runtime.ts`). There is no per-rule OS sandbox — no mount namespace, no automatic read-only filesystem. When a rule runs a script step, that script executes as a normal managed subprocess with full access to paths the process user can reach. Treat rules as non-mutating checks by convention; perform intentional filesystem changes in workflows, not rules.
+Rules and Docker isolation are doing fundamentally different work, and it is worth keeping them separate:
 
-`jaiph test` executes tests in-process via `runTestFile()` (`src/runtime/kernel/node-test-runner.ts`) and does not use Docker or a separate rule sandbox.
+| Layer | When it fires | What it constrains | What it does not constrain |
+|---|---|---|---|
+| **Rules** | Compile time | The set of step types allowed inside a `rule` body — no inline shell, no `prompt`, no `const … = prompt`, no `send`, no `run async` | Anything a `script` does at runtime (rules can still call scripts via `run`) |
+| **Docker** | `jaiph run` launch time | Filesystem reach, process isolation, capability surface, env-var exposure for *every* step in the workflow | Network egress (default-on), agent credentials (forwarded by design), hooks (run on host) |
 
-## Threat model
+Rules are about **structure**: by the time the compiler is done, a rule cannot contain a step type that mutates state in a surprising way. There is no OS sandbox around a rule body — when a rule calls a script, that script runs as a normal managed subprocess with the same access the workflow has. Treat rules as non-mutating checks by convention; do mutation in workflows.
 
-Docker sandboxing is designed to contain damage from untrusted or semi-trusted workflow scripts. Understanding what it does and does not protect against helps you make informed decisions about when to enable it.
+Docker is about **blast radius**: it cannot stop a script from misbehaving, but it can keep that misbehavior inside a disposable container.
 
-**What Docker protects against:**
+## The three sandbox modes
 
-- **Filesystem access** -- Scripts inside the container cannot read or write arbitrary host paths. The container's `/jaiph/workspace` is either an in-container `fuse-overlayfs` merge over a read-only bind of the host workspace (overlay mode; writes go to the overlay upper/work dirs under `/tmp` inside the container and are discarded on exit) or a host-side clone of the workspace mounted read-write (copy mode; the clone is removed on exit unless kept for debugging). Only the run-artifacts directory (`/jaiph/run`) persists writes back to the host workspace.
-- **Process isolation** -- Container processes cannot see or signal host processes. Every sandboxed container uses `--cap-drop ALL` plus `--security-opt no-new-privileges`. **Overlay mode** (Linux) adds capabilities required for `fuse-overlayfs` and for dropping privileges after mount: `SYS_ADMIN`, `SETUID`, `SETGID`, `CHOWN`, and `DAC_READ_SEARCH` (see `buildDockerArgs` in `src/runtime/docker.ts`). **Copy mode** does not add capabilities. The overlay entrypoint (`runtime/overlay-run.sh`) starts as the container user `0:0` so it can mount, then normally **`exec`s `jaiph run` as the host UID/GID** via `setpriv` when `JAIPH_HOST_UID` / `JAIPH_HOST_GID` are set; copy mode uses `--user <host_uid>:<host_gid>` directly. macOS Docker Desktop does not use Linux `--user` overrides (UID mapping is handled by the VM).
-- **Credential leakage** -- Environment variable forwarding uses an explicit allowlist: only `JAIPH_*` (except `JAIPH_DOCKER_*`), `ANTHROPIC_*`, `CLAUDE_*`, and `CURSOR_*` cross the container boundary. Everything else is dropped.
-- **Mount safety** -- The host root filesystem (`/`), Docker socket (`/var/run/docker.sock`, `/run/docker.sock`), and OS internals (`/proc`, `/sys`, `/dev`) cannot be mounted into the container. Attempting to do so produces `E_VALIDATE_MOUNT`.
-- **Shell injection safety** -- All Docker CLI invocations (`docker info`, `docker image inspect`, `docker pull`) use `execFileSync` with an explicit argument array, bypassing `/bin/sh`. Image names and other parameters are passed as literal argv entries with no shell expansion, so values containing shell metacharacters (`;`, `$`, backticks, etc.) are never evaluated.
+When Docker is enabled, the CLI picks one of three sandbox primitives at launch. The mode controls **how the workspace is presented to the container**; the env allowlist, mount allowlist, and `--security-opt no-new-privileges` posture is the same across all three. Every mode starts from `--cap-drop ALL`; overlay mode adds back a small cap set for `fuse-overlayfs` (see [What Docker protects against](#what-docker-protects-against)).
 
-**What Docker does NOT protect against:**
+- **Overlay mode** — the host workspace is bind-mounted read-only; `fuse-overlayfs` inside the container layers a writable scratch space on top, merged at `/jaiph/workspace`. Reads come from the real workspace, writes land in the overlay and are discarded when the container exits. The *idea* is copy-on-write isolation: the host checkout is the source of truth, the run can pretend to mutate it, and at exit there is no trace.
+- **Copy mode** — before launching, the CLI clones the workspace into a disposable sandbox directory and bind-mounts that clone read-write. Writes are real, but they are local to the clone, which is removed on exit. The *idea* is the same isolation contract as overlay, expressed without `fuse-overlayfs` (which is not available everywhere, notably on macOS Docker Desktop and on Linux hosts that block fuse mounts).
+- **Inplace mode** — the host workspace itself is bind-mounted read-write. The run's edits land **live** on the host. The *idea* is "trusted workspace, untrusted machine": the rest of the sandbox (caps, env allowlist, mount set) still applies, but the workspace-isolation half is removed on purpose so an agent-driven dev loop can iterate against the real checkout.
 
-- **Hooks run on the host.** Hook commands in `hooks.json` execute on the host CLI process, not inside the container. A malicious hook definition has full host access. Treat `hooks.json` as trusted configuration.
-- **Network egress by default.** Unless `runtime.docker_network` is set to `"none"`, the container has outbound network access via Docker's default bridge. Scripts can reach external services and exfiltrate data through the network.
-- **Agent credential forwarding.** `ANTHROPIC_*`, `CLAUDE_*`, and `CURSOR_*` variables are forwarded into the container so agent-backed workflows function. Any workflow code in the container can read them from the environment together with outbound network access; treat that as **full disclosure** of those secrets to workflow code.
-- **Image supply chain.** Jaiph verifies that the selected image contains `jaiph` but does not verify image signatures or provenance. Use trusted registries and pin image digests for production workloads.
-- **Container escapes.** Docker is not a security boundary against a determined attacker with kernel exploits. It raises the bar significantly for script-level mischief but is not equivalent to a VM or hardware-level isolation.
+Overlay and copy are interchangeable from the user's point of view — both produce the property that **the host workspace is unmodified after a Docker run**. Inplace explicitly opts out of that property in exchange for a tighter dev loop, and the CLI gates it behind a destructive-edit confirmation prompt before launch.
 
-## Docker container isolation
+In every mode, run artifacts are written to a separate read-write mount at `/jaiph/run` (outside the workspace sandbox) so the artifact tree under `.jaiph/runs/` persists on the host regardless of what happened inside the container.
 
-> **Beta.** Docker sandboxing is functional but still under active development. Expect rough edges, breaking changes, and incomplete platform coverage. Feedback is welcome at <https://github.com/jaiphlang/jaiph/issues>.
+## What Docker protects against
 
-Docker applies to `jaiph run` only (not `jaiph test`). Enablement is **environment-driven** (see [Enabling Docker](#enabling-docker)); there is no `jaiph run --docker` flag — the CLI decides from env before spawn. **`jaiph run --raw` on the host never starts Docker:** only interactive `jaiph run` (no `--raw` on the host) consults `JAIPH_DOCKER_ENABLED` / `JAIPH_UNSAFE` and may spawn a container — see [CLI — `jaiph run`](cli.md#jaiph-run). When Docker is active, the entire workflow (every rule and script step) runs inside a **single** container. The container runs `jaiph run --raw <file>` using the **image’s** installed `jaiph`, not the host binary. The `--raw` flag skips the banner and progress UI in that inner process so `__JAIPH_EVENT__` JSON lines go to **stderr** unchanged for the host CLI to parse.
+The Docker sandbox is designed to contain damage from untrusted or semi-trusted workflow scripts. Its protections are:
 
-The container's `/jaiph/workspace` always *looks* writable to scripts but never mutates the host checkout. The CLI picks one of two sandbox primitives at launch time:
+- **Filesystem reach** — scripts inside the container cannot read or write arbitrary host paths outside the workspace mount and the run-artifacts mount. The rest of the host is invisible to the container. Overlay and copy modes additionally make the workspace itself non-persistent.
+- **Process isolation** — container processes cannot see or signal host processes. Every sandboxed container runs with `--cap-drop ALL` and `--security-opt no-new-privileges`. Overlay mode adds back a small set of capabilities required to mount `fuse-overlayfs` and then drop privileges; copy and inplace modes do not add any back.
+- **Mount safety** — the host root filesystem, the Docker daemon socket, and OS-internal paths (`/proc`, `/sys`, `/dev`) cannot be mounted into the container. Attempting to do so produces a validation error before launch.
+- **Environment exposure** — host environment variables do not cross the boundary by default. Only an explicit prefix allowlist (`JAIPH_*`, `ANTHROPIC_*`, `CLAUDE_*`, `CURSOR_*`, with `JAIPH_DOCKER_*` and the inplace-control flags excluded) is forwarded. Every other variable is dropped, including unrelated cloud credentials, SSH agents, and registry tokens.
+- **Shell injection safety** — every `docker` invocation passes an explicit argv array (`execFileSync` or `spawn`), never `/bin/sh`. Image names and other parameters are passed as literal arguments, so values containing shell metacharacters are never expanded.
 
-- **Overlay mode** (selected when `/dev/fuse` exists on the host — typically Linux). The host workspace is bind-mounted read-only at `/jaiph/workspace-ro`. The runtime entrypoint (`runtime/overlay-run.sh`, copied into the container read-only) runs `fuse-overlayfs` with that read-only tree as the lower layer and **writable upper/work directories under `/tmp`** inside the container, merged at `/jaiph/workspace`. Writes stay in the container filesystem and are discarded when the container exits. Requires `/dev/fuse` in the container and the extra Linux capabilities described under [Process isolation](#threat-model) (not only `SYS_ADMIN`).
-- **Copy mode** (selected when `/dev/fuse` is missing — typically macOS Docker Desktop, or when forced via `JAIPH_DOCKER_NO_OVERLAY=1` or `JAIPH_DOCKER_NO_OVERLAY=true`). Before launching the container, the CLI clones the host workspace (see below) into a fresh `<runs-root>/.sandbox-<id>/` directory, then bind-mounts that clone read-write at `/jaiph/workspace`. On macOS the clone uses `cp -cR` (APFS clonefile, near-zero cost) when the filesystem supports it; otherwise it falls back to `cp -pR` and emits a one-line stderr warning. The clone is removed on exit unless `JAIPH_DOCKER_KEEP_SANDBOX` is `1` or `true`. No `SYS_ADMIN`, no `/dev/fuse`, no in-container overlay script.
+## What Docker does **not** protect against
 
-The clone copies each top-level entry of the workspace; under `.jaiph` it copies everything except the `runs` tree (run logs live under the separate `/jaiph/run` mount). **`.git` is not stripped** — workflows that call `git` see the same history as on the host, at the cost of a larger copy in copy mode on Linux.
+Equally important is the list of things Docker is deliberately *not* claiming to defend:
 
-In both modes, run artifacts are written to a separate rw mount at `/jaiph/run` (outside the workspace sandbox) so they persist to the host.
+- **Network egress is on by default.** The sandbox only passes `--network none` when configuration sets the Docker network mode to `none` (`JAIPH_DOCKER_NETWORK` or module `runtime.docker_network`; see [Configuration — Runtime (Docker) keys](configuration.md#runtime-docker-keys)). When the mode is the default (`default`), no `--network` flag is passed and the container uses Docker's bridge with outbound access. A script can reach external services and exfiltrate data over the network.
+- **Agent credentials cross the boundary.** `ANTHROPIC_*`, `CLAUDE_*`, and `CURSOR_*` variables are forwarded so agent-backed workflows can function. Combined with default network egress, treat them as **fully disclosed** to anything that runs inside the container.
+- **Hooks run on the host.** Hook commands from `.jaiph/hooks.json` (merged with `~/.jaiph/hooks.json`) execute on the host CLI process, not inside the container, and have full host access. Hook config is trusted.
+- **Image supply chain is the user's responsibility.** Jaiph verifies that the selected image contains a working `jaiph` binary, but does not verify image signatures or provenance. Use trusted registries and pin digests for anything that matters.
+- **Container escapes are not guaranteed-impossible.** Docker is not equivalent to a VM or hardware isolation. It raises the bar against script-level mischief, but a kernel exploit can in principle break out.
+- **Inplace mode opts out of workspace isolation.** With `JAIPH_INPLACE` set, the run can mutate your real workspace. The machine outside the workspace stays sandboxed as in any mode, but a crashed or malicious run can leave your checkout half-edited.
 
-### Enabling Docker
+This list exists because a sandbox that overclaims is worse than one that is honest about its scope. Jaiph treats the Docker boundary as a **blast-radius reducer for workflow scripts**, not as a credential vault or a network firewall.
 
-**Turning Docker on or off** uses environment variables only — a `.jh` workflow file cannot enable or disable the container by itself. **Image, network, and timeout** still come from module `config` and env overrides as in [Configuration keys](#configuration-keys). The idea is that skipping the container always requires an explicit host choice (`JAIPH_UNSAFE` / `JAIPH_DOCKER_ENABLED`), not something you can turn on from committed workflow source alone.
+## Why opt-out, not opt-in
 
-Docker is **on by default** for both local development and CI. To run on the host without a sandbox, set `JAIPH_UNSAFE=true`. To control Docker enablement explicitly, set `JAIPH_DOCKER_ENABLED`.
+The default-on choice — Docker on unless the host sets `JAIPH_UNSAFE=true` or sets `JAIPH_DOCKER_ENABLED` to any value other than exact `true` — is deliberate. Workflows orchestrate agent and script code that is often pulled from a repository, edited by a model, or contributed by a third party. Making the safer posture the path of least resistance means a careless workflow gets contained by default and only escapes the container when a human types out the override.
 
-> **Credential warning:** Docker sandboxing **does not isolate agent credentials**. `ANTHROPIC_*`, `CLAUDE_*`, and `CURSOR_*` env vars are forwarded into the container and the default network allows outbound access. A malicious script can read these from its environment and exfiltrate them. Set `runtime.docker_network = "none"` for workflows that should not make external calls.
+A second, equally deliberate choice: **enablement lives entirely in environment variables, not in in-file `config`**. Module-level `runtime.docker_*` keys can tune image, network, and timeout, but nothing in a `.jh` file can turn Docker off — `runtime.docker_enabled` is rejected at parse time. That keeps the "host is in charge of sandbox enablement" property: pulling a workflow file from a less-trusted source cannot ship an off-switch with it.
 
-**Precedence (two rows, env only):**
+The escape hatch — `JAIPH_UNSAFE=true` or `jaiph run --unsafe` — exists because some environments genuinely cannot run Docker (a sandboxed CI without nested virtualization, a developer iterating on the runtime itself). The choice to take that hatch should be visible and ergonomic, which is why it is a single explicit host-side switch rather than an in-file `config` knob.
 
-| Check | Result |
-|-------|--------|
-| `JAIPH_DOCKER_ENABLED` is set | `"true"` enables Docker; any other value disables it |
-| Default (no explicit env) | Docker **on**, unless `JAIPH_UNSAFE=true` (Docker **off**) |
+## Why `jaiph test` does not use Docker
 
-CI environments (`CI=true`) deliberately exercise the same sandbox path users do -- `CI=true` alone does not disable Docker.
+The test runner runs in-process on the host. This is intentional: tests are a development feedback loop, they typically mock prompts and replace external calls, and Docker spawn overhead would harm the iteration cycle. Tests already get isolation from the things they care about (prompts, network) through the runtime's mock infrastructure. The Docker boundary is for `jaiph run`, where the workflow is executing real scripts against real resources.
 
-If Docker is enabled but `docker info` fails, the run exits with `E_DOCKER_NOT_FOUND` and suggests setting `JAIPH_UNSAFE=true` as an escape hatch. There is no silent fallback to local execution.
+## How sandboxing fits the rest of Jaiph
 
-> **Migration note:** `runtime.docker_enabled` is not an allowed `config` key — the parser rejects it as an unknown key (with the allowed-key list in the error). Use `JAIPH_DOCKER_ENABLED` or `JAIPH_UNSAFE` in the environment instead.
+The Docker sandbox does not change workflow semantics. The runtime inside the container is the same **`NodeWorkflowRuntime`** AST interpreter that runs locally — the container runs **`jaiph run --raw`**, which spawns the internal **`__workflow-runner`** child the same way as host **`--raw`** execution (see [Architecture — Docker runtime helper](architecture.md#core-components)), same **`__JAIPH_EVENT__`** stream on stderr, same **`run_summary.jsonl`** written under **`.jaiph/runs/`**. The only differences are *where* processes execute and *what host resources they can reach*.
 
-### Configuration keys
+That property is the point of the design: a workflow is the same workflow whether it runs sandboxed or not. The sandbox is a deployment decision, not a programming model.
 
-**Docker on/off** is **not** a `runtime.*` key — only `JAIPH_DOCKER_ENABLED` / `JAIPH_UNSAFE` control that (see [Enabling Docker](#enabling-docker)). The keys below live under `runtime.*` in **module-level** `config` only. For **image**, **network**, and **timeout**, the merge is **`JAIPH_DOCKER_*` environment variables > module `runtime.*` > defaults** (`resolveDockerConfig` in `src/runtime/docker.ts`). Docker on/off does not use `runtime.*`; it follows [Enabling Docker](#enabling-docker) only.
+## Related
 
-| Key | Type | Default | Description |
-|-----|------|---------|-------------|
-| `runtime.docker_image` | string | `"ghcr.io/jaiphlang/jaiph-runtime:<version>"` | Container image. Must already contain `jaiph`. Defaults to the official GHCR runtime image matching the installed jaiph version. |
-| `runtime.docker_network` | string | `"default"` | Docker network mode. |
-| `runtime.docker_timeout_seconds` | integer | `3600` | Max execution time in seconds (default one hour). Must be a non-negative integer; `0` disables the timeout. Negative values produce `E_DOCKER_TIMEOUT`. |
-
-Each key is type-checked at parse time. Unknown keys produce `E_PARSE`. The workspace mount is automatic and not configurable.
-
-#### Environment variable overrides
-
-Following the `JAIPH_*` convention: `JAIPH_DOCKER_ENABLED`, `JAIPH_DOCKER_IMAGE`, `JAIPH_DOCKER_NETWORK`, `JAIPH_DOCKER_TIMEOUT`. Additionally, `JAIPH_UNSAFE=true` disables Docker by default (see [Enabling Docker](#enabling-docker)). `CI=true` does **not** affect the default — CI runs use the same sandbox path users do.
-
-Precedence for **enablement** only: `JAIPH_DOCKER_ENABLED` env > unsafe default rule (see table above). Image, network, and timeout use the env > in-file > default merge described in this section.
-
-If `JAIPH_DOCKER_TIMEOUT` is set but not a valid non-negative integer, the run exits with `E_DOCKER_TIMEOUT`.
-
-### Workspace mount
-
-The workspace mount is automatic and not configurable. The workspace root is always bound into the container — in overlay mode at `/jaiph/workspace-ro` (read-only, with fuse-overlayfs merged at `/jaiph/workspace`), and in copy mode the host-side clone is mounted read-write at `/jaiph/workspace`. There are no user-controlled extra mounts.
-
-The workspace root is validated before launch. The following host paths are rejected with `E_VALIDATE_MOUNT`:
-
-- `/` (host root filesystem)
-- `/var/run/docker.sock`, `/run/docker.sock` (Docker daemon socket)
-- `/proc`, `/sys`, `/dev` (OS internals, including subpaths like `/proc/1/root`)
-
-### Container layout
-
-Overlay mode:
-
-```
-/jaiph/
-  workspace-ro/       # read-only bind mount of host workspace (overlay lower layer)
-  workspace/          # fuse-overlayfs merged view (reads from -ro; writes to upper/work under /tmp in the container)
-    *.jh              # source files
-    .jaiph/           # project config
-  run/                # writable bind mount for this run's artifacts (host runs root)
-  overlay-run.sh      # entrypoint script (from runtime/overlay-run.sh) mounted ro from host temp file
-```
-
-Copy mode:
-
-```
-/jaiph/
-  workspace/          # rw bind mount of <runs-root>/.sandbox-<id>/ on the host
-    *.jh              # cloned source files (writes are local to the clone)
-    .jaiph/           # cloned config (.jaiph/runs is excluded from the clone)
-  run/                # writable bind mount for this run's artifacts (host runs root)
-```
-
-The working directory is `/jaiph/workspace`. In overlay mode the host CLI writes `overlay-run.sh` (shipped as `runtime/overlay-run.sh` in the npm package) to a temp file and mounts it read-only at `/jaiph/overlay-run.sh`; the container runs `/jaiph/overlay-run.sh jaiph run --raw <file>`. In copy mode the container runs `jaiph run --raw <file>` directly -- no entrypoint script. The image must already contain `jaiph` — Jaiph does not install itself into the container at runtime.
-
-### Runtime behavior
-
-**Container lifecycle** -- `docker run --rm` launches the container and auto-removes it on exit. `--cap-drop ALL` drops all Linux capabilities; overlay mode re-adds the capability set listed under [Process isolation](#threat-model) (not copy mode). `--security-opt no-new-privileges` is always set. The pseudo-TTY flag (`-t`) is intentionally omitted: Docker's `-t` merges stderr into stdout, which would break the `__JAIPH_EVENT__` stderr-only live contract.
-
-**Signal-safe cleanup** -- When the CLI receives SIGINT (Ctrl-C) or SIGTERM during a Docker run, `cleanupDocker` is called before the process exits. This removes the copy-mode sandbox directory (`<runs-root>/.sandbox-<id>/`) and clears any timeout timer, preventing stale workspace clones from accumulating after interrupted runs. A `process.on("exit")` guard provides a final safety net: if the normal exit path has not already cleaned up, the guard calls `cleanupDocker` synchronously. A `cleaned` flag on `DockerSpawnResult` ensures cleanup runs at most once — there are no double-`rmSync` warnings regardless of which path fires first. SIGKILL cannot be caught and is not handled; a startup-time sweep of stale sandbox directories is out of scope.
-
-**UID/GID handling on Linux:**
-
-- **Copy mode** -- the container runs directly as `--user <host_uid>:<host_gid>` so writes to the cloned workspace and `/jaiph/run` land owned by the host user.
-- **Overlay mode** -- the container is started as `--user 0:0` so `fuse-overlayfs` can mount. The host UID/GID are forwarded as `JAIPH_HOST_UID` / `JAIPH_HOST_GID`; `overlay-run.sh` **`chown`s the run mount** (best effort) and then **`exec`s `jaiph run` under `setpriv`** to reuid/regid to the host user when `setpriv` is available. If `setpriv` is missing, the workflow may continue as UID 0 inside the container — use an image that includes `setpriv` (the official runtime does) for the intended behavior.
-
-On **Linux**, if the host UID/GID cannot be determined (`process.getuid()` / `process.getgid()` and `id -u` / `id -g` both fail), `buildDockerArgs` throws `E_DOCKER_UID` and the run exits before the container is launched. This prevents overlay or copy mode from starting without a usable `--user` mapping. On **macOS** Docker Desktop the VM transparently translates UIDs across the bind-mount boundary, so the CLI does not apply Linux-style `--user` overrides and this check does not run.
-
-**stdin** -- The `docker run` process is spawned with stdin set to `ignore` to prevent the Docker CLI from blocking on stdin EOF.
-
-**Events** -- The container's jaiph runs in `--raw` mode: it spawns the runtime with inherited stdio, so `__JAIPH_EVENT__` JSON flows directly to the container's stderr. The host CLI reads Docker's stderr pipe and renders the progress tree. stdout carries plain script output. `STEP_END` events embed `out_content` (and `err_content` on failure) so consumers do not need host paths to step artifact files.
-
-**Sandbox primitive (overlay vs. copy)** -- Selected at launch time. If `/dev/fuse` exists on the host, the CLI uses **overlay mode**: the `overlay-run.sh` wrapper (shipped as `runtime/overlay-run.sh`, written to a temp file and mounted read-only) runs `fuse-overlayfs` with the ro bind mount (`/jaiph/workspace-ro`) as the lower layer and **writable upper/work directories under `/tmp`** (`overlay-run.sh` uses `/tmp/overlay-upper` and `/tmp/overlay-work`), merged at `/jaiph/workspace`. Workspace writes stay in the container and are discarded on container exit. On Linux hosts, the overlay container is also launched with `--security-opt apparmor=unconfined` because the default Docker AppArmor profile (active on Ubuntu 22.04+, GitHub Actions runners, and similar) denies fuse mounts even when `SYS_ADMIN` and `/dev/fuse` are present. If `fuse-overlayfs` is missing from the image or the mount still fails at runtime, the entrypoint exits with `E_DOCKER_OVERLAY` — there is no in-container fallback. Set `JAIPH_DOCKER_NO_OVERLAY=1` (or `true`) on the host to opt into copy mode instead. Custom images used in overlay mode must ensure `/jaiph/workspace` is mountable by root (the official image keeps this path root-owned).
-
-If `/dev/fuse` is missing on the host, the CLI uses **copy mode**: before launching the container it clones the workspace into `<runs-root>/.sandbox-<id>/` using `cp -cR` on macOS when clonefile works (otherwise `cp -pR` and a one-time stderr warning), or `cp -pR` on other platforms. The clone is bind-mounted rw at `/jaiph/workspace`. After the container exits — whether normally, via signal (SIGINT/SIGTERM), or due to an uncaught error — the clone is removed unless `JAIPH_DOCKER_KEEP_SANDBOX` is `1` or `true`, in which case the path is left in place for debugging.
-
-**Run artifacts** -- The host CLI mounts the resolved host runs root at `/jaiph/run:rw` inside the container. By default this is `.jaiph/runs` under the workspace; a relative `JAIPH_RUNS_DIR` is resolved under the workspace; an absolute `JAIPH_RUNS_DIR` must stay within the workspace or the run fails with `E_DOCKER_RUNS_DIR`. `JAIPH_RUNS_DIR` is set to `/jaiph/run` inside the container, so the runtime writes artifacts directly into the requested host path. On **Linux** in **overlay** mode, the CLI best-effort `chmod`s that host run directory to mode `0777` before `docker run` so writes still work when the daemon uses user-namespace remapping and the inner workflow runs as a non-root UID.
-
-**Path remapping** {#path-remapping} -- Inside the container, the runtime records artifact paths relative to `/jaiph/run` (e.g. `/jaiph/run/2026-04-21/07-55-32-say_hello.jh/000003-script__validate_name.err`). These container-internal paths do not exist on the host. After the container exits, the host CLI remaps every container path that starts with `/jaiph/run/` to the corresponding path under the bind-mounted host runs directory (the `sandboxRunDir`). This ensures the failure footer (`Logs:`, `Summary:`, `out:`, `err:`) printed to stderr shows valid **host** paths that can be opened directly. The `run_summary.jsonl` file also records container-internal `out_file` / `err_file` values; the CLI applies the same remapping when reading these fields to locate artifact content for the "Output of failed step" excerpt. When the container meta file is inaccessible from the host (typical in Docker mode), the CLI discovers the run directory by walking UTC date/time subdirectories of the bind-mounted runs root **newest first** until it finds a `run_summary.jsonl` whose first line is a `WORKFLOW_START` event with `run_id` equal to the expected run id (the same value as `JAIPH_RUN_ID` on the host). This stays correct when concurrent `jaiph run` invocations share the same runs root. The net effect is that Docker and no-sandbox runs produce identical failure footers — same structure, same host-resolvable paths, same step output excerpt.
-
-**Workspace immutability contract** -- Docker runs cannot directly modify the host workspace. In overlay mode the host checkout is bind-mounted read-only and writes land in the overlay upper layer (under `/tmp` inside the container) and are discarded on container exit. In copy mode the container writes to a separate host-side clone of the workspace (`<runs-root>/.sandbox-<id>/`), which is removed on container exit unless explicitly kept for debugging. In both modes the only persistence channel from a Docker run to the host is the run-artifacts directory (`/jaiph/run` → host `.jaiph/runs`). Non-Docker (local) runs are unaffected by this contract.
-
-**Workspace patch export** -- To capture workspace changes as a patch, run `git diff` (or your own exporter) inside the workflow, write the result to a file under the workspace, then call `artifacts.save(local_path)` so the patch lands in the run’s `artifacts/` tree on the host. Callers choose when and what to record. The published GHCR runtime image includes `git` if you use it from a script step. See [Libraries — `jaiphlang/artifacts`](libraries.md#jaiphlangartifacts--publishing-files-out-of-the-sandbox).
-
-**Network** -- `"default"` omits `--network`, which uses Docker's default bridge network (outbound access allowed). `"none"` passes `--network none` and fully disables networking -- use this for workflows that should not make external calls. Any other value (e.g. a custom Docker network name) is passed through as-is. Set `runtime.docker_network` in config or `JAIPH_DOCKER_NETWORK` in the environment.
-
-**Timeout** -- When the effective timeout (from `JAIPH_DOCKER_TIMEOUT` or `runtime.docker_timeout_seconds`, after the merge in [Configuration keys](#configuration-keys)) is greater than zero, the CLI arms a timer on the spawned `docker` child; on overrun it sends `SIGTERM`, then `SIGKILL` after a 5-second grace period. The failure message includes `E_TIMEOUT container execution exceeded timeout`. `0` disables the timer.
-
-**Image pre-pull** -- Image preparation (`prepareImage`) runs **before** the CLI banner so Docker's pull overhead does not interleave with the progress tree. If the image is not present locally, a `pulling image <name>…` status line is written to stderr, then `docker pull --quiet` runs (Docker's native layer progress is suppressed); on success the CLI writes `pulled` on its own line. Pull failure produces `E_DOCKER_PULL`. After the pull (or if the image was already local), `verifyImageHasJaiph` confirms the image contains `jaiph`. The banner and progress tree only begin after image preparation completes.
-
-### Failure modes
-
-The table below lists Docker run failures and the codes emitted in logs or error output. Most are `E_DOCKER_*`; **`E_TIMEOUT`** and **`E_VALIDATE_MOUNT`** appear here because they surface during container runs or mount validation, not inside the interpreter.
-
-| Error code | Trigger | Behavior |
-|------------|---------|----------|
-| `E_DOCKER_NOT_FOUND` | `docker info` fails (Docker not installed or daemon not running) | Run exits immediately. No fallback to local execution. |
-| `E_DOCKER_PULL` | `docker pull` fails (network error, image not found, auth failure) | Run exits. Check registry access and image name. |
-| `E_DOCKER_NO_JAIPH` | Selected image does not contain a `jaiph` CLI | Run exits with guidance to use the official image or install jaiph. |
-| `E_DOCKER_RUNS_DIR` | Absolute `JAIPH_RUNS_DIR` points outside the workspace | Run exits. Use a relative path or an absolute path within the workspace. |
-| `E_DOCKER_OVERLAY` | Overlay mode selected but `fuse-overlayfs` is missing from the image or the mount fails inside the container | Container exits with code 78. Use the official runtime image, install `fuse-overlayfs` in your custom image, or set `JAIPH_DOCKER_NO_OVERLAY=1` (or `true`) on the host to switch to copy mode. The CLI already passes `--security-opt apparmor=unconfined` on Linux to defeat the default AppArmor fuse-deny; remaining failures usually mean the host kernel itself blocks fuse mounts (rootless docker without the right user-namespace setup, locked-down kernel, etc.). |
-| `E_DOCKER_TIMEOUT` | `JAIPH_DOCKER_TIMEOUT` is empty, non-numeric, negative, or has trailing junk; or `runtime.docker_timeout_seconds` is negative in the parsed module | Run exits before container launch. A valid value is a non-negative integer; `0` disables the timeout. |
-| `E_DOCKER_UID` | Linux host UID/GID detection failed (`process.getuid` and `id -u` both unavailable) | Run exits before container launch. Ensures the container never silently runs as root. Applies to both copy and overlay modes. |
-| `E_DOCKER_SANDBOX_COPY` | Copy mode failed to clone the host workspace (`cp` returned non-zero) | Run exits before container launch. Inspect the path printed in the error. |
-| `E_VALIDATE_MOUNT` | Mount targets a denied host path (`/`, `/proc`, docker socket, etc.) | Run exits before container launch. |
-| `E_TIMEOUT` | Container runs longer than the effective Docker timeout seconds (`JAIPH_DOCKER_TIMEOUT` or `runtime.docker_timeout_seconds` after merge; see [Configuration keys](#configuration-keys)) | Container receives SIGTERM, then SIGKILL after 5s grace period. |
-
-All failures are deterministic and produce non-zero exit codes. There is no silent fallback from Docker to local execution.
-
-### Image contract
-
-**Every Docker image used by Jaiph must already contain a working `jaiph` CLI.** Jaiph does not auto-install itself into containers at runtime — no derived image builds, no `npm pack` bootstrap. If the selected image lacks `jaiph`, the run fails immediately with `E_DOCKER_NO_JAIPH` and guidance to use the official image or install jaiph in a custom image.
-
-### Official runtime image
-
-Jaiph publishes official runtime images to GHCR:
-
-| Tag | Built from | Use case |
-|-----|-----------|----------|
-| `ghcr.io/jaiphlang/jaiph-runtime:<semver>` | Release tags (`v*`) | Production / pinned versions |
-| `ghcr.io/jaiphlang/jaiph-runtime:nightly` | `nightly` branch | Contributors and CI |
-| `ghcr.io/jaiphlang/jaiph-runtime:latest` | Latest release tag | Convenience alias |
-
-The default `runtime.docker_image` is `ghcr.io/jaiphlang/jaiph-runtime:<version>` where `<version>` matches the installed jaiph package version. Published tags (`:<semver>`, `:nightly`, `:latest`) are built from the `runtime/Dockerfile` in the jaiph repository (see the `docker-publish` job in `.github/workflows/ci.yml`). The image includes Node.js, jaiph, `fuse-overlayfs`, agent CLIs where that Dockerfile installs them, and a non-root `jaiph` user (UID 10001).
-
-### Custom images and `jaiph run`
-
-`jaiph run` **always** uses the configured image (`runtime.docker_image`, `JAIPH_DOCKER_IMAGE`, or the default GHCR tag above). It does not run `docker build` for you. Build and publish (or `docker build` + `docker tag`) your own image, then set `runtime.docker_image` / `JAIPH_DOCKER_IMAGE`.
-
-After the image is pulled or found locally, Jaiph verifies that `jaiph` is available inside the container. If the check fails, the run exits with `E_DOCKER_NO_JAIPH`.
-
-`overlay-run.sh` is shipped as `runtime/overlay-run.sh` in the npm package; the host CLI writes it to a temp file and mounts it into the container at runtime.
-
-### Extending the official image
-
-To add project-specific tools or agent CLIs, extend the published image in your own Dockerfile (build locally or in CI), then point `runtime.docker_image` at the result:
-
-```dockerfile
-FROM ghcr.io/jaiphlang/jaiph-runtime:nightly
-
-USER root
-RUN npm install -g @anthropic-ai/claude-code
-USER jaiph
-
-# Add project-specific package managers/build tools below.
-```
-
-### Environment variable forwarding
-
-Environment variable forwarding uses an explicit allowlist; everything else is dropped. Only variables matching the following prefixes are forwarded into the container:
-
-- `JAIPH_*` (except `JAIPH_DOCKER_*`, excluded to prevent nested Docker execution)
-- `ANTHROPIC_*`
-- `CURSOR_*`
-- `CLAUDE_*`
-
-`JAIPH_WORKSPACE` is overridden to `/jaiph/workspace` and `JAIPH_RUNS_DIR` is overridden to `/jaiph/run`. If `JAIPH_AGENT_TRUSTED_WORKSPACE` points at a path inside the host workspace, it is rewritten to the matching path under `/jaiph/workspace` so agent CLIs see a path that exists in the container; absolute paths outside the workspace are left unchanged. `JAIPH_RUN_ID` is forwarded into the container so the runtime reuses the host-generated run identifier instead of creating its own — this ties the container's `run_summary.jsonl` back to the host CLI invocation and prevents concurrent-run misidentification during run-directory discovery.
-
-This allowlist is enforced in `buildDockerArgs` and cannot be overridden. Any variable not matching the allowlist -- including cloud credentials (`AWS_*`, `GCP_*`, etc.), authentication sockets (`SSH_*`), registry tokens (`NPM_TOKEN`, `GITHUB_TOKEN`, `PYPI_*`, `CARGO_*`), and all other host environment -- is silently dropped. If a workflow needs external credentials inside the container, pass them explicitly through `JAIPH_*`-prefixed variables or use a credential proxy.
-
-### Example
-
-A workflow with a custom Docker timeout (Docker is on by default):
-
-```jh
-config {
-  runtime.docker_timeout_seconds = 600
-}
-
-workflow default() {
-  log "Running inside Docker"
-}
-```
+- [Architecture — Docker runtime helper](architecture.md#core-components) — the spawn, mount, and event-stream wiring.
+- [Architecture — Channels and hooks in context](architecture.md#channels-and-hooks-in-context) — why hooks run on the host even for containerized runs.
+- [Why Jaiph](why-jaiph.md) — the design context that puts the sandbox into the broader picture.
diff --git a/docs/setup.md b/docs/setup.md
index 0633f9ea..e9c1a9e7 100644
--- a/docs/setup.md
+++ b/docs/setup.md
@@ -1,139 +1,70 @@
 ---
-title: Setup
-permalink: /setup
+title: Install & switch versions
+permalink: /how-to/install
+diataxis: how-to
 redirect_from:
+  - /setup
   - /setup.md
 ---
 
-# Setup
+# Install & switch versions
 
-## Overview
+This recipe installs the `jaiph` CLI onto your `PATH`, verifies it, and switches between releases (stable, nightly, or a specific version).
 
-Jaiph ships as a **CLI** backed by Node: it parses `.jh` sources, runs compile-time validation during script extraction, emits **`script`** bodies into a **`scripts/`** directory (path in **`JAIPH_SCRIPTS`**), and starts a **Node workflow runtime** that interprets workflow ASTs in process (same stack for local runs, Docker, and tests — see [Architecture — System overview](architecture.md#system-overview)). This page covers **installing the CLI**, **running your first workflow**, **workspace layout**, and **`jaiph init`**, not language syntax or runtime internals.
+The curl installer downloads a per-platform standalone binary from the current stable GitHub Release. Node and npm are **not** required to run that binary; it self-contains the runtime and the agent skill.
 
-Goals you should leave with:
+## Prerequisites
 
-1. **The Jaiph CLI** on your `PATH`.
-2. A mental model for **workspace root** (`JAIPH_WORKSPACE`), **run artifacts**, and optional **`.jaiph/`** scaffolding.
-3. Pointers to **format**, **tests**, **libraries**, and deeper docs.
+- A POSIX `sh` (the runtime uses `sh -c` for inline shell lines inside workflows; emitted `script` steps follow their own shebang).
+- For the curl installer (step 1): `curl` and either `shasum` or `sha256sum` on `PATH`.
+- For the npm alternative (step 1): Node.js and npm on the host.
 
-### Prerequisites
+## 1. Install the binary
 
-- **Node.js** — required to run `jaiph` (the curl installer runs `npm install` and `npm run build` in a checkout).
-- **Shell tooling** — the CLI and workflow runtime are Node-based; **emitted `script` steps** run by spawning the script path so the interpreter comes from each file’s **shebang** (often `#!/usr/bin/env bash` or another interpreter on your `PATH`). **Shell lines inside workflows** (after Jaiph interpolation) run via **`sh -c`**, so a POSIX **`sh`** must exist. See [Architecture — Distribution](architecture.md#distribution-node-vs-bun-standalone).
-
-## Install
+Use the curl installer:
 
 ```bash
 curl -fsSL https://jaiph.org/install | bash
 ```
 
-This installs a small wrapper **`jaiph`** under `~/.local/bin` plus a **`~/.local/bin/.jaiph/`** tree: `src/` (compiled CLI), `package.json`, and **`jaiph-skill.md`** (copied from the repo for `jaiph init`). Alternatively:
-
-```bash
-npm install -g jaiph
-```
-
-The published npm package may **not** include `docs/jaiph-skill.md` next to the CLI the way the curl layout does — if **`jaiph init`** does not write `.jaiph/SKILL.md`, point **`JAIPH_SKILL_PATH`** at a skill file (for example the repo’s `docs/jaiph-skill.md`, or download the canonical raw skill: `https://raw.githubusercontent.com/jaiphlang/jaiph/refs/heads/main/docs/jaiph-skill.md`).
+This downloads `jaiph-{darwin|linux}-{arm64|x64}` and `SHA256SUMS` from the current stable Release, verifies the checksum, and installs the binary to `~/.local/bin/jaiph`. Override the install location with `JAIPH_BIN_DIR`.
 
-Verify:
+(Alternative) Install via npm when you already have Node on the host and want package-manager-tracked installs:
 
 ```bash
-jaiph --version
-```
-
-If the command is not found, ensure `~/.local/bin` (installer) or the npm global bin directory is on your **`PATH`** (the **`docs/run`** helper prepends `$HOME/.local/bin` automatically after installing).
-
-Switch versions anytime: **`jaiph use`** runs your install command via **`bash -c`** (default: `curl -fsSL https://jaiph.org/install | bash`) with **`JAIPH_REPO_REF`** set to **`nightly`** or to **`v`** plus the version (for example **`0.9.4`** → **`v0.9.4`**).
-
-```bash
-jaiph use nightly
-jaiph use 0.9.4    # reinstalls tag v0.9.4
-```
-
-Default install invocation is `curl -fsSL https://jaiph.org/install | bash`; override **`JAIPH_INSTALL_COMMAND`** when you need a fork, offline bundle, or local script (**`docs/install-from-local.sh`** wraps `docs/install` with a repo path).
-
-## Quick try
-
-Run a sample workflow without installing first:
-
-```bash
-curl -fsSL https://jaiph.org/run | bash -s '
-workflow default() {
-  const response = prompt "Say: Hello I'\''m [model name]!"
-  log response
-}'
-```
-
-The script installs Jaiph if it is missing, then runs the workflow in a fresh temp directory that includes a **`.jaiph`** marker (so Docker sandboxes only mount that tree — see comments in the repo’s [`docs/run`](https://github.com/jaiphlang/jaiph/blob/main/docs/run)). Requires **`node`** and **`curl`**. For local docs or CI without production URLs, set **`JAIPH_SITE`** (documented in the same file).
-
-For more runnable samples (inbox, async, testing, ensure/catch), see the [`examples/`](https://github.com/jaiphlang/jaiph/tree/main/examples) directory.
-
-## Running a workflow
-
-Jaiph workflows live in **`.jh`** files (**`*.test.jh`** suites use **`jaiph test`** instead — see [Testing](testing.md)). **`jaiph run`** loads a **single entry file** and runs the workflow named **`default`** (`workflow default(...) { ... }`). Use a **shebang** (`#!/usr/bin/env jaiph`) or the CLI: if the first argument is an existing file path, names ending in **`.test.jh`** dispatch to **`jaiph test`** (this check runs before the generic **`.jh`** rule), and every other **`.jh`** file dispatches to **`jaiph run`** (see [CLI — file shorthand](cli.md#file-shorthand)).
-
-```bash
-./path/to/main.jh "feature request or task"
-# or explicitly:
-jaiph run ./path/to/main.jh "feature request or task"
+npm install -g jaiph
 ```
 
-Arguments after the `.jh` path are bound **by position** to the named parameters of `workflow default` (for example `workflow default(task)` → `${task}` in the body; see [Language — Parameters and arguments](language.md#parameters-and-arguments)).
-
-### Workspace root
-
-The CLI sets **`JAIPH_WORKSPACE`** to a **workspace root** before it spawns the workflow runner. For **`jaiph run`**, detection starts at the **directory containing the entry `.jh` file** and walks **upward** until it finds **`.jaiph`** or **`.git`**, with guards for shared temp trees (see `detectWorkspaceRoot` in `src/cli/shared/paths.ts`). If no marker is found before the filesystem root, the **starting directory** (the entry file’s directory) is used as the workspace. That root is what import resolution and **`.jaiph/libs/`** are scoped to (see [Libraries](libraries.md)).
+The npm package exposes `dist/src/cli.js` as the `jaiph` command (Node executes it) plus the compiled runtime tree under `dist/src/`.
 
-Managed **script** steps receive **`$1`**, **`$2`**, … only for arguments passed at the corresponding **`run`** step in the workflow — not automatically from the CLI unless the workflow forwards them (see [Language — `run`](language.md#run--execute-a-workflow-or-script)).
+## 2. Add jaiph to PATH (if needed)
 
-### Run artifacts
-
-Each run writes durable files under **`.jaiph/runs/`**. See [Runtime artifacts](artifacts.md) for layout, per-step logs, the JSONL timeline, and inbox files.
-
-### Formatting
-
-Enforce consistent style across `.jh` / `*.test.jh` files (paths must end in **`.jh`**):
+If `jaiph --version` reports `command not found`, add the install directory to `PATH`:
 
 ```bash
-jaiph format flow.jh           # rewrite in place
-jaiph format --check flow.jh tests/flow.test.jh   # CI-safe: exits 1 when changes needed
-jaiph format --indent 4 flow.jh
+export PATH="$HOME/.local/bin:$PATH"   # curl installer
 ```
 
-Use your shell’s globbing if you pass multiple files (for example `jaiph format --check *.jh` when your shell expands the pattern). See [CLI — `jaiph format`](cli.md#jaiph-format).
-
-### Validate, test, and libraries (next steps)
-
-- **`jaiph compile`** — validates the import closure (**`validateReferences` only**); no script emission or runner. See [Architecture — Summary](architecture.md#summary) and [CLI](cli.md).
-- **`jaiph test`** — runs **`*.test.jh`** blocks in-process with mocks. See [Testing](testing.md).
-- **`jaiph install`** — fetches reusable modules into **`.jaiph/libs/`**; workspace root is detected from your **current working directory** (not the entry-`.jh` rule used by **`jaiph run`**). See [Libraries](libraries.md) and [CLI — `jaiph install`](cli.md#jaiph-install).
+or prepend npm's global bin directory: `export PATH="$(npm prefix -g)/bin:$PATH"`.
 
-## Workspace setup
-
-### Initialize with `jaiph init`
+## 3. (Optional) Switch versions
 
 ```bash
-jaiph init              # current directory (default)
-jaiph init path/to/repo # explicit workspace root
+jaiph use nightly      # rolling nightly prerelease
+jaiph use 0.10.0       # reinstalls the v0.10.0 release binary
 ```
 
-This creates **`.jaiph/`** under the chosen root with:
-
-- **`.jaiph/.gitignore`** — ignores ephemeral **`runs/`** and **`tmp/`** under **`.jaiph/`** (workflows and libraries stay tracked).
-- **`.jaiph/bootstrap.jh`** — executable **`workflow default`** whose template uses a triple-quoted multiline **prompt**; it tells the agent to read **`.jaiph/SKILL.md`**, scaffold workflows under **`.jaiph/`**, and end with **WHAT CHANGED** and **WHY**; the workflow **`log`**s the result.
-- **`.jaiph/SKILL.md`** — copied when **`jaiph init`** can resolve a skill markdown file: if **`JAIPH_SKILL_PATH`** is set **and** that path exists, it wins; otherwise the CLI tries install-relative paths (`jaiph-skill.md` beside the packaged tree — curl install: **`~/.local/bin/.jaiph/jaiph-skill.md`** next to **`src/`** — then **`docs/jaiph-skill.md`** beside the package when present), then **`docs/jaiph-skill.md`** under the current working directory. Resolution lives in **`resolveInstalledSkillPath()`** (`src/cli/shared/paths.ts`). If nothing resolves, the skill file is skipped and a message tells you to set **`JAIPH_SKILL_PATH`** and run **`jaiph init`** again. Same rules as [CLI — `jaiph init`](cli.md#jaiph-init).
+`jaiph use` re-invokes the step-1 installer (`JAIPH_INSTALL_COMMAND`, default `curl -fsSL https://jaiph.org/install | bash`) with `JAIPH_REPO_REF` set to `nightly` or `v<version>`, then replaces `~/.local/bin/jaiph` (or `JAIPH_BIN_DIR`). Override `JAIPH_INSTALL_COMMAND` for forks, offline bundles, or local scripts.
 
-Run the bootstrap workflow:
+## Verification
 
 ```bash
-./.jaiph/bootstrap.jh
+jaiph --version
 ```
 
-### Workspace convention
-
-By convention, keep Jaiph workflow files under **`<project_root>/.jaiph/`** so workspace-root detection and agent setup stay predictable. The runtime sees **`JAIPH_WORKSPACE`** as that detected root (same root the validator uses for **`.jaiph/libs/`** imports). Optional Docker sandboxes use a separate mount contract; see [Sandboxing](sandboxing.md) for how **`jaiph run`** selects container vs host execution.
+This prints `jaiph <version>` (sourced from the installed release at build time). After `jaiph use <version>`, re-run `jaiph --version` and confirm the printed version matches (for example `jaiph 0.10.0` after `jaiph use 0.10.0`).
 
-### Building from source
+## Related
 
-Contributors typically clone the repo, run **`npm install`** and **`npm run build`**, and invoke **`node dist/src/cli.js`** (or build the standalone Bun binary per [Contributing](contributing.md)). That path is separate from the curl/npm end-user install above.
+- [Architecture — Distribution: Node vs Bun standalone](architecture.md#distribution-node-vs-bun-standalone) — what the installer downloads and why the binary is self-contained.
+- [Why Jaiph](why-jaiph.md) — the design context behind the single-binary distribution.
diff --git a/docs/spec-async-handles.md b/docs/spec-async-handles.md
index 4d260f60..9b10380d 100644
--- a/docs/spec-async-handles.md
+++ b/docs/spec-async-handles.md
@@ -1,171 +1,88 @@
 ---
 title: "Spec: Async Handles"
 permalink: /spec-async-handles
+diataxis: explanation
 redirect_from:
   - /spec-async-handles.md
 ---
 
-# Async Handles — `Handle<T>` Value Model
+# Async Handles — the value model
 
-## Context
+Many workflows have a moment where two pieces of work are independent: an analysis and a build, two prompts with different backends, a slow fetch alongside cheap local checks. They could overlap, but only if the runtime keeps track of every started piece of work and refuses to let the workflow complete until each one has resolved.
 
-Concurrent work is a common orchestration problem: independent steps could run in parallel while the main line of the workflow keeps going, as long as completion and errors are accounted for before the surrounding scope finishes.
+Jaiph addresses this with **`run async`** and a value type called `Handle<T>`. This page is about the *value model* — what a handle represents, when it becomes a real string, and how that interacts with recovery and joins. For the surface syntax see [Language — `run async`](language.md#run-async-concurrent-execution-with-handles) and [Grammar — `run async`](grammar.md); for the runtime implementation see [Architecture — Core components](architecture.md#core-components).
 
-Jaiph addresses that with **`run async`**: the runtime starts a normal `run` target in the background, exposes the in-flight result as a **handle**, and **joins** every handle created in the current step list when that list ends—so nothing is left dangling. This page is about that **value model** (when a handle becomes a real string, how failures propagate, and how events look on the wire). Syntax lives in [Language — `run async`](language.md#run-async--concurrent-execution-with-handles) and [Grammar — `run async`](grammar.md#run-async--concurrent-execution-with-handles). For where this fits in the interpreter, events, and CLI progress, see [Architecture](architecture.md).
+## What a handle is
 
-**Implementation:** All of this runs in **`NodeWorkflowRuntime`** (`src/runtime/kernel/node-workflow-runtime.ts`)—the same AST interpreter described in [Architecture — System overview](architecture.md#system-overview). A handle is bookkeeping on an in-flight **`run`**; it is joined at the [`executeSteps`](#implicit-join) scope that registered it. **`async_indices`** for events are threaded through **`AsyncLocalStorage`** and emitted via **`RuntimeEventEmitter`** (see [Architecture — Core components](architecture.md#core-components) and [CLI progress reporting pipeline](architecture.md#cli-progress-reporting-pipeline)).
+`run async ref(args)` schedules the same target a synchronous `run` would have called — a workflow or a script — but does **not block** the current step list. The return value is a `Handle<T>`, where `T` is whatever a synchronous `run` would have produced (a workflow's `return`, or a script's trimmed stdout on success).
 
-## Overview
+In the runtime variable map the handle is stored as an opaque token of the form `__JAIPH_HANDLE__<id>`. That token is bookkeeping, not a value. The first place that actually *needs* the value awaits the scheduled work, then **replaces** the binding with the resolved string. After that, the variable behaves like any other string.
 
-`run async ref(args)` schedules the same **`run` target** (workflow or script) **without blocking** the current step list. The value is a **handle**—conceptually `Handle<T>` where `T` is what a synchronous `run` would have produced (workflow **`return`**, or trimmed script stdout on success). In the runtime variable map the handle is stored as an opaque string token (`__JAIPH_HANDLE__` + numeric id); the first **non-passthrough** use that needs the real value **awaits** the scheduled work, then **replaces** that binding with the resolved string (or clears it on failure—see [Resolution](#resolution)).
+The model has two ideas that are easy to mix up:
 
-## Handle creation
+1. **Eager start.** The moment `run async` executes, the work is scheduled. The handle is the receipt.
+2. **Lazy resolve.** The handle is not the value yet. The token can sit in its binding while later steps run; the wait happens at the first resolving read or at the implicit join.
 
-```jaiph
-script noop = `echo ok`
+This split is what makes `run async` cheap to write. You start work and continue. You only pay the wait cost where you genuinely depend on the result.
 
-workflow bg() {
-  run noop()
-}
+## Passthrough vs reads that force resolution
 
-workflow default() {
-  const h = run async bg()
-  run async bg()
-}
-```
+The runtime scans for `${name}` substrings in the places where a handle's contents would actually matter, and resolves any binding that still holds a token. The dividing line is:
 
-- `const h = run async bg()` — `h` holds a handle. Work for `bg()` starts immediately; later steps can overlap with it.
-- `run async bg()` — a handle is still created and **tracked** for [implicit join](#implicit-join) even if you do not store it in a variable.
+- **Passthrough** — the step does not look at the value. Examples: the `const h = run async foo()` binding itself (the token stays in the variable until something reads it); a bare `run async` with no capture variable (the handle is still tracked for the implicit join).
+- **Resolving reads** — the step needs the string. Examples: any `${h}` interpolation (`log "result: ${h}"`, send RHS, prompt body, shell one-liner); passing `h` as an argument to `run` or `ensure` (bare-identifier args are rewritten as `${name}` before the call); using `h` as the subject of `if` / `match`; a bare-identifier `const h2 = h1` (parser sugar for `"${h1}"`).
 
-This is not “fire and forget” in a scheduler sense: the runtime **registers** every `run async`, captured or not, and still **joins** it when the [scope below](#implicit-join) allows.
+There is no `await` keyword and no copy-without-reading form. To keep work overlapping, read the handle late: hold it in the original binding and avoid `${…}`, bare-identifier args to `run`/`ensure`, or `if`/`match` subjects until you need the value. When a resolving read fails (the underlying `run` ended non-zero), the binding is cleared to an empty string in that scope.
 
-**Forms:** Only `run async …` as a statement or as `const name = run async ref(args)` is supported. **`recover` / `catch` blocks attach only to the statement form** (`run async foo() recover …` / `catch …`); `const … = run async …` cannot carry a recovery block (the parser allows only a plain call there—see `const-rhs.ts` / `workflow-brace.ts`).
-
-## Resolution
-
-A handle resolves to the `run` result: workflow **`return`**, or **trimmed script stdout** on success; on failure, resolution carries the same failure shape as a synchronous `run` (and can fail the block or the join, depending on where resolution happens). Resolution is triggered on the first **non-passthrough** read of the value.
-
-`resolveHandlesInInput` scans for `${name}` substrings (identifier form) and resolves each binding that still holds a handle token; **`${run …}` / `${ensure …}`** **inline captures** run only after that scan (see `interpolateWithCaptures`).
-
-### Reads that force resolution
-
-The runtime scans for `${name}` in the places below. **Call arguments:** at parse time, bare identifiers in a `run` / `ensure` argument list are rewritten to **`${name}`** (`commaArgsToSpaced` in `src/parse/core.ts`), so they go through the same `resolveHandlesInInput` path as explicit interpolation (see [Grammar — Call-site arguments](grammar.md#call-site-arguments) and [Language — `run`](language.md#run--execute-a-workflow-or-script)).
-
-| Access pattern | Example | Forces resolution? |
-| --- | --- | --- |
-| String / template interpolation (`log`, `logerr`, `fail`, `return`, `const … = "…"`, shell one-liners, and other orchestration strings using `interpolateWithCaptures`) | `log "result: ${h}"` | Yes |
-| Arguments to `run` / `ensure` (tokens that embed `${…}` or bare identifiers rewritten for the callee) | `run downstream(h)` or `run downstream("pref_${h}")` | Yes |
-| Prompt body (string, identifier, or triple-quoted) before the model call | `prompt "ctx: ${h}"` | Yes |
-| `if` subject variable | `if h == "ok" { ... }` | Yes — subject is resolved when it is still a handle token |
-| `match` subject | `match h { ... }` | Yes |
-| Literal or `var` send RHS that contains `${…}` | `findings <- "${h}"` or `findings <- ${h}` (see send forms in [Inbox](inbox.md)) | Yes — `${name}` tokens in the payload are scanned |
-
-**Send RHS:** For the `var`-style RHS, use `${name}`; a bare `$name` is not treated as a handle reference in the Node runtime.
-
-**`for_lines`:** The loop source is read as a plain variable value **without** passing through handle resolution. If the source is still a handle token, you get the opaque string (or wrong iteration)—materialize the value first (for example `const text = "${h}"` on an expression RHS, or another step that interpolates the handle) before `for_lines`.
-
-### Passthrough (does not force resolution)
-
-Only the step that **starts** the async work avoids waiting on the result:
-
-| Access pattern | Example | Forces resolution? |
-| --- | --- | --- |
-| `const` binding from `run async` | `const h = run async foo()` | No — stores the handle token; work is already scheduled |
-| Bare `run async` (no capture variable) | `run async bar()` | No read of a value here; the handle still [joins](#implicit-join) at scope end |
-
-Any later use that needs a real string—including the first `${h}` inside a `const` RHS, or passing `h` as a `run` / `ensure` argument—forces resolution. There is no separate “copy handle without reading” statement; aliasing is done by passing the name through steps that eventually interpolate or join.
-
-If resolution fails (non-zero underlying `run`), the step or join fails with the same error shape as a synchronous `run`; the bound variable is cleared to an empty string in the scope where resolution ran.
-
-After a **successful** resolution, the variable holds the result string; further reads are ordinary string reads.
+`for_lines` is the one surprising exception: it reads the loop source as a plain variable value *without* passing through handle resolution. If the source is still a handle token, the loop sees the token and iterates wrong. Materialize the value first (`const text = "${h}"`) before iterating.
 
 ## Implicit join
 
-When the **step list** you are in finishes, the runtime **awaits every `run async` handle** created in that **`executeSteps`** invocation (`localHandleIds` in `node-workflow-runtime.ts`). Await happens **in creation order** (sequential `await`), not with a single `Promise.all`. That is the “implicit join”: it is per **block**, not merely per workflow name—for example, handles created only inside an `if` body are joined at the end of that **inner** list, before control continues after the `if`.
-
-For an **entry** workflow, **inbox dispatch** runs only **after** `executeSteps` returns successfully: the runtime finishes the step list and the implicit join first, then drains the channel queue ([Inbox — drain timing](inbox.md#who-registers-routes-and-who-drains), [Architecture — channels](architecture.md#channels-and-hooks-in-context)).
-
-- If all joined work succeeds, the outer step list continues or the workflow **returns** normally.
-- If any joined handle ends with a **non-zero** status, the scope fails; several failures are aggregated in one error. Messages refer to the **`run async`** target ref string(s). Handles that were **never read** still participate in this join.
-- If an async branch ends with a **`return`** from a `catch`/`recover` body (the same `recoverReturn` path as synchronous `run`/`ensure`), the join can propagate that **workflow return value** to the parent—mirroring non-async recovery. If multiple branches set `recoverReturn`, the **first** joined branch that does so wins (`returnValue` is only set while still `undefined`).
-
-This preserves the “all async work settled before the workflow could complete” guarantee, while still allowing overlap **until** an explicit read or a scope boundary forces ordering.
-
-## `recover` and `catch`
-
-### `recover` (retry loop)
-
-`recover` on `run async` mirrors non-async `recover`: after a failing run, the runtime executes the **repair** body, then **re-runs** the `run` target, until success or the [recover limit](#retry-limit) is reached. The async branch is scheduled once as a **single** promise; retries happen **inside** that branch.
-
-```jaiph
-script flaky = `test -f .marker`
-script touch_marker = `touch .marker`
-
-workflow maybe_ok() {
-  run flaky()
-}
-
-workflow repair() {
-  run touch_marker()
-}
+When a step list **runs through to its normal end** — every step executed without an early `return`, `fail`, or error exit — the runtime **awaits every `run async` handle created in that list**, captured or not. This is the implicit join, and the unit of joining is the `executeSteps` invocation, not the workflow. Handles created inside an `if` body are joined at the end of that inner block, before control continues after the `if`. An early `return` or `fail` exits the list immediately and does **not** run the join for handles already scheduled there.
 
-workflow default() {
-  run async maybe_ok() recover(err) {
-    log "repairing: ${err}"
-    run repair()
-  }
-}
-```
+The "uncaptured handles still join" rule is part of the value model. There is no opt-out on the normal-exit path: starting async work without storing the handle does not skip the wait. The runtime keeps a list of every handle created in the current step list and walks it on normal exit, in creation order, awaiting each one sequentially.
 
-Execution inside the promise:
+The guarantee this preserves is straightforward: when a step list reaches its normal end, **every piece of async work it scheduled has settled**. That is the property that lets the rest of the workflow — return values, channel drains, parent step lists — reason about completion without thinking about background tasks. For an entry workflow frame, the order is: the step list runs, the implicit join runs, *then* that frame's channel queue drains ([Inbox](inbox.md)). If several joined branches end with a `catch`/`recover` `return`, the first such branch in creation order supplies the parent workflow return value.
 
-1. Run the target once (`maybe_ok()`).
-2. While the last result is a failure and the repair-cycle count is still within `run.recover_limit`, run the `recover` body with `err` set to the merged **stdout+stderr** of the failure, then **run the target again** unless the repair body failed or used `return` to supply a result.
-3. A `return …` from inside the repair body **stops** the loop and becomes the async branch’s result (no further retries of the original target).
-4. If the limit is exhausted and the target still fails, the handle result is that failure—like synchronous `recover`.
+If any joined handle ended with a non-zero status, the join itself fails; multiple failures are aggregated into a single error.
 
-So the repair body runs only **after** a failing attempt, and each allowed cycle is “repair, then retry,” not “retry, then repair” on the first failure.
+## Recover and catch on async handles
 
-### `catch` (single-shot, surface keyword `catch`)
+Async handles compose with the same two error-handling forms that synchronous `run` uses:
 
-Use `catch` for a **one-time** error handler: if `foo()` fails, the `catch` body runs **once**; there is no automatic retry of `foo()`.
+- **`recover` is a retry loop.** After a failed attempt, the repair body runs and the target is retried, until either it succeeds or the recover limit is exhausted (`run.recover_limit`, default 10). On `run async`, the entire loop runs *inside the single async branch* — it is not a fan-out of attempts.
+- **`catch` is a one-shot handler.** If the target fails, the catch body runs once. If catch succeeds, the async branch is considered successful for the join. If catch ends with a `return`, that value becomes the branch's contribution to a parent workflow return.
 
-```jaiph
-run async foo() catch(err) {
-  log "caught: ${err}"
-}
-```
+These compose only with the **statement form** of `run async`. A captured `const h = run async foo()` cannot carry a `recover` or `catch` block — the parser allows only a plain call there. Use a separate workflow that wraps the recovery if you need both a captured handle and a recover loop around its target.
 
-The `catch` keyword is the user-facing name; the failure payload is the merged **stdout + stderr** text, as in synchronous `run … catch`. If the catch body succeeds without returning, the async branch is treated as **success** for join and handle resolution (status 0)—the original failure is not rethrown. A `return` from the catch body can supply a return value via the same **`recoverReturn`** path as synchronous recovery. See [Language — `catch`](language.md#catch--failure-recovery) and [Grammar](grammar.md).
+## Why no `await` keyword
 
-### Retry limit
+The reason `await` is not part of the language is that the implicit join already makes the synchronization point clear on the normal-exit path: it is the end of the step list. Adding `await` would create a second way to express the same boundary and a third state ("started but neither read nor joined yet") that users would have to reason about. Keeping the model to two states — token in the variable map, or resolved string — keeps the failure modes small.
 
-Limits apply to the **retry loop** in `recover` (including `run async … recover`).
+The trade-off is that overlapping a long-running async task with subsequent steps requires care: read the handle late, not early, or the read becomes a serializing point.
 
-- **Meaning:** `run.recover_limit` (default **10**) is the maximum number of **repair cycles** the runtime will execute after a failure: each cycle runs the `recover` body (when applicable) and then **re-runs** the target. Including the **first** attempt, the target may run **up to `recover_limit + 1` times** before the loop stops and surfaces the last failure.
-- **Config:** top-level `config { run.recover_limit = N }` in the **`.jh` file** whose module metadata is keyed by **`scope.filePath`** for that step list (`resolveRecoverLimit` reads `graph.modules.get(filePath)?.ast.metadata`). That is the file **currently executing** those steps—not necessarily the CLI entry file when you are deep in a nested `run`. Per-workflow nested `config { }` blocks are not read for this knob.
+## Where async handles are allowed
 
-## Progress and events
+`run async` is intentionally a **workflow-only** construct:
 
-Concurrent `run async` branches are tagged with a chain of **1-based indices** stored on `STEP_START`, `STEP_END`, `LOG`, and `LOGERR` events as `async_indices`; the CLI prints them as subscript prefixes on the live stream ([Architecture — CLI progress reporting pipeline](architecture.md#cli-progress-reporting-pipeline)). Indexing uses `AsyncLocalStorage` in the runtime so nested async work gets a deeper chain. Resolving a handle does not emit a separate event—the branch’s own step/log events are the timeline.
+- **Rules reject statement-form `run async`.** The validator emits `E_VALIDATE` for `run async ref(…)` in a rule body. The primitive is defined for workflows only — fan-out without an explicit join inside a rule body would break the read-only rule contract.
+- **Inline scripts reject it.** Inline `run \`body\`(args)` is shorthand for a one-off shell step; spawning it with `run async` is not a supported shape. Move the body into a named `script` and `run async` that.
+- **A `run async` call must be a real reference with parentheses.** Bare names are not async-able.
 
-In **`jaiph test`**, the runner sets `suppressLiveEvents: true` on the in-process runtime ([Architecture — Test runner integration](architecture.md#test-runner-integration-testjh-in-the-kernel)), which silences **`__JAIPH_EVENT__`** on stderr only; durable `run_summary.jsonl` (and handle semantics) behave like `jaiph run`.
+These restrictions are enforced at compile time (parser or validator), not at runtime.
 
-PTY E2E coverage for interleaved async progress: `e2e/tests/131_tty_async_progress.sh` ([Testing — PTY-based TTY tests](testing.md#pty-based-tty-tests)).
+## Async indices and the progress tree
 
-## Constraints
+Concurrent branches are tagged with a chain of 1-based indices stored on `STEP_START`, `STEP_END`, `LOG`, and `LOGERR` events as `async_indices`. The CLI renders them as subscript prefixes on the live event stream, so interleaved branches stay legible in the progress tree. Indexing uses `AsyncLocalStorage` in the runtime, which means nested async work — a `run async` inside a `run async` — gets a deeper chain rather than colliding with its parent.
 
-- **`run async`** is only allowed in **workflows** — not in **rules** (the validator enforces this).
-- **`run async`** is **not** supported for **inline scripts** (`` `body`(args) ``, ` ```…``` `, or similar).
-- A **`run async`** call must be a **normal reference with parentheses**: `run async name()` or `run async name(args)` — not a bare name.
-- There is **no `await` keyword**; you either **read** the value (triggers resolution) or hit a **join** at the [step-list boundary](#implicit-join).
-- “Uncaptured” `run async` still **joins**; there is no opt-out to skip waiting at scope end.
+Resolving a handle does **not** emit a separate event. The branch's own step and log events are the timeline; the resolve is just the point where a particular consumer stopped passing the token along.
 
-### Relationship to the rest of the system
+## Why this design, in one paragraph
 
-- **Local / Docker / `jaiph test`** share the same [`NodeWorkflowRuntime`](architecture.md#core-components) code path; sandboxing changes **where** the process runs, not how handles are implemented.
-- **`buildScripts` / `JAIPH_SCRIPTS`** only materialize **`script`** bodies; `run async` does not add new on-disk artifacts ([Architecture — Emit artifacts](architecture.md#emit-artifacts)).
+Async handles in Jaiph are a token bookkeeping model on top of normal `run`. They are eager to start, lazy to resolve, mandatory to join when a step list reaches its normal end, and otherwise indistinguishable from synchronous values once they have resolved. There is no scheduler, no thread pool, no `await`, no detached "fire and forget" — just a small contract that lets steps overlap until something genuinely needs the answer.
 
-Integration-style checks for handles and recovery live in `integration/sample-build/recover-handle.test.ts` (e.g. implicit join, passing handles into `run`, `run async … recover`).
+## Related
 
-If this spec disagrees with **`src/runtime/kernel/node-workflow-runtime.ts`**, trust the source and update [Grammar — `run async`](grammar.md#run-async--concurrent-execution-with-handles) and [Language — `run async`](language.md#run-async--concurrent-execution-with-handles) accordingly.
+- [Inbox & Dispatch](inbox.md) — the drain step that runs *after* the implicit join.
+- [Architecture — CLI progress reporting pipeline](architecture.md#cli-progress-reporting-pipeline) — how `async_indices` shape the live progress tree.
+- [Language — `run async`](language.md#run-async-concurrent-execution-with-handles) and [Grammar — `run async`](grammar.md) — surface syntax.
diff --git a/docs/testing.md b/docs/testing.md
index 106b4b0b..0a0cf484 100644
--- a/docs/testing.md
+++ b/docs/testing.md
@@ -1,59 +1,28 @@
 ---
-title: Testing
-permalink: /testing
+title: Write & run tests
+permalink: /how-to/testing
+diataxis: how-to
 redirect_from:
+  - /testing
   - /testing.md
 ---
 
-# Testing Jaiph Workflows
+# Write & run tests
 
-**Scope:** this page is about **authoring** `*.test.jh` workflow tests (`jaiph test`) and how those pieces relate to the same [Node workflow runtime](architecture.md#core-components) as `jaiph run`. It also summarizes **repository** test layers (compiler txtar, golden AST, shell E2E) that contributors run in CI.
+This recipe authors a `*.test.jh` file with mocked prompts and stubbed dependencies, then runs it through `jaiph test`. Test blocks execute the workflow under test in-process through `NodeWorkflowRuntime` — the same interpreter `jaiph run` uses — and assert on captured output.
 
-## Why workflow tests exist
+`jaiph test` runs on the host in-process — no Docker sandbox, no credential pre-flight, and no hooks. Mock every `prompt` step (and stub external workflows, rules, or scripts when needed): when no mocks are configured, or when a queued `mock prompt "…"` list is exhausted, the runtime falls through to the real agent backend the same way `jaiph run` would. Pattern-based `mock prompt { … }` blocks do not fall through — an unmatched prompt fails the test unless a `_` default arm catches it. The goal is fixed inputs and checkable outputs so refactors and CI catch regressions deterministically.
 
-In production, a workflow’s behavior depends on live models, host timing, and local files. A harness fixes inputs (mock prompts, stubbed workflows/scripts), runs the same interpreter the CLI uses for real runs, and checks outputs with small assertions so CI and refactors can catch regressions without external services.
+## Prerequisites
 
-## What Jaiph provides
+- The workflow under test lives in a separate `.jh` file you can import (recommended; keeps test files small).
+- You know the workflow's parameters and what `prompt` calls it makes.
 
-Jaiph includes a built-in test harness: test files (`*.test.jh`) mock prompt responses, stub workflows, rules, and scripts, execute workflows through `NodeWorkflowRuntime` **in-process**, and assert on captured output — without calling real LLMs or depending on external state. Unlike `jaiph run`, the harness does not spawn `node-workflow-runner`: after `buildScripts`, the CLI calls `runTestFile()` in `src/runtime/kernel/node-test-runner.ts`. There is no Docker mode for `jaiph test`; workflows under test always run on the host. **How** that fits `buildRuntimeGraph`, `suppressLiveEvents`, and artifact writes is in [Architecture — Test runner integration](architecture.md#test-runner-integration-testjh-in-the-kernel).
+## 1. Create the test file
 
-## File naming and layout
+Test files end in `.test.jh`. Convention: keep them next to the module under test or under a top-level `tests/` / `e2e/` directory.
 
-Test files use the `.test.jh` suffix (for example `workflow_greeting.test.jh`).
-
-A test file supports the same top-level forms as any `.jh` file (`import`, `config`, `workflow`, etc.), but the CLI only executes `test "..." { ... }` blocks. Other declarations are parsed into the runtime graph — for example, a local `workflow` is visible to single-segment references.
-
-**Recommended style:** keep test files to `import` statements and `test` blocks. Define the workflows under test in separate modules so files stay small and focused.
-
-Import paths in `import "..." as alias` resolve relative to the test file's directory, with the same extension handling as ordinary modules (`.jh` is appended when omitted). See [Grammar — Lexical notes](grammar.md#lexical-notes).
-
-## Running tests
-
-```bash
-# All *.test.jh files under the detected workspace root (recursive)
-jaiph test
-
-# All tests under a directory (recursive)
-jaiph test ./e2e
-
-# One file
-jaiph test ./e2e/workflow_greeting.test.jh
-
-# Equivalent shorthand (a *.test.jh path is treated as jaiph test)
-jaiph ./e2e/workflow_greeting.test.jh
-```
-
-`jaiph path.test.jh` without the `test` subcommand is only accepted when the **first** CLI argument ends with `.test.jh` **and** `path` resolves to an existing file (`src/cli/index.ts`); otherwise the token is treated as an unknown command.
-
-**Discovery:** With no path argument, Jaiph scans the detected workspace root recursively; with a directory, it scans that tree. Only `*.test.jh` files are collected: the name must end in `.jh` and the stem must end with `.test` (see `walkTestFiles` in `src/transpile/build.ts`). Unlike `walkjhFiles` (used when compiling ordinary `*.jh` trees), test discovery does **not** skip `.jaiph/` subtrees, so stray `*.test.jh` files under `.jaiph/...` would be picked up — keep test modules in normal source locations. The workspace root—for locating imports and setting `JAIPH_WORKSPACE`—is from `detectWorkspaceRoot` in `src/cli/shared/paths.ts`: walk upward from a starting directory (the current working directory, the directory you passed, or the parent of a single test file) until `.jaiph` or `.git` is found, subject to a few guards for shared temp directories and nested `.jaiph/tmp` layouts; if nothing matches, the resolved starting directory is used as the root.
-
-If no `*.test.jh` files are found, the command prints an error and exits with status 1. A file must contain at least one `test` block; otherwise the CLI reports a parse error. Passing a plain `*.jh` file that is not named `*.test.jh` is rejected — use `jaiph run` for those.
-
-## Test block syntax
-
-Each `test` block is a named test case containing ordered steps:
-
-```jaiph
+```jh
 import "workflow_greeting.jh" as w
 
 test "runs happy path and prints PASS" {
@@ -64,25 +33,25 @@ test "runs happy path and prints PASS" {
 }
 ```
 
-Inside a test block, steps execute in order. **`#` line comments** and **blank lines** are allowed between steps (they are ignored by the runner).
-
-### Mock prompt (inline)
+A test file can have any top-level construct (`import`, `config`, `workflow`, …), but the CLI only executes `test "..." { ... }` blocks. `#` line comments and blank lines are allowed between steps inside a test block.
 
-Queues a fixed response for the next `prompt` call in the workflow under test. Multiple `mock prompt` lines queue in order — one is consumed per `prompt` call.
+## 2. Queue mock prompt responses
 
-```jaiph
-mock prompt "hello from mock"
+```jh
+mock prompt "first response"
 mock prompt "second response"
-mock prompt myConstName
 ```
 
-Use a **double-quoted string** (escapes: `\"`, `\n`, `\\`) or a bare identifier for a [test `const`](#test-block-constants) defined earlier in the block. **Single-quoted** mock text is rejected at parse time — use double quotes.
+Multiple `mock prompt` lines queue in order — one is consumed per `prompt` call. Strings must use **double quotes** (with `\"`, `\n`, `\\` escapes). A bare identifier refers to a test-block `const` declared earlier as a double-quoted string:
 
-### Mock prompt (content-based dispatch)
+```jh
+const greeting = "hi"
+mock prompt greeting
+```
 
-Dispatches different responses based on the prompt text using pattern matching. Arms are tested top-to-bottom; the first match wins.
+For content-based dispatch, use the pattern form. Do not mix queued `mock prompt "…"` / `mock prompt <const>` lines with a `mock prompt { … }` block in one test — the compiler rejects that (`E_VALIDATE`). Separate tests in the same file may use different styles:
 
-```jaiph
+```jh
 mock prompt {
   /greeting/ => "hello"
   /farewell/ => "goodbye"
@@ -90,135 +59,73 @@ mock prompt {
 }
 ```
 
-Each arm is `pattern => "response"`. Patterns can be:
-
-- **String literal** (`"greeting"`) — exact match against the prompt text
-- **Regex** (`/greeting/`) — tested against the prompt text
-- **Wildcard** (`_`) — matches anything (like a default/else branch)
-
-Without a `_` wildcard arm, an unmatched prompt fails the test.
+Arms are evaluated top-to-bottom; the first match wins. Without a `_` wildcard arm, an unmatched prompt fails the test.
 
-Do not combine `mock prompt { ... }` with inline `mock prompt "..."` in the same test block — when a block mock is present, inline queue entries are ignored.
+## 3. (Optional) Stub workflows, rules, or scripts
 
-### Mock workflow
+Replace a workflow, rule, or script body for this test case. Parentheses are required:
 
-Replaces a workflow body for this test case with Jaiph steps:
-
-```jaiph
+```jh
 mock workflow w.greet() {
   return "stubbed greeting"
 }
-```
-
-**Syntax:** `mock workflow <ref>(<params>) { ... }` — **parentheses are required**, even when there are no parameters (`()`). The legacy form `mock workflow ref {` without `()` is rejected with a fix hint.
-
-The reference format is `<alias>.<workflow>` (preferred) or `<name>` for a workflow defined in the test file itself.
-
-### Mock rule
-
-Same as mock workflow, but for rules (body uses Jaiph steps, not shell):
 
-```jaiph
 mock rule w.validate() {
   return "stubbed validation"
 }
-```
-
-### Mock script
 
-Stubs a module `script` block. The body is **shell**, like a real `script` step (the runner executes it as a managed shell mock — see `runtime-mock.ts`):
-
-```jaiph
 mock script w.helper() {
   echo "stubbed script"
 }
 ```
 
-Test stubs use `mock script`, not `mock function`; the latter is a parse error with a fix hint.
-
-`mock script` uses the same **`ref() { ... }`** header shape as `mock workflow` / `mock rule`.
+`mock workflow` / `mock rule` use Jaiph steps in the body; `mock script` uses raw shell, like a real `script`.
 
-### Workflow run (with capture)
+## 4. Run the workflow and capture output
 
-Runs a workflow and captures its output into a variable:
-
-```jaiph
+```jh
 const response = run w.default()
+const response = run w.default("my input")     # with argument
+const response = run w.default() allow_failure # accept non-zero exit
 ```
 
-**Capture semantics** (see `runTestBlock` in `node-test-runner.ts`) pick the first branch that applies:
-
-1. **Exit code 0** and a **non-empty** `return` string from the workflow → that return value is captured.
-2. **Non-zero exit** and a non-empty runtime **error** string → the trimmed error string is captured (useful with `allow_failure` when you assert on failure output).
-3. **All other cases** (for example exit 0 with no return text, non-zero without an error string, or empty return) → the harness concatenates every `*.out` step capture in the run directory **in sorted filename order**; if listing or reading those files fails, it falls back to the runtime’s aggregated output string.
-
-The test still **fails** on non-zero exit unless `allow_failure` is set; capture content is independent of that check.
-
-**Variants:**
+`run` captures the workflow's return value when the exit is 0 and the return is non-empty; otherwise it falls back to the runtime error string (for non-zero exits) or the concatenated `*.out` files in sorted order.
 
-```jaiph
-# With an argument
-const response = run w.default("my input")
+## 5. Assert on the captured value
 
-# Allow failure
-const response = run w.default() allow_failure
-
-# With argument and allow failure
-const response = run w.default("my input") allow_failure
+```jh
+expect_contain     response "expected substring"
+expect_not_contain response "unwanted text"
+expect_equal       response "exact expected value"
 ```
 
-### Workflow run (no capture)
+The second argument is either a double-quoted literal or a test-block `const` name (bare identifier, not quoted).
 
-Runs a workflow without storing output. Still fails on non-zero exit unless `allow_failure` is appended:
+## 6. Run the tests
 
-```jaiph
-run w.setup()
-run w.setup("arg")
-run w.setup() allow_failure
+```bash
+jaiph test                            # discover *.test.jh under the workspace
+jaiph test ./e2e                      # restrict to a directory
+jaiph test ./e2e/workflow_greeting.test.jh  # single file
+jaiph ./e2e/workflow_greeting.test.jh       # shorthand: a *.test.jh path is treated as jaiph test
 ```
 
-### Test block constants
-
-Inside a `test` block, `const NAME = "value"` binds a test-local string (double-quoted literal only; no interpolation). Names can be used as:
-
-- `mock prompt NAME` — the next `prompt` consumes the bound value
-- the second argument to `expect_contain`, `expect_not_contain`, or `expect_equal` when written as a bare identifier (not quoted)
+The runner discovers `*.test.jh` files recursively. Zero matches in discovery mode print `jaiph test: no *.test.jh files found (nothing to do)` and exit **0** — safe to call unconditionally from CI.
 
-`const` bindings used for `mock prompt` or expected values must appear **before** the steps that read them. Capture variables (`const x = run w.default()`) are separate: only `const … = run …` introduces a capture name for `expect_*`.
+## Verification
 
-### Assertions
+A passing run prints one block per case followed by `✓ N test(s) passed` and exits **0**:
 
-After capturing workflow output, use these to check the result:
-
-```jaiph
-expect_contain response "expected substring"
-expect_not_contain response "unwanted text"
-expect_equal response "exact expected value"
 ```
-
-The second argument is either a **double-quoted string** (with `\"`, `\n`, and `\\` escapes) or a **`const` name** bound earlier in the same test block (see [Test block constants](#test-block-constants)):
-
-```jaiph
-const want = "expected substring"
-expect_contain response want
+testing workflow_greeting.test.jh
+  ▸ runs happy path and prints PASS
+  ✓ 0s
+✓ 1 test(s) passed
 ```
 
-`expect_equal` failures print a short `diff`-style `-` / `+` preview; substring assertions report lengths and the expected fragment.
-
-## Typed prompts
-
-When a workflow uses typed prompts (`returns "{ ... }"`), mock text must be a single line of valid JSON matching the schema so that parsing and field variables work correctly. Fields are accessed with dot notation — `${result.field}` — in `log`, `return`, and other interpolation contexts. See `e2e/prompt_returns_run_capture.test.jh` and `e2e/dot_notation.test.jh` for examples.
-
-## Pass/fail reporting
-
-Each test block runs in isolation. Failed assertions, harness/runtime errors while executing the block, or a workflow exiting non-zero (without `allow_failure`) mark that case as failed.
-
-The runner output looks like:
+A failure prints the failing assertion and exits non-zero:
 
 ```
-testing workflow_greeting.test.jh
-  ▸ runs happy path and prints PASS
-  ✓ 0s
   ▸ handles error case
   ✗ expect_contain failed: "response" (42 chars) does not contain "expected" 1s
 
@@ -226,207 +133,8 @@ testing workflow_greeting.test.jh
   - handles error case
 ```
 
-When all tests pass: `✓ N test(s) passed`. Exit status is 0 on full success, non-zero if any test failed.
-
-## How it works
-
-The CLI parses each test file and passes `test "…" { … }` blocks to `runTestFile()` (`src/runtime/kernel/node-test-runner.ts`). That path aligns with [Architecture — Test runner integration](architecture.md#test-runner-integration-testjh-in-the-kernel):
-
-1. **`buildScripts(testFileAbs, tmpDir, workspaceRoot)`** — same helper as `jaiph run`, with the **test file as the entrypoint** (`test.ts` calls it with the absolute path to the `*.test.jh` file). For a file entrypoint, the transpiler walks the test module and every file reachable by transitive **`import`** (see `collectTransitiveJhModules` in `src/transpile/build.ts`); it runs `validateReferences` / `emitScriptsForModule` per file and writes atomic **`script`** files into a temp `scripts/` tree. (If `buildScripts` were ever given a **directory** entrypoint, directory walks skip `*.test.jh` files — that is not how `jaiph test` invokes it.)
-2. **`buildRuntimeGraph(testFileAbs, workspaceRoot)`** — called **once per test file**; the same graph is reused for every `test` block in that file and for every `run` step inside them.
-3. For each block, a fresh temp layout sets env vars (below); workflows run in **`NodeWorkflowRuntime`**, not in a detached child.
-
-There is no Bash transpilation of full workflows on this path — only extracted `script` bodies are shell, same as production. The import graph is fixed for a single `jaiph test` process; **mutating imported `*.jh` on disk between blocks** is not a supported use case.
-
-## Environment variables
-
-For each workflow run inside a test block, the harness builds the runtime environment from `process.env` plus:
-
-| Variable | Value |
-|---|---|
-| `JAIPH_TEST_MODE` | `1` (selects mock prompt dispatch in `prompt.ts`) |
-| `JAIPH_WORKSPACE` | Project root (from `detectWorkspaceRoot`) |
-| `JAIPH_RUNS_DIR` | Per test block, `…/tmp/jaiph-test-block-*/.jaiph/runs` (ephemeral) |
-| `JAIPH_SCRIPTS` | Directory containing extracted `script` files from `buildScripts` (temp) |
-| `JAIPH_MOCK_RESPONSES_JSON` | JSON array of strings: sequential inline `mock prompt "…"` / `mock prompt <const>` responses (only when no `mock prompt { … }` block exists in that case) |
-| `JAIPH_MOCK_PROMPT_ARMS_JSON` | JSON payload for pattern-based `mock prompt { … }` arms (in-process dispatch in `mock.ts` / `prompt.ts`; mutually exclusive with the responses queue for that run) |
-
-You do not set mock variables or `JAIPH_TEST_MODE` yourself; the harness sets them for each `run …` step that starts an in-process `NodeWorkflowRuntime`. `JAIPH_TEST_MODE` routes prompt steps to the mock path in `prompt.ts`. Suppression of live `__JAIPH_EVENT__` lines on stderr is controlled by `suppressLiveEvents: true` on that runtime (see [Architecture — Test runner integration](architecture.md#test-runner-integration-testjh-in-the-kernel)), not by `JAIPH_TEST_MODE`; durable `run_summary.jsonl` writes still append. Production `jaiph run` uses a spawned `node-workflow-runner` child without `suppressLiveEvents`, so live events keep streaming to stderr there.
-
-## Organizing tests
-
-A Given / When / Then structure works well but is not required — comments and blank lines are fine:
-
-```jaiph
-import "app.jh" as app
-
-test "default workflow prints greeting" {
-  # Given
-  mock prompt "hello"
-
-  # When
-  const out = run app.default()
-
-  # Then
-  expect_contain out "hello"
-}
-```
-
-## Compiler tests (txtar format)
-
-Compiler tests verify parse and validate outcomes using a language-agnostic txtar format. Unlike the TypeScript-embedded tests in `src/`, these fixtures are plain text files that can be reused by alternative implementations (e.g. a Rust compiler).
-
-Test fixture files live in `test-fixtures/compiler-txtar/` as `.txt` files. Each file contains multiple test cases separated by `===` delimiters:
-
-```
-=== test name here
-# @expect ok
---- input.jh
-workflow default() {
-  log "hello"
-}
-
-=== another test
-# @expect error E_PARSE "unterminated workflow block"
---- input.jh
-workflow default() {
-  log "hello"
-
-```
-
-### Format rules
-
-- `=== <name>` starts a new test case. Everything until the next `===` (or EOF) belongs to that case.
-- `--- <filename>` starts a virtual file within the test case. Filenames must end in `.jh`.
-- `# @expect <directive>` declares the expected outcome and must appear before the first `---` marker.
-
-### Expect directives
-
-| Directive | Meaning |
-|-----------|---------|
-| `# @expect ok` | Parse + validate succeed with no errors |
-| `# @expect error E_CODE "substring"` | An error is thrown whose message contains both `E_CODE` and `substring` (substring must be **double-quoted** in the fixture — the runner parses that form only) |
-| `# @expect error E_CODE "substring" @L` | Same, and the error must be reported at line `L` (any column) |
-| `# @expect error E_CODE "substring" @L:C` | Same, and the error must be reported at line `L`, column `C` |
-
-### Single-file vs multi-file tests
-
-- **Single-file:** use `--- input.jh`. The runner parses and validates `input.jh`.
-- **Single test file:** use `--- input.test.jh` for test-specific fixtures.
-- **Multi-file:** use `--- main.jh` as the entry file plus additional `--- lib.jh` etc. The runner parses and validates `main.jh` as the entry.
-
-The entry file is determined by priority: `main.jh` if present, otherwise `input.jh`, otherwise `input.test.jh`, otherwise the first file.
-
-### Running compiler tests
-
-```bash
-npm run test:compiler
-```
-
-The runner (`test-infra/compiler-test-runner.ts`) discovers all `.txt` files in `test-fixtures/compiler-txtar/`, parses them, writes virtual files to a temp directory per case, runs `parsejaiph` + `validateReferences`, and asserts the expected outcome. Results are reported per test case via `node:test`. Compiler tests are also included in `npm test`.
-
-### Fixture files
-
-Test cases are organized by error type and single-vs-multi-module:
-
-| File | Cases | What it covers |
-|------|-------|----------------|
-| `test-fixtures/compiler-txtar/valid.txt` | 119 | Success cases — source compiles without error (single-module) |
-| `test-fixtures/compiler-txtar/parse-errors.txt` | 282 | `E_PARSE` error cases — syntax and grammar violations |
-| `test-fixtures/compiler-txtar/validate-errors.txt` | 92 | `E_VALIDATE`, `E_IMPORT_NOT_FOUND`, `E_SCHEMA` error cases (single-module) |
-| `test-fixtures/compiler-txtar/validate-errors-multi-module.txt` | 20 | Validation errors requiring imports (multi-file) |
-
-(Counts are lines matching `# @expect` in each `.txt` file; the runner also registers separate `node:test` meta-tests in `compiler-test-runner.ts`. Re-count after large fixture changes.)
-
-The initial cases were extracted from TypeScript test files across `src/parse/*.test.ts` and `src/transpile/*.test.ts`. Additional cases were written directly as txtar fixtures to cover compiler error paths that had no prior test coverage. Only tests that verify "source in, pass/fail out" qualify — tests that check AST structure or internal APIs remain in TypeScript.
-
-### Conventions
-
-- One `.txt` file per category.
-- Test names should be descriptive and unique within a file.
-- Keep test cases minimal — only include what is necessary to trigger the expected outcome.
-
-The format is documented in detail in `test-fixtures/compiler-txtar/README.md`.
-
-## Golden AST tests
-
-Golden AST tests verify that the parser produces the expected tree shape for successful parses. While compiler tests (txtar) cover pass/fail outcomes and E2E tests cover runtime behavior, golden AST tests lock in **what** the parser actually produced — so refactors cannot silently change tree structure.
-
-### How it works
-
-Each `.jh` fixture in `test-fixtures/golden-ast/fixtures/` is parsed and serialized to deterministic JSON (locations and file paths stripped, keys sorted). The result is compared against a checked-in `.json` golden file in `test-fixtures/golden-ast/expected/`.
-
-- **Txtar tests** = error messages and "this compiles."
-- **Golden AST tests** = parse tree shape for successful parses.
-- **E2E tests** = full CLI + runtime behavior.
-
-### Running golden AST tests
-
-```bash
-npm run test:golden-ast
-```
-
-Golden AST tests are also included in `npm test`.
-
-### Updating goldens
-
-When an intentional parser change alters AST shape, regenerate the golden files:
-
-```bash
-UPDATE_GOLDEN=1 npm run test:golden-ast
-```
-
-Review the diff to confirm the changes are expected, then commit the updated `.json` files.
-
-### Adding a new fixture
-
-1. Create a small, focused `.jh` file in `test-fixtures/golden-ast/fixtures/` (one concern per file).
-2. Run `UPDATE_GOLDEN=1 npm run test:golden-ast` to generate `test-fixtures/golden-ast/expected/<name>.json`.
-3. Review the generated JSON and commit both files.
-
-## Stress and soak testing
-
-For concurrency-sensitive behavior (for example inbox stress with many sends and route targets, or `run async` with interleaved managed steps), the repository includes shell-based E2E scenarios that go beyond single native tests:
-
-- High volume and fan-out to exercise locking and dispatch under concurrent writes to the same run directory.
-- Soak loops to flush out intermittent failures.
-- Order-insensitive checks (counts, uniqueness) when concurrent work makes ordering non-deterministic for the surface under test (for example async branch completion in the progress tree).
-
-See `e2e/tests/91_inbox_dispatch.sh`, `e2e/tests/93_inbox_stress.sh`, and `e2e/tests/94_parallel_shell_steps.sh` for examples.
-
-## PTY-based TTY tests
-
-Some CLI behavior only activates when stdout is a real TTY — the live progress tree with ANSI redraws, for example. These tests use Python's `pty.openpty()` to spawn `jaiph run` under a pseudo-terminal, capture the raw byte stream, and assert on the rendered output.
-
-Two PTY tests exist today:
-
-| Test file | What it covers |
-|-----------|----------------|
-| `e2e/tests/81_tty_progress_tree.sh` | Synchronous workflow progress rendering — verifies the tree structure, step timing, and PASS/FAIL markers under a real TTY. |
-| `e2e/tests/131_tty_async_progress.sh` | Async workflow progress rendering — verifies that `run async` branches (with `Handle<T>` deferred resolution) render per-branch progress events under subscript-numbered nodes (₁, ₂), that both branches show resolved return values in the final frame, and that no orphaned ANSI escape sequences appear. |
-
-Both tests require Python 3 and use only deterministic, non-LLM steps (sleep loops, `log`, scripts) so results are reproducible. Assertions use `assert_contains` with order-insensitive matching because async interleaving and PTY redraws make exact full-output comparison infeasible.
-
-## E2E testing
-
-Shell harnesses and CI expectations for the full repo are described in [Contributing — E2E testing](contributing.md#e2e-testing).
-
-E2E tests compare full CLI output and full artifact file contents by default. Use `e2e::expect_stdout`, `e2e::expect_out`, `e2e::expect_file`, `e2e::expect_run_file`, or `e2e::assert_equals`. Substring checks (`e2e::assert_contains`) require an inline comment justifying the exception. For the full policy (two surfaces, full equality, `assert_contains` exceptions, normalization), see [Contributing — E2E testing](contributing.md#e2e-testing). For the on-disk tree under `.jaiph/runs/`, see [Architecture — Durable artifact layout](architecture.md#durable-artifact-layout).
-
-Every `.jh` sample under `e2e/` must be wired into at least one test. Run `bash e2e/check_orphan_samples.sh` to detect unreferenced fixtures. See [Contributing — Orphan sample guard](contributing.md#orphan-sample-guard) for details.
-
-Similarly, every `.jh` and `.test.jh` file under `examples/` must be accounted for in `e2e/tests/110_examples.sh` — either exercised with strict assertions or explicitly excluded with a rationale. An orphan guard in that script enforces this. See [Contributing — Example matrix guard](contributing.md#example-matrix-guard) for details.
-
-## Landing-page sample verification
-
-The project includes a Playwright-based test (`e2e/playwright/landing-page.spec.ts`) that verifies landing-page code samples stay in sync with real CLI behavior. Run it with `npm run test:samples`. See [Contributing — Landing-page sample verification](contributing.md#landing-page-sample-verification-playwright) for details.
-
-## Limitations (v1)
+## Related
 
-- **Prompt mocks** must be written **inside the test file** (inline `mock prompt "…"`, `mock prompt <const>`, or `mock prompt { … }`) — there are no external mock-config file paths. Inline responses must use **double** quotes (not single quotes).
-- **Do not combine** `mock prompt { … }` with queue-style `mock prompt "…"` / `mock prompt <const>` in the same test block; when a block is present, queued entries are ignored.
-- **`mock workflow` / `mock rule` / `mock script`** require `ref()` with parentheses — empty `()` when there are no parameters.
-- **Capture**: only a **non-empty** return value on success bypasses concatenating `*.out` files; exit 0 with an empty return, failures without a runtime error string, and other edge cases use the `*.out` / aggregated-output path described above.
-- **`expect_*` right-hand side** is either a double-quoted literal or a test `const` name — not an arbitrary expression.
-- **`expectContain` / `expectEqual` / `expectNotContain` (camelCase)** are rejected; use `expect_contain`, `expect_equal`, `expect_not_contain`.
-- **Extra CLI arguments** after the path (`jaiph test <path> [extra...]`) are accepted but ignored (reserved for future use).
+- [Architecture — Test runner integration](architecture.md#test-runner-integration-testjh-in-the-kernel) — how `runTestFile` reuses the same module graph and runtime as `jaiph run`.
+- [Configure backend & model](/how-to/configure-backend) — workflows under test still read `config { … }`; pin agent settings in env when CI must be deterministic.
+- [Authenticate agent backends](/how-to/agent-auth) — only needed when a test reaches a live `prompt`; fully mocked suites skip agent credentials and the `jaiph run` pre-flight.
diff --git a/docs/why-jaiph.md b/docs/why-jaiph.md
new file mode 100644
index 00000000..37505124
--- /dev/null
+++ b/docs/why-jaiph.md
@@ -0,0 +1,60 @@
+---
+title: Why Jaiph
+permalink: /why-jaiph
+diataxis: explanation
+---
+
+# Why Jaiph
+
+Jaiph is a small language and runtime for AI-assisted automation. This page is the design context — what kind of problem it is meant for, what shape the solution takes, and which trade-offs it deliberately picks. For the implementation map see [Architecture](architecture.md); for syntax see [Language](language.md) and [Grammar](grammar.md).
+
+## The problem
+
+Modern automation pipelines have to do three different kinds of work in the same flow:
+
+- **Deterministic checks** — does this file exist, does the build pass, does the schema match.
+- **Real shell** — invoking a build tool, calling a CLI, manipulating files.
+- **Non-deterministic AI steps** — asking an agent to summarize a diff, write a fix, classify a finding.
+
+You can wire these together in any general-purpose language. The cost is glue: you write argument plumbing for each tool, hand-roll structured output handling for each agent call, and decide every time how to capture stdout, where to put logs, when to retry on failure, and how to fail loudly when something violates the structure you expected.
+
+Jaiph treats orchestration as the language. The structure that an ad-hoc bash script picks up over time — "every step gets captured, every prompt is logged, every failure has a footer with paths to the artifact files" — is the **built-in** behavior, not something the workflow author has to write.
+
+## The model
+
+A `.jh` file declares four primitives, and the orchestration is what they compose into:
+
+- **`rule`** — a non-mutating check. Calls other rules via `ensure`, calls scripts via `run`. The compiler rejects `send`, `prompt`, inline shell, and `run async` in rule bodies; rules are the place to put assumptions the rest of the workflow gets to rely on.
+- **`script`** — a named executable block (shell, Python, Node, anything with a shebang). Workflow bodies can also run inline shell or `` run `body`(args) `` steps, but reusable shell lives in `script` definitions. Scripts do not inherit module-scoped `const` bindings; pass values as positional arguments.
+- **`prompt`** — a task delegated to an AI agent. The body is interpolated, the agent's stdout is captured, and structured output (`returns "{ field: type }"`) is parsed and validated against a schema.
+- **`workflow`** — the orchestration unit. Composes the other three, plus `run async` for concurrency, channels for message passing, `if` / `match` / `for_lines` for flow control, and `recover` / `catch` for failure handling.
+
+Orchestration values are strings, every step is logged, and every run leaves durable artifacts under `.jaiph/runs/` (per-step `.out` and `.err` captures, plus an append-only `run_summary.jsonl`). That is the payoff over hand-rolled shell: repeatable, inspectable, testable automation.
+
+## Three commitments
+
+The design rests on three commitments that decide a lot of smaller questions:
+
+1. **Strict structure around AI steps.** Agent responses are non-deterministic, so the language gives you the surrounding pieces that *are* deterministic. `rule` and `ensure` let you assert preconditions and postconditions in the same pipeline as the prompt. `prompt … returns "{ … }"` constrains the agent's output to a JSON shape; if it fails, the step fails. `recover` retries a failed `run` after a repair body executes, up to `run.recover_limit` — a common pattern when an agent's output needs correction before the pipeline continues.
+
+2. **Sandbox by default.** `jaiph run` runs inside a Docker container with capabilities dropped, mounts allowlisted, and host environment variables stripped down to an explicit prefix list. The sandbox can be turned off (`JAIPH_UNSAFE=true` or `jaiph run --unsafe`), but only by the host — a workflow file cannot disable it from inside. The point is not to claim Docker is impenetrable; the [Sandboxing](sandboxing.md) page is explicit about what it does and does not protect, and about making the safe path the path of least resistance for workflows pulled from elsewhere.
+
+3. **No vendor lock-in.** Choose a backend with `agent.backend` (`cursor`, `claude`, or `codex`). Cursor and Claude invoke their respective CLIs; Codex uses an HTTP chat-completions path. On the **cursor** backend, `agent.command` can name any stdin→stdout executable — a wrapper around a local model or self-hosted endpoint works without implementing Jaiph's stream-json framing. Workflow authors do not need a proprietary agent protocol.
+
+## What Jaiph is not
+
+Naming the boundaries helps as much as naming the design:
+
+- **Not a general-purpose programming language.** Workflows are linear orchestration with the control flow they need (`if`, `match`, `for_lines`, `recover`, `catch`). Anything fancier belongs in a `script`.
+- **Not a distributed system.** Channels are an in-process, drain-driven handoff between workflows in the same run — see [Inbox & Dispatch](inbox.md). There is no broker, no cross-process routing, no retry queue.
+- **Not a CI replacement.** Jaiph runs the same way locally and inside CI containers; it does not provide the test-matrix, artifact-publishing, or environment-management work that CI platforms do.
+- **Not a prompt framework.** There is no chain abstraction, no agent class hierarchy, no built-in memory store. A `prompt` step calls a backend; if you want chaining, compose steps.
+
+The deliberate smallness is the point. The promise is that a `.jh` file behaves the way it reads, and the structure around it — sandboxing, logging, testing, formatting — is the runtime's job, not the workflow author's.
+
+## Where to go next
+
+- [Architecture](architecture.md) — the implementation map: parser, validator, runtime, CLI, contracts.
+- [Sandboxing](sandboxing.md) — the design of the Docker boundary and what it does and does not protect against.
+- [Inbox & Dispatch](inbox.md) — how `channel` and `send` compose workflows without a broker.
+- [Spec: Async Handles](spec-async-handles.md) — the value model behind `run async`.
diff --git a/e2e/lib/common.sh b/e2e/lib/common.sh
index 8b7dd080..c776d621 100644
--- a/e2e/lib/common.sh
+++ b/e2e/lib/common.sh
@@ -432,6 +432,13 @@ e2e::prepare_shared_context() {
   export JAIPH_BIN_DIR="${JAIPH_E2E_BIN_DIR}"
   # Docker sandbox is opt-in (beta); keep it disabled for e2e tests.
   export JAIPH_DOCKER_ENABLED="${JAIPH_DOCKER_ENABLED:-false}"
+  # The host pre-flight credential check (src/cli/run/preflight-credentials.ts)
+  # warns when an explicit `agent.backend` is declared but no credential env is
+  # set. E2E uses mock agent binaries that don't need real keys, so seed dummy
+  # values to keep the pre-flight silent. Tests that exercise the missing-key
+  # path explicitly unset them via `env -u`.
+  export CURSOR_API_KEY="${CURSOR_API_KEY:-e2e-dummy}"
+  export ANTHROPIC_API_KEY="${ANTHROPIC_API_KEY:-e2e-dummy}"
 
   if [[ -z "${JAIPH_REPO_URL:-}" ]]; then
     export JAIPH_REPO_URL="${E2E_REPO_ROOT}"
diff --git a/e2e/test_all.sh b/e2e/test_all.sh
index d99eb90e..739818ef 100755
--- a/e2e/test_all.sh
+++ b/e2e/test_all.sh
@@ -9,6 +9,7 @@ trap e2e::cleanup EXIT
 TEST_SCRIPTS=(
   "e2e/tests/00_install_and_init.sh"
   "e2e/tests/05_jaiph_use_pinned_version.sh"
+  "e2e/tests/07_installer_binary.sh"
   "e2e/tests/10_basic_workflows.sh"
   "e2e/tests/20_rule_and_prompt.sh"
   "e2e/tests/22_assign_capture.sh"
@@ -89,6 +90,10 @@ TEST_SCRIPTS=(
   "e2e/tests/133_return_bare_identifier.sh"
   "e2e/tests/134_script_imports.sh"
   "e2e/tests/135_for_string_lines.sh"
+  "e2e/tests/136_if_else_branch.sh"
+  "e2e/tests/137_inline_script_catch_recover.sh"
+  "e2e/tests/138_if_match_dot_subject.sh"
+  "e2e/tests/210_standalone_binary.sh"
 )
 
 PASS_COUNT=0
diff --git a/e2e/tests/05_jaiph_use_pinned_version.sh b/e2e/tests/05_jaiph_use_pinned_version.sh
index 4470683b..f17c0a5a 100644
--- a/e2e/tests/05_jaiph_use_pinned_version.sh
+++ b/e2e/tests/05_jaiph_use_pinned_version.sh
@@ -8,6 +8,14 @@ trap e2e::cleanup EXIT
 
 e2e::prepare_test_env "jaiph_use_pinned"
 
+# docs/install now builds the standalone binary from local sources via
+# `npm run build:standalone`, which requires bun. Match the precedent in
+# 210_standalone_binary.sh: skip rather than fail on CI hosts without bun.
+if ! command -v bun >/dev/null 2>&1; then
+  e2e::skip "bun not installed — skipping jaiph use local-source install check"
+  exit 0
+fi
+
 VERSION="$(node -p "require('${E2E_REPO_ROOT}/package.json').version")"
 USE_BIN="${JAIPH_E2E_TEST_DIR}/use_bin"
 mkdir -p "${USE_BIN}"
diff --git a/e2e/tests/07_installer_binary.sh b/e2e/tests/07_installer_binary.sh
new file mode 100755
index 00000000..6d9ca4ab
--- /dev/null
+++ b/e2e/tests/07_installer_binary.sh
@@ -0,0 +1,182 @@
+#!/usr/bin/env bash
+#
+# Acceptance for the binary installer rewrite (docs/install + docs/install-from-local.sh):
+#   - Checksum mismatch → non-zero exit, nothing installed.
+#   - Unsupported platform → non-zero exit with the documented message.
+#   - Parity check: local-build install dir contains a single executable `jaiph`
+#     (no shim script, no LIB_DIR/runtime tree) and works with node/npm/bun
+#     absent from PATH (same self-contained installation as the release path).
+#
+# The download checksum/platform paths are network-free: they point the installer
+# at a `file://` URL served from a local directory via JAIPH_RELEASE_BASE_URL
+# and shim `uname` on a temporary PATH prefix.
+#
+# The parity step requires bun (the build:standalone target) and is skipped on
+# CI hosts where bun is not available — same convention as 210_standalone_binary.sh.
+
+set -euo pipefail
+
+ROOT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/../.." && pwd)"
+source "${ROOT_DIR}/e2e/lib/common.sh"
+trap e2e::cleanup EXIT
+
+e2e::prepare_test_env "installer_binary"
+TEST_DIR="${JAIPH_E2E_TEST_DIR}"
+INSTALL_SCRIPT="${ROOT_DIR}/docs/install"
+
+# Pick a checksum tool that exists on the host (shasum on macOS; sha256sum on Linux).
+if command -v sha256sum >/dev/null 2>&1; then
+  host_sha256() { sha256sum "$1" | awk '{print $1}'; }
+elif command -v shasum >/dev/null 2>&1; then
+  host_sha256() { shasum -a 256 "$1" | awk '{print $1}'; }
+else
+  e2e::skip "no sha256sum/shasum on host — skipping installer acceptance"
+  exit 0
+fi
+
+# Resolve the target asset name from the host (matches the installer's mapping).
+host_uname_s="$(uname -s)"
+host_uname_m="$(uname -m)"
+case "${host_uname_s}" in
+  Darwin) HOST_OS="darwin" ;;
+  Linux)  HOST_OS="linux" ;;
+  *) e2e::skip "host platform ${host_uname_s} not supported by installer — skipping"; exit 0 ;;
+esac
+case "${host_uname_m}" in
+  arm64|aarch64) HOST_ARCH="arm64" ;;
+  x86_64|x64)    HOST_ARCH="x64" ;;
+  *) e2e::skip "host arch ${host_uname_m} not supported by installer — skipping"; exit 0 ;;
+esac
+HOST_BIN_NAME="jaiph-${HOST_OS}-${HOST_ARCH}"
+
+# ── Checksum mismatch ────────────────────────────────────────────────────────
+
+e2e::section "Checksum mismatch fails and installs nothing"
+
+RELEASE_DIR="${TEST_DIR}/release-mismatch"
+BIN_DIR_BAD="${TEST_DIR}/bin-mismatch"
+mkdir -p "${RELEASE_DIR}" "${BIN_DIR_BAD}"
+
+printf 'real-binary-bytes' > "${RELEASE_DIR}/${HOST_BIN_NAME}"
+# Hand-craft SHA256SUMS with the wrong hash for HOST_BIN_NAME so the installer
+# reaches the verify step and fails with a checksum mismatch (not an http 404).
+printf '%s  %s\n' "0000000000000000000000000000000000000000000000000000000000000000" "${HOST_BIN_NAME}" \
+  > "${RELEASE_DIR}/SHA256SUMS"
+
+bad_status=0
+# Unset JAIPH_REPO_URL: the shared e2e context points it at this repo root,
+# which would otherwise trigger the local-source branch instead of download.
+bad_output="$(
+  unset JAIPH_REPO_URL
+  JAIPH_RELEASE_BASE_URL="file://${RELEASE_DIR}" \
+  JAIPH_BIN_DIR="${BIN_DIR_BAD}" \
+  bash "${INSTALL_SCRIPT}" 2>&1
+)" || bad_status=$?
+e2e::assert_equals "${bad_status}" "1" "checksum mismatch exits non-zero"
+# assert_contains: full message text includes ANSI colors and per-host hashes
+e2e::assert_contains "${bad_output}" "Checksum mismatch" "checksum mismatch is reported"
+if [ -e "${BIN_DIR_BAD}/jaiph" ]; then
+  e2e::fail "installer left ${BIN_DIR_BAD}/jaiph on checksum failure"
+fi
+e2e::pass "checksum mismatch is non-recoverable and leaves no binary"
+
+# ── Unsupported platform ──────────────────────────────────────────────────────
+
+e2e::section "Unsupported platform exits with documented message"
+
+FAKE_PATH_DIR="${TEST_DIR}/fake-uname"
+BIN_DIR_UNSUPPORTED="${TEST_DIR}/bin-unsupported"
+mkdir -p "${FAKE_PATH_DIR}" "${BIN_DIR_UNSUPPORTED}"
+
+cat > "${FAKE_PATH_DIR}/uname" <<'FAKE_UNAME'
+#!/usr/bin/env bash
+case "${1:-}" in
+  -s) echo "AIX" ;;
+  -m) echo "powerpc" ;;
+  *)  echo "AIX powerpc" ;;
+esac
+FAKE_UNAME
+chmod +x "${FAKE_PATH_DIR}/uname"
+
+unsupported_status=0
+unsupported_output="$(
+  unset JAIPH_REPO_URL
+  PATH="${FAKE_PATH_DIR}:${PATH}" \
+  JAIPH_BIN_DIR="${BIN_DIR_UNSUPPORTED}" \
+  bash "${INSTALL_SCRIPT}" 2>&1
+)" || unsupported_status=$?
+e2e::assert_equals "${unsupported_status}" "1" "unsupported platform exits non-zero"
+# assert_contains: ANSI codes and uname strings vary between OSes
+e2e::assert_contains "${unsupported_output}" "Unsupported platform: AIX powerpc" \
+  "error names the detected platform"
+e2e::assert_contains "${unsupported_output}" "contributing" \
+  "error points at the from-source instructions"
+if [ -e "${BIN_DIR_UNSUPPORTED}/jaiph" ]; then
+  e2e::fail "installer left a binary in ${BIN_DIR_UNSUPPORTED} on unsupported platform"
+fi
+e2e::pass "unsupported platform is non-recoverable and leaves no binary"
+
+# ── Parity check (local install) ──────────────────────────────────────────────
+
+if ! command -v bun >/dev/null 2>&1; then
+  e2e::skip "bun not installed — skipping local install parity check"
+  exit 0
+fi
+
+e2e::section "install-from-local.sh produces a single self-contained binary"
+
+PARITY_BIN_DIR="${TEST_DIR}/bin-parity"
+mkdir -p "${PARITY_BIN_DIR}"
+
+# install-from-local.sh execs docs/install with the repo path. Cap the bin dir
+# to a test-owned directory so we never touch ~/.local/bin.
+JAIPH_BIN_DIR="${PARITY_BIN_DIR}" \
+  bash "${ROOT_DIR}/docs/install-from-local.sh" "${ROOT_DIR}" >/dev/null
+
+[ -x "${PARITY_BIN_DIR}/jaiph" ] || e2e::fail "install-from-local.sh did not produce ${PARITY_BIN_DIR}/jaiph"
+
+# Single executable, no shim, no LIB_DIR/runtime tree.
+entries="$(find "${PARITY_BIN_DIR}" -mindepth 1 -maxdepth 1 -printf '%f\n' 2>/dev/null \
+  || find "${PARITY_BIN_DIR}" -mindepth 1 -maxdepth 1 -exec basename {} \;)"
+if [ "$(printf '%s\n' "${entries}" | sort)" != "jaiph" ]; then
+  printf 'Unexpected entries in %s:\n%s\n' "${PARITY_BIN_DIR}" "${entries}" >&2
+  e2e::fail "install dir should contain only the jaiph executable"
+fi
+# The installed jaiph must be a real binary, not a `node …` shim script.
+if head -c 2 "${PARITY_BIN_DIR}/jaiph" | grep -q '^#!'; then
+  e2e::fail "installed jaiph is a shebang shim, not a self-contained binary"
+fi
+e2e::pass "install dir contains only the self-contained jaiph binary"
+
+# Strip node/npm/bun from PATH and confirm --version and run still work.
+CLEAN_PATH="/usr/bin:/bin"
+for tool in node npm bun; do
+  if PATH="${CLEAN_PATH}" command -v "${tool}" >/dev/null 2>&1; then
+    e2e::fail "${tool} unexpectedly visible on stripped PATH (${CLEAN_PATH})"
+  fi
+done
+
+WORK_DIR="${TEST_DIR}/parity-work"
+mkdir -p "${WORK_DIR}"
+cat > "${WORK_DIR}/sample.jh" <<'EOF'
+script say_hello = `echo hello-from-local`
+workflow default() {
+  const msg = run say_hello()
+  return "${msg}"
+}
+EOF
+
+version_out="$(env -i PATH="${CLEAN_PATH}" HOME="${WORK_DIR}" "${PARITY_BIN_DIR}/jaiph" --version)"
+expected_version="$(node -p "require('${ROOT_DIR}/package.json').version" 2>/dev/null || echo "")"
+if [ -n "${expected_version}" ]; then
+  e2e::assert_equals "${version_out}" "jaiph ${expected_version}" "jaiph --version without node/npm/bun"
+else
+  # assert_contains: package.json version not readable in this env
+  e2e::assert_contains "${version_out}" "jaiph " "jaiph --version prints a version banner"
+fi
+
+run_out="$(cd "${WORK_DIR}" && env -i PATH="${CLEAN_PATH}" HOME="${WORK_DIR}" JAIPH_UNSAFE=true "${PARITY_BIN_DIR}/jaiph" run sample.jh)"
+case "${run_out}" in
+  *"hello-from-local"*) e2e::pass "locally-built binary runs a workflow without node/npm/bun" ;;
+  *) printf "%s\n" "${run_out}" >&2; e2e::fail "locally-built jaiph did not run sample.jh as expected" ;;
+esac
diff --git a/e2e/tests/125_test_discovery_errors.sh b/e2e/tests/125_test_discovery_errors.sh
index 12fbb967..9a09a2dc 100755
--- a/e2e/tests/125_test_discovery_errors.sh
+++ b/e2e/tests/125_test_discovery_errors.sh
@@ -10,25 +10,65 @@ e2e::prepare_test_env "test_discovery_errors"
 TEST_DIR="${JAIPH_E2E_TEST_DIR}"
 
 # ==========================================================================
-# Section 1: jaiph test on empty directory — no .test.jh files found
+# Section 1: jaiph test on empty directory — exits 0 with notice (discovery)
 # ==========================================================================
 
 e2e::section "jaiph test: empty directory"
 
 mkdir -p "${TEST_DIR}/empty_dir"
 
+empty_err="$(mktemp)"
+if ! jaiph test "${TEST_DIR}/empty_dir" >/dev/null 2>"${empty_err}"; then
+  cat "${empty_err}" >&2
+  rm -f "${empty_err}"
+  e2e::fail "jaiph test on empty directory should exit 0 in discovery mode"
+fi
+empty_out="$(cat "${empty_err}")"
+rm -f "${empty_err}"
+
+e2e::assert_equals "${empty_out}" \
+  "jaiph test: no *.test.jh files found (nothing to do)" \
+  "empty directory prints discovery notice on stderr"
+
+# ==========================================================================
+# Section 1a: jaiph test (no args) in a workspace without test files
+# ==========================================================================
+
+e2e::section "jaiph test: no args in empty workspace"
+
+mkdir -p "${TEST_DIR}/empty_workspace"
+
+noargs_err="$(mktemp)"
+if ! (cd "${TEST_DIR}/empty_workspace" && jaiph test >/dev/null 2>"${noargs_err}"); then
+  cat "${noargs_err}" >&2
+  rm -f "${noargs_err}"
+  e2e::fail "jaiph test with no args in empty workspace should exit 0"
+fi
+noargs_out="$(cat "${noargs_err}")"
+rm -f "${noargs_err}"
+
+e2e::assert_equals "${noargs_out}" \
+  "jaiph test: no *.test.jh files found (nothing to do)" \
+  "no args in empty workspace prints discovery notice"
+
+# ==========================================================================
+# Section 1b: jaiph test on nonexistent file — exits non-zero
+# ==========================================================================
+
+e2e::section "jaiph test: nonexistent file rejected"
+
 set +e
-empty_out="$(jaiph test "${TEST_DIR}/empty_dir" 2>&1)"
-empty_exit=$?
+missing_out="$(jaiph test "${TEST_DIR}/does_not_exist.test.jh" 2>&1)"
+missing_exit=$?
 set -e
 
-if [[ ${empty_exit} -eq 0 ]]; then
-  printf "%s\n" "${empty_out}" >&2
-  e2e::fail "jaiph test on empty directory should exit non-zero"
+if [[ ${missing_exit} -eq 0 ]]; then
+  printf "%s\n" "${missing_out}" >&2
+  e2e::fail "jaiph test on nonexistent file should exit non-zero"
 fi
-# assert_contains: error message includes varying directory path
-e2e::assert_contains "${empty_out}" "no *.test.jh files" \
-  "empty directory produces discovery error"
+# assert_contains: ENOENT message includes absolute path which varies per machine
+e2e::assert_contains "${missing_out}" "does_not_exist.test.jh" \
+  "nonexistent file is reported as error"
 
 # ==========================================================================
 # Section 2: jaiph test on a plain .jh file (not .test.jh)
diff --git a/e2e/tests/136_if_else_branch.sh b/e2e/tests/136_if_else_branch.sh
new file mode 100755
index 00000000..ff702974
--- /dev/null
+++ b/e2e/tests/136_if_else_branch.sh
@@ -0,0 +1,96 @@
+#!/usr/bin/env bash
+
+set -euo pipefail
+
+ROOT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/../.." && pwd)"
+source "${ROOT_DIR}/e2e/lib/common.sh"
+trap e2e::cleanup EXIT
+
+e2e::prepare_test_env "if_else_branch"
+TEST_DIR="${JAIPH_E2E_TEST_DIR}"
+
+# ── 1. if/else in workflow: then branch runs, else skipped ──────────────────
+
+e2e::section "if/else workflow: then branch runs when condition true"
+
+e2e::file "if_else_wf.jh" <<'EOF'
+workflow default(status) {
+  if status == "ok" {
+    log "healthy"
+  } else {
+    log "unhealthy: ${status}"
+  }
+  log "done"
+}
+EOF
+
+then_out="$(e2e::run "if_else_wf.jh" "ok")"
+e2e::expect_stdout "${then_out}" <<'EOF'
+
+Jaiph: Running if_else_wf.jh
+
+workflow default (status="ok")
+  ℹ healthy
+  ℹ done
+
+✓ PASS workflow default (<time>)
+EOF
+e2e::pass "if/else workflow: only then-branch runs when condition is true"
+
+# ── 2. if/else in workflow: else branch runs ────────────────────────────────
+
+e2e::section "if/else workflow: else branch runs when condition false"
+
+else_out="$(e2e::run "if_else_wf.jh" "bad")"
+e2e::expect_stdout "${else_out}" <<'EOF'
+
+Jaiph: Running if_else_wf.jh
+
+workflow default (status="bad")
+  ℹ unhealthy: bad
+  ℹ done
+
+✓ PASS workflow default (<time>)
+EOF
+e2e::pass "if/else workflow: only else-branch runs when condition is false"
+
+# ── 3. if/else in rule: both branches reachable ─────────────────────────────
+
+e2e::section "if/else rule: then branch runs when condition true"
+
+e2e::file "if_else_rule.jh" <<'EOF'
+rule check(value) {
+  if value == "" {
+    fail "value was empty"
+  } else {
+    log "value: ${value}"
+  }
+}
+
+workflow default(value) {
+  ensure check(value)
+  log "validated"
+}
+EOF
+
+rule_ok_out="$(e2e::run "if_else_rule.jh" "hello")"
+e2e::expect_stdout "${rule_ok_out}" <<'EOF'
+
+Jaiph: Running if_else_rule.jh
+
+workflow default (value="hello")
+  ▸ rule check (value="hello")
+  ·   ℹ value: hello
+  ✓ rule check (<time>)
+  ℹ validated
+
+✓ PASS workflow default (<time>)
+EOF
+e2e::pass "if/else rule: else branch runs and rule passes when value non-empty"
+
+# ── 4. if/else in rule: then branch fails ───────────────────────────────────
+
+e2e::section "if/else rule: then branch fails workflow when condition true"
+
+e2e::expect_fail "if_else_rule.jh"
+e2e::pass "if/else rule: then branch fails when value empty"
diff --git a/e2e/tests/137_inline_script_catch_recover.sh b/e2e/tests/137_inline_script_catch_recover.sh
new file mode 100755
index 00000000..69c85047
--- /dev/null
+++ b/e2e/tests/137_inline_script_catch_recover.sh
@@ -0,0 +1,81 @@
+#!/usr/bin/env bash
+
+set -euo pipefail
+
+ROOT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/../.." && pwd)"
+source "${ROOT_DIR}/e2e/lib/common.sh"
+trap e2e::cleanup EXIT
+
+e2e::prepare_test_env "inline_script_catch_recover"
+TEST_DIR="${JAIPH_E2E_TEST_DIR}"
+
+# ---------------------------------------------------------------------------
+e2e::section "inline script catch: failing body, catch body runs once with merged output"
+# ---------------------------------------------------------------------------
+
+e2e::file "inline_catch.jh" <<'EOF'
+workflow default() {
+  run `echo "bad" 1>&2; exit 3`() catch (err) {
+    log "caught: ${err}"
+  }
+}
+EOF
+
+catch_out="$(e2e::run "inline_catch.jh")"
+
+# assert_contains: inline script hash name is content-dependent and not predictable in heredoc
+e2e::assert_contains "${catch_out}" "script __inline_" "tree shows inline script step"
+e2e::assert_contains "${catch_out}" "caught: bad" "catch body ran once with merged stdout+stderr bound"
+e2e::assert_contains "${catch_out}" "PASS workflow default" "catch absorbed the failure"
+
+e2e::pass "inline script catch: single-shot recovery"
+
+# ---------------------------------------------------------------------------
+e2e::section "inline script recover: retries until counter-file repair makes it pass"
+# ---------------------------------------------------------------------------
+
+COUNTER="${TEST_DIR}/inline_recover_counter"
+rm -f "${COUNTER}" "${COUNTER}.done"
+
+e2e::file "inline_recover.jh" <<EOF
+workflow default() {
+  run \`test -f "${COUNTER}.done"\`() recover(err) {
+    run \`\`\`
+count=\$(cat "${COUNTER}" 2>/dev/null || echo 0)
+count=\$((count+1))
+echo "\${count}" > "${COUNTER}"
+if [ "\${count}" -ge 2 ]; then touch "${COUNTER}.done"; fi
+\`\`\`()
+  }
+}
+EOF
+
+recover_out="$(e2e::run "inline_recover.jh")"
+
+e2e::assert_file_exists "${COUNTER}.done" "recover body created the repair marker"
+counter_value="$(cat "${COUNTER}")"
+e2e::assert_equals "${counter_value}" "2" "recover ran exactly twice before the inline check passed"
+e2e::assert_contains "${recover_out}" "PASS workflow default" "workflow passes after recover retries"
+
+e2e::pass "inline script recover: retry loop with counter-file repair"
+
+# ---------------------------------------------------------------------------
+e2e::section "inline script catch in rule body"
+# ---------------------------------------------------------------------------
+
+e2e::file "inline_catch_rule.jh" <<'EOF'
+script noop = `true`
+rule gate() {
+  run `exit 5`() catch (err) {
+    run noop()
+  }
+}
+workflow default() {
+  ensure gate()
+}
+EOF
+
+rule_out="$(e2e::run "inline_catch_rule.jh")"
+e2e::assert_contains "${rule_out}" "PASS workflow default" "rule with inline-script catch passes"
+
+e2e::pass "inline script catch in rule body"
diff --git a/e2e/tests/138_if_match_dot_subject.sh b/e2e/tests/138_if_match_dot_subject.sh
new file mode 100755
index 00000000..d6b48154
--- /dev/null
+++ b/e2e/tests/138_if_match_dot_subject.sh
@@ -0,0 +1,69 @@
+#!/usr/bin/env bash
+
+set -euo pipefail
+
+ROOT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/../.." && pwd)"
+source "${ROOT_DIR}/e2e/lib/common.sh"
+trap e2e::cleanup EXIT
+
+e2e::prepare_test_env "if_match_dot_subject"
+TEST_DIR="${JAIPH_E2E_TEST_DIR}"
+
+# ── 1. if + match with dot-notation subject select branches by field value ──
+
+e2e::section "if/match dot-notation subject on typed prompt capture"
+
+e2e::file "verdict.jh" <<'EOF'
+#!/usr/bin/env jaiph
+workflow classify() {
+  const r = prompt "Verdict?" returns "{ verdict: string }"
+  if r.verdict == "ok" {
+    log "approved"
+  } else {
+    log "rejected"
+  }
+  const label = match r.verdict {
+    "ok" => "approved-arm"
+    "reject" => "rejected-arm"
+    _ => "unknown-arm"
+  }
+  return "${label}"
+}
+EOF
+
+e2e::file "verdict.test.jh" <<'EOF'
+import "verdict.jh" as v
+
+test "ok verdict selects then-branch and ok arm" {
+  mock prompt "{\"verdict\":\"ok\"}"
+  const out = run v.classify()
+  expect_equal out "approved-arm"
+}
+
+test "reject verdict selects else-branch and reject arm" {
+  mock prompt "{\"verdict\":\"reject\"}"
+  const out = run v.classify()
+  expect_equal out "rejected-arm"
+}
+
+test "unknown verdict selects else-branch and wildcard arm" {
+  mock prompt "{\"verdict\":\"maybe\"}"
+  const out = run v.classify()
+  expect_equal out "unknown-arm"
+}
+EOF
+
+pass_out="$(jaiph test "${TEST_DIR}/verdict.test.jh" 2>&1)"
+
+e2e::expect_stdout "${pass_out}" <<'EOF'
+testing verdict.test.jh
+  ▸ ok verdict selects then-branch and ok arm
+  ✓ <time>
+  ▸ reject verdict selects else-branch and reject arm
+  ✓ <time>
+  ▸ unknown verdict selects else-branch and wildcard arm
+  ✓ <time>
+✓ 3 test(s) passed
+EOF
+
+e2e::pass "dot-notation subjects route both if and match branches"
diff --git a/e2e/tests/139_agent_credentials_preflight.sh b/e2e/tests/139_agent_credentials_preflight.sh
new file mode 100755
index 00000000..ac442878
--- /dev/null
+++ b/e2e/tests/139_agent_credentials_preflight.sh
@@ -0,0 +1,130 @@
+#!/usr/bin/env bash
+#
+# Pre-flight agent-credential check: fails fast on Docker, warns on host.
+#
+# Runs without needing a real Docker daemon: setting JAIPH_DOCKER_ENABLED=true
+# causes runWorkflow to consult the pre-flight before `checkDockerAvailable`,
+# so the credential check fires and exits before any container can spawn.
+#
+
+set -euo pipefail
+
+ROOT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/../.." && pwd)"
+source "${ROOT_DIR}/e2e/lib/common.sh"
+trap e2e::cleanup EXIT
+
+e2e::prepare_test_env "agent_credentials_preflight"
+TEST_DIR="${JAIPH_E2E_TEST_DIR}"
+
+# ── 1. Docker on + claude + no creds → hard fail with E_AGENT_CREDENTIALS ────
+
+e2e::section "claude under Docker without credentials fails before launch"
+
+e2e::file "claude_docker.jh" <<'EOF'
+config {
+  agent.backend = "claude"
+  agent.default_model = "sonnet-test"
+}
+
+workflow default() {
+  log "should not run"
+}
+EOF
+
+err_file="$(mktemp)"
+exit_code=0
+env -u ANTHROPIC_API_KEY -u CLAUDE_CODE_OAUTH_TOKEN \
+  JAIPH_DOCKER_ENABLED=true \
+  jaiph run "${TEST_DIR}/claude_docker.jh" 2>"${err_file}" >/dev/null \
+  || exit_code=$?
+err_msg="$(cat "${err_file}")"
+rm -f "${err_file}"
+
+if [[ "${exit_code}" == "0" ]]; then
+  printf "stderr was:\n%s\n" "${err_msg}" >&2
+  e2e::fail "expected non-zero exit when claude credentials are missing under Docker"
+fi
+e2e::pass "non-zero exit when claude credentials missing under Docker"
+
+# Message contract: backend + model + entry path + scope.
+# assert_contains: each substring is part of a single composed line whose
+# format is exercised by exhaustive unit tests; here we just confirm wiring.
+e2e::assert_contains "${err_msg}" "E_AGENT_CREDENTIALS" "stderr names error code"
+e2e::assert_contains "${err_msg}" "claude" "stderr names the backend"
+e2e::assert_contains "${err_msg}" "sonnet-test" "stderr names the configured model"
+e2e::assert_contains "${err_msg}" "claude_docker.jh" "stderr names the entry .jh file"
+e2e::assert_contains "${err_msg}" "module config" "stderr names the config scope"
+
+# The run dir must NOT exist — pre-flight aborts before any runner/container starts.
+if [[ -d "${TEST_DIR}/.jaiph/runs" ]]; then
+  shopt -s nullglob
+  matches=( "${TEST_DIR}/.jaiph/runs/"*/*"claude_docker.jh"/ )
+  shopt -u nullglob
+  if [[ ${#matches[@]} -gt 0 ]]; then
+    e2e::fail "expected no run dir to be created (pre-flight should abort before launch)"
+  fi
+fi
+e2e::pass "no run directory created — runner/container never launched"
+
+# ── 2. Host (Docker off) + claude + no creds → warn, but proceed ────────────
+
+e2e::section "claude on host without credentials warns but proceeds"
+
+# Use --unsafe to force Docker off without needing a Docker daemon.
+err_file="$(mktemp)"
+stdout_file="$(mktemp)"
+exit_code=0
+env -u ANTHROPIC_API_KEY -u CLAUDE_CODE_OAUTH_TOKEN \
+  jaiph run --unsafe "${TEST_DIR}/claude_docker.jh" >"${stdout_file}" 2>"${err_file}" \
+  || exit_code=$?
+err_msg="$(cat "${err_file}")"
+out_msg="$(cat "${stdout_file}")"
+rm -f "${err_file}" "${stdout_file}"
+
+if [[ "${exit_code}" != "0" ]]; then
+  printf "stdout was:\n%s\nstderr was:\n%s\n" "${out_msg}" "${err_msg}" >&2
+  e2e::fail "host run with missing claude creds should not hard-fail (warn only)"
+fi
+e2e::pass "zero exit on host run with missing claude credentials"
+
+# assert_contains: stderr also carries unrelated lines (banner, hooks etc.)
+e2e::assert_contains "${err_msg}" "warning" "stderr contains a warning"
+e2e::assert_contains "${err_msg}" "claude" "warning names the backend"
+e2e::assert_contains "${err_msg}" "module config" "warning names the config scope"
+
+# Hard-error code must NOT appear on the host warn-only path.
+if [[ "${err_msg}" == *"E_AGENT_CREDENTIALS"* ]]; then
+  printf "%s\n" "${err_msg}" >&2
+  e2e::fail "host run must not emit E_AGENT_CREDENTIALS — that is the Docker contract"
+fi
+e2e::pass "no E_AGENT_CREDENTIALS on host warn-only path"
+
+# ── 3. codex + no OPENAI_API_KEY → hard fail on host (no login path) ────────
+
+e2e::section "codex on host without OPENAI_API_KEY fails fast"
+
+e2e::file "codex_host.jh" <<'EOF'
+config {
+  agent.backend = "codex"
+}
+
+workflow default() {
+  log "should not run"
+}
+EOF
+
+err_file="$(mktemp)"
+exit_code=0
+env -u OPENAI_API_KEY \
+  jaiph run --unsafe "${TEST_DIR}/codex_host.jh" 2>"${err_file}" >/dev/null \
+  || exit_code=$?
+err_msg="$(cat "${err_file}")"
+rm -f "${err_file}"
+
+if [[ "${exit_code}" == "0" ]]; then
+  printf "stderr was:\n%s\n" "${err_msg}" >&2
+  e2e::fail "expected non-zero exit when OPENAI_API_KEY missing for codex (host)"
+fi
+e2e::assert_contains "${err_msg}" "E_AGENT_CREDENTIALS" "codex host: stderr names error code"
+e2e::assert_contains "${err_msg}" "OPENAI_API_KEY" "codex host: stderr names the env var"
+e2e::pass "codex hard-fails on both host and Docker"
diff --git a/e2e/tests/210_standalone_binary.sh b/e2e/tests/210_standalone_binary.sh
new file mode 100755
index 00000000..b01c6704
--- /dev/null
+++ b/e2e/tests/210_standalone_binary.sh
@@ -0,0 +1,87 @@
+#!/usr/bin/env bash
+#
+# Verifies the bun --compile standalone binary is fully self-contained:
+#   - works from any directory with no repo checkout,
+#   - has no node/npm/bun on PATH,
+#   - successfully runs `--version`, `init`, `compile`, and `run` against a
+#     deterministic sample workflow.
+#
+# Skipped (not failed) when `bun` is unavailable on the host so the rest of
+# the e2e suite still runs on CI images that ship only node.
+
+set -euo pipefail
+
+ROOT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/../.." && pwd)"
+source "${ROOT_DIR}/e2e/lib/common.sh"
+trap e2e::cleanup EXIT
+
+e2e::prepare_test_env "standalone_binary"
+TEST_DIR="${JAIPH_E2E_TEST_DIR}"
+
+if ! command -v bun >/dev/null 2>&1; then
+  e2e::skip "bun not installed — skipping standalone binary self-contained check"
+  exit 0
+fi
+
+e2e::section "Build standalone binary"
+(cd "${ROOT_DIR}" && npm run build:standalone >/dev/null)
+[[ -x "${ROOT_DIR}/dist/jaiph" ]] || e2e::fail "dist/jaiph missing after build:standalone"
+e2e::pass "dist/jaiph built"
+
+# Stage the binary in an isolated dir; deliberately copy only `jaiph` —
+# no sibling `runtime/` or `docs/` so we prove the assets are embedded.
+STAGE_DIR="${TEST_DIR}/stage"
+mkdir -p "${STAGE_DIR}"
+cp "${ROOT_DIR}/dist/jaiph" "${STAGE_DIR}/jaiph"
+chmod +x "${STAGE_DIR}/jaiph"
+
+# Strip node/npm/bun from PATH. /usr/bin:/bin is enough for the shell builtins
+# the test relies on (bash, mkdir, cat, etc.).
+CLEAN_PATH="/usr/bin:/bin"
+for tool in node npm bun; do
+  if PATH="${CLEAN_PATH}" command -v "${tool}" >/dev/null 2>&1; then
+    e2e::fail "${tool} unexpectedly visible on stripped PATH (${CLEAN_PATH})"
+  fi
+done
+e2e::pass "stripped PATH has no node/npm/bun"
+
+WORK_DIR="${TEST_DIR}/work"
+mkdir -p "${WORK_DIR}"
+JAIPH_BIN="${STAGE_DIR}/jaiph"
+
+# Deterministic sample workflow: no prompts, no network — runs to completion.
+cat > "${WORK_DIR}/sample.jh" <<'EOF'
+script say_hello = `echo hello-standalone`
+workflow default() {
+  const msg = run say_hello()
+  return "${msg}"
+}
+EOF
+
+e2e::section "jaiph --version"
+version_out="$(cd "${WORK_DIR}" && env -i PATH="${CLEAN_PATH}" HOME="${WORK_DIR}" "${JAIPH_BIN}" --version)"
+# Read from package.json so the test does not need an update on every version bump
+# (single source of truth — see .jaiph/prepare_release.jh).
+pkg_version="$(node -p "require('${ROOT_DIR}/package.json').version")"
+e2e::assert_equals "${version_out}" "jaiph ${pkg_version}" "version output"
+
+e2e::section "jaiph init writes SKILL.md from embedded asset"
+(cd "${WORK_DIR}" && env -i PATH="${CLEAN_PATH}" HOME="${WORK_DIR}" "${JAIPH_BIN}" init >/dev/null)
+SKILL_PATH="${WORK_DIR}/.jaiph/SKILL.md"
+[[ -s "${SKILL_PATH}" ]] || e2e::fail "SKILL.md missing or empty after init"
+# Embedded copy must match docs/jaiph-skill.md byte-for-byte.
+e2e::assert_equals \
+  "$(cat "${SKILL_PATH}")" \
+  "$(cat "${ROOT_DIR}/docs/jaiph-skill.md")" \
+  "SKILL.md matches docs/jaiph-skill.md"
+
+e2e::section "jaiph compile sample.jh"
+(cd "${WORK_DIR}" && env -i PATH="${CLEAN_PATH}" HOME="${WORK_DIR}" "${JAIPH_BIN}" compile sample.jh)
+e2e::pass "compile sample.jh exits 0"
+
+e2e::section "jaiph run sample.jh"
+run_out="$(cd "${WORK_DIR}" && env -i PATH="${CLEAN_PATH}" HOME="${WORK_DIR}" JAIPH_UNSAFE=true "${JAIPH_BIN}" run sample.jh)"
+case "${run_out}" in
+  *"hello-standalone"*) e2e::pass "run sample.jh prints captured echo" ;;
+  *) printf "%s\n" "${run_out}" >&2; e2e::fail "run sample.jh did not produce expected output" ;;
+esac
diff --git a/e2e/tests/50_cli_and_parse_guards.sh b/e2e/tests/50_cli_and_parse_guards.sh
index c57d98d9..5e672e48 100644
--- a/e2e/tests/50_cli_and_parse_guards.sh
+++ b/e2e/tests/50_cli_and_parse_guards.sh
@@ -66,17 +66,18 @@ EOF
 
 # When
 empty_err="$(mktemp)"
-if jaiph test "${TEST_DIR}/empty_tests" 2>"${empty_err}"; then
+if ! jaiph test "${TEST_DIR}/empty_tests" >/dev/null 2>"${empty_err}"; then
   cat "${empty_err}" >&2
   rm -f "${empty_err}"
-  e2e::fail "jaiph test should fail when directory has no test files"
+  e2e::fail "jaiph test on empty directory should exit 0 in discovery mode"
 fi
 empty_out="$(cat "${empty_err}")"
 rm -f "${empty_err}"
 
 # Then
-# assert_contains: error message includes absolute directory path which varies per machine
-e2e::assert_contains "${empty_out}" "no *.test.jh files" "jaiph test reports no tests in directory"
+e2e::assert_equals "${empty_out}" \
+  "jaiph test: no *.test.jh files found (nothing to do)" \
+  "jaiph test reports discovery notice for empty directory"
 
 e2e::section "jaiph run requires workflow default"
 
diff --git a/e2e/tests/61_ensure_recover.sh b/e2e/tests/61_ensure_recover.sh
index 0cd5e260..05e241ed 100644
--- a/e2e/tests/61_ensure_recover.sh
+++ b/e2e/tests/61_ensure_recover.sh
@@ -130,7 +130,8 @@ set -e
 
 # Then
 e2e::assert_equals "${exit_fail}" "1" "jaiph run exits 1 when ensure fails without recover"
-e2e::assert_contains "${out_fail}" "Workflow execution failed." "stderr reports workflow failure"
+e2e::assert_contains "${out_fail}" "Workflow execution failed (exit 1) with no error output" "stderr reports workflow failure with exit code"
+e2e::assert_contains "${out_fail}" "inspect run_summary.jsonl and step artifacts under" "stderr points at run artifacts"
 e2e::pass "ensure without recover: exit 1 on failure"
 
 e2e::section "ensure ... catch { multiline prompt with param } parses and runs"
diff --git a/e2e/tests/86_metadata_scope_nested.sh b/e2e/tests/86_metadata_scope_nested.sh
index 753ad32d..da81002c 100644
--- a/e2e/tests/86_metadata_scope_nested.sh
+++ b/e2e/tests/86_metadata_scope_nested.sh
@@ -43,11 +43,14 @@ unset JAIPH_AGENT_BACKEND 2>/dev/null || true
 jaiph run "${TEST_DIR}/parent.jh" >/dev/null
 
 # Then
+# Cross-module `run` applies the callee module's config on top of the caller's
+# effective env (respecting `_LOCKED` env flags) and restores the caller's
+# scope when the call returns.
 actual="$(cat "${META_FILE}")"
 expected="$(printf '%s\n' \
   'parent_before:cursor' \
-  'child:cursor' \
+  'child:claude' \
   'parent_after:cursor')"
 
-e2e::assert_equals "${actual}" "${expected}" "nested workflow inherits caller config and preserves parent state"
+e2e::assert_equals "${actual}" "${expected}" "cross-module run sees callee module config; caller scope restored"
 e2e::expect_out_files "parent.jh" 5
diff --git a/e2e/tests/87_workflow_config.sh b/e2e/tests/87_workflow_config.sh
index de8db725..5154073c 100755
--- a/e2e/tests/87_workflow_config.sh
+++ b/e2e/tests/87_workflow_config.sh
@@ -103,9 +103,10 @@ e2e::assert_equals "${actual}" "${expected}" \
   "rule inside overriding workflow sees workflow model; rule in non-overriding sees module model"
 
 # ---------------------------------------------------------------------------
-# Section 3: Interaction — nested run with workflow config precedence
+# Section 3: Interaction — nested cross-module run applies callee module
+# config and restores caller scope after
 # ---------------------------------------------------------------------------
-e2e::section "workflow config + nested run interaction"
+e2e::section "cross-module run applies callee module config; caller scope restored"
 
 NESTED_LOG="${TEST_DIR}/nested.log"
 export JAIPH_NESTED_LOG="${NESTED_LOG}"
@@ -151,10 +152,10 @@ jaiph run "${TEST_DIR}/parent_nested.jh" >/dev/null
 actual="$(cat "${NESTED_LOG}")"
 expected="$(printf '%s\n' \
   'parent_before:claude' \
-  'child_backend:claude' \
+  'child_backend:cursor' \
   'parent_after:claude')"
 e2e::assert_equals "${actual}" "${expected}" \
-  "workflow-level config locks backend for nested cross-module call and restores after"
+  "cross-module call sees callee module backend; caller workflow-level backend restored after"
 
 # ---------------------------------------------------------------------------
 # Section 4: Env variable still wins over workflow config
diff --git a/e2e/tests/91_inbox_dispatch.sh b/e2e/tests/91_inbox_dispatch.sh
index 2967d1ce..2bc742d8 100755
--- a/e2e/tests/91_inbox_dispatch.sh
+++ b/e2e/tests/91_inbox_dispatch.sh
@@ -394,3 +394,52 @@ if [[ "$invalid_lines" -gt 0 ]]; then
   e2e::fail "run_summary.jsonl has ${invalid_lines} invalid JSON lines"
 fi
 e2e::pass "multi-target: run_summary.jsonl lines are valid JSON"
+
+e2e::section "Imported channel send: lib.topic normalizes to topic for routing"
+
+# Given — entry declares channel + route, lib declares the same channel,
+# entry workflow sends via the imported alias `lib.topic`
+e2e::file "lib_inbox.jh" <<'EOF'
+channel topic
+EOF
+
+e2e::file "main_imported_inbox.jh" <<'EOF'
+import "lib_inbox.jh" as lib
+
+channel topic -> handler
+
+script write_imported_received = `echo "$1" > imported_received.txt`
+workflow handler(message, chan, sender) {
+  run write_imported_received(message)
+}
+
+workflow default() {
+  lib.topic <- "x"
+}
+EOF
+
+# When
+e2e::run "main_imported_inbox.jh" >/dev/null
+
+# Then — handler was dispatched with payload "x"
+e2e::assert_file_exists "${TEST_DIR}/imported_received.txt" "handler invoked via lib.topic send"
+e2e::assert_equals "$(cat "${TEST_DIR}/imported_received.txt")" "x" "handler received payload via normalized channel key"
+
+# Then — inbox audit file uses bare channel name
+e2e::expect_file "*inbox/001-topic.txt" <<'EOF'
+x
+EOF
+
+# Then — INBOX_ENQUEUE in run_summary.jsonl uses bare channel name
+imported_run_dir="$(e2e::run_dir "main_imported_inbox.jh")"
+imported_summary="${imported_run_dir}/run_summary.jsonl"
+e2e::assert_file_exists "${imported_summary}" "imported send run_summary.jsonl exists"
+# assert_contains: run_summary.jsonl contains other lines with varying ts/run_id
+enqueue_channel="$(python3 -c "import json
+for line in open('${imported_summary}'):
+    obj = json.loads(line)
+    if obj.get('type') == 'INBOX_ENQUEUE':
+        print(obj['channel'])
+        break
+")"
+e2e::assert_equals "${enqueue_channel}" "topic" "INBOX_ENQUEUE channel is bare name (alias prefix stripped)"
diff --git a/integration/docs-explanation-task3.test.ts b/integration/docs-explanation-task3.test.ts
new file mode 100644
index 00000000..9a059a7e
--- /dev/null
+++ b/integration/docs-explanation-task3.test.ts
@@ -0,0 +1,173 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readFileSync } from "node:fs";
+import { join } from "node:path";
+
+// Task 3 acceptance: Explanation quadrant pages exist, the sandboxing
+// explanation is understanding-oriented (threat model present, enabling
+// procedure + config-key table absent), and the four pages are reachable
+// from the nav. These guards fail when the contract is violated — they
+// are independent of the broader docs-lint harness in task 2.
+
+const REPO_ROOT = process.cwd();
+const DOCS_DIR = join(REPO_ROOT, "docs");
+const NAV_LAYOUT = join(DOCS_DIR, "_layouts", "docs.html");
+
+function readPage(name: string): string {
+  return readFileSync(join(DOCS_DIR, name), "utf8");
+}
+
+function frontMatterDiataxis(source: string): string | null {
+  const m = source.match(/^---\n([\s\S]*?)\n---/);
+  if (!m) return null;
+  const dl = m[1].split("\n").find((l) => /^diataxis\s*:/.test(l));
+  if (!dl) return null;
+  return dl.replace(/^diataxis\s*:\s*/, "").trim().replace(/^['"]|['"]$/g, "");
+}
+
+function frontMatterPermalink(source: string): string | null {
+  const m = source.match(/^---\n([\s\S]*?)\n---/);
+  if (!m) return null;
+  const pl = m[1].split("\n").find((l) => /^permalink\s*:/.test(l));
+  if (!pl) return null;
+  return pl.replace(/^permalink\s*:\s*/, "").trim().replace(/^['"]|['"]$/g, "");
+}
+
+function bodyWithoutFrontMatter(source: string): string {
+  const m = source.match(/^---\n[\s\S]*?\n---\n?/);
+  return m ? source.slice(m[0].length) : source;
+}
+
+const EXPLANATION_PAGES: Array<{
+  file: string;
+  permalink: string;
+  label: string;
+}> = [
+  { file: "why-jaiph.md", permalink: "/why-jaiph", label: "Why Jaiph" },
+  { file: "inbox.md", permalink: "/inbox", label: "Inbox" },
+  {
+    file: "spec-async-handles.md",
+    permalink: "/spec-async-handles",
+    label: "Async Handles",
+  },
+  { file: "sandboxing.md", permalink: "/sandboxing", label: "Sandboxing" },
+];
+
+test("task-3: each new explanation page declares 'diataxis: explanation' and the expected permalink", () => {
+  for (const page of EXPLANATION_PAGES) {
+    const src = readPage(page.file);
+    assert.equal(
+      frontMatterDiataxis(src),
+      "explanation",
+      `${page.file} must declare 'diataxis: explanation'`,
+    );
+    assert.equal(
+      frontMatterPermalink(src),
+      page.permalink,
+      `${page.file} must declare 'permalink: ${page.permalink}'`,
+    );
+  }
+});
+
+test("task-3: every new explanation page is reachable from the nav exactly once", () => {
+  const nav = readFileSync(NAV_LAYOUT, "utf8");
+  const linkRe = /<a\s+href="\{\{\s*'([^']+)'\s*\|\s*relative_url\s*\}\}"/g;
+  const counts = new Map<string, number>();
+  let m: RegExpExecArray | null;
+  while ((m = linkRe.exec(nav)) !== null) {
+    counts.set(m[1], (counts.get(m[1]) ?? 0) + 1);
+  }
+  for (const page of EXPLANATION_PAGES) {
+    assert.equal(
+      counts.get(page.permalink) ?? 0,
+      1,
+      `nav must link to ${page.permalink} exactly once (found ${counts.get(page.permalink) ?? 0})`,
+    );
+  }
+});
+
+test("task-3: sandboxing explanation contains threat-model content", () => {
+  const body = bodyWithoutFrontMatter(readPage("sandboxing.md")).toLowerCase();
+  // A real threat-model section must call out both halves of the boundary.
+  assert.ok(
+    /what docker protects against/.test(body),
+    "sandboxing.md must explicitly describe what the Docker sandbox protects against",
+  );
+  assert.ok(
+    /what docker does \*\*not\*\* protect against|what docker does not protect against/.test(
+      body,
+    ),
+    "sandboxing.md must explicitly describe what the Docker sandbox does NOT protect against",
+  );
+  // Each side must mention at least one concrete claim from the source-grounded list.
+  assert.ok(
+    /cap-drop all|--cap-drop all|capabilities dropped|capability surface/.test(body),
+    "sandboxing.md threat-model must mention dropped capabilities",
+  );
+  assert.ok(
+    /allowlist/.test(body),
+    "sandboxing.md threat-model must mention the env-var allowlist",
+  );
+  assert.ok(
+    /hooks run on the host|hooks.*host/.test(body),
+    "sandboxing.md must call out that hooks run on the host (a deliberate non-protection)",
+  );
+  assert.ok(
+    /network egress/.test(body),
+    "sandboxing.md must call out default-on network egress (a deliberate non-protection)",
+  );
+});
+
+test("task-3: sandboxing explanation has no 'Enabling Docker' procedure heading", () => {
+  const body = bodyWithoutFrontMatter(readPage("sandboxing.md"));
+  // The enabling procedure was a numbered/step-driven section in the legacy
+  // page; it moves to a how-to in task 4 and must not survive in the
+  // understanding-oriented explanation.
+  const headingRe = /^#{2,4}\s+Enabling Docker\b/im;
+  assert.ok(
+    !headingRe.test(body),
+    "sandboxing.md must not contain an 'Enabling Docker' heading — that procedure belongs in a how-to (task 4)",
+  );
+  // Same constraint phrased structurally: no numbered list under a heading
+  // that includes the word 'enabling' or 'enable'.
+  const lines = body.split("\n");
+  let inSuspectSection = false;
+  for (const line of lines) {
+    const h = line.match(/^(#{2,4})\s+(.+)$/);
+    if (h) {
+      inSuspectSection = /enabl/i.test(h[2]);
+      continue;
+    }
+    if (inSuspectSection && /^\s*1\.\s+/.test(line)) {
+      assert.fail(
+        "sandboxing.md contains a numbered enabling procedure under an 'enable*' heading — that belongs in a how-to (task 4)",
+      );
+    }
+  }
+});
+
+test("task-3: sandboxing explanation has no config-key reference table", () => {
+  const body = bodyWithoutFrontMatter(readPage("sandboxing.md"));
+  // Reference key tables follow the shape `| Key | Type | Default | …` or list
+  // backtick-wrapped `runtime.docker_*` keys in a markdown table row.
+  const keyHeaderRe = /^\|\s*Key\s*\|/im;
+  assert.ok(
+    !keyHeaderRe.test(body),
+    "sandboxing.md must not contain a '| Key | …' reference table — config keys belong in the reference (task 5)",
+  );
+  const runtimeKeyRowRe = /^\|\s*`runtime\.docker_[a-z_]+`\s*\|/im;
+  assert.ok(
+    !runtimeKeyRowRe.test(body),
+    "sandboxing.md must not contain a table row listing `runtime.docker_*` keys — that belongs in the reference (task 5)",
+  );
+  // A "Configuration keys" or "Failure modes" reference heading is the same
+  // kind of bleed and is also out of scope for an explanation page.
+  assert.ok(
+    !/^#{2,4}\s+Configuration keys\b/im.test(body),
+    "sandboxing.md must not contain a 'Configuration keys' section — reference content lives elsewhere (task 5)",
+  );
+  assert.ok(
+    !/^#{2,4}\s+Failure modes\b/im.test(body),
+    "sandboxing.md must not contain a 'Failure modes' section — reference content lives elsewhere (task 5)",
+  );
+});
diff --git a/integration/docs-how-to-task4.test.ts b/integration/docs-how-to-task4.test.ts
new file mode 100644
index 00000000..4d0f519c
--- /dev/null
+++ b/integration/docs-how-to-task4.test.ts
@@ -0,0 +1,198 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readFileSync } from "node:fs";
+import { join } from "node:path";
+
+// Task 4 acceptance: How-to quadrant pages exist as task-oriented recipes, each
+// with `diataxis: how-to`, a `/how-to/...` permalink, the right `redirect_from`
+// for any retired slug, and a nav entry. The agent-auth recipe additionally
+// must name every backend credential and the credential-pre-flight error code
+// — that contract comes from src/cli/run/preflight-credentials.ts.
+
+const REPO_ROOT = process.cwd();
+const DOCS_DIR = join(REPO_ROOT, "docs");
+const NAV_LAYOUT = join(DOCS_DIR, "_layouts", "docs.html");
+
+interface HowToPage {
+  /** File under docs/ (immediate child). */
+  file: string;
+  /** Expected `permalink:` value. */
+  permalink: string;
+  /** Old/retired permalinks that must appear under `redirect_from:` (`[]` if none). */
+  redirectFrom: string[];
+  /** Nav label substring used to grep the nav entry's anchor. */
+  navPermalink: string;
+}
+
+const HOW_TO_PAGES: HowToPage[] = [
+  {
+    file: "setup.md",
+    permalink: "/how-to/install",
+    redirectFrom: ["/setup"],
+    navPermalink: "/how-to/install",
+  },
+  {
+    file: "sandbox-run.md",
+    permalink: "/how-to/sandbox-run",
+    redirectFrom: [],
+    navPermalink: "/how-to/sandbox-run",
+  },
+  {
+    file: "agent-auth.md",
+    permalink: "/how-to/agent-auth",
+    redirectFrom: [],
+    navPermalink: "/how-to/agent-auth",
+  },
+  {
+    file: "configure-backend.md",
+    permalink: "/how-to/configure-backend",
+    redirectFrom: [],
+    navPermalink: "/how-to/configure-backend",
+  },
+  {
+    file: "hooks.md",
+    permalink: "/how-to/hooks",
+    redirectFrom: ["/hooks"],
+    navPermalink: "/how-to/hooks",
+  },
+  {
+    file: "libraries.md",
+    permalink: "/how-to/libraries",
+    redirectFrom: ["/libraries"],
+    navPermalink: "/how-to/libraries",
+  },
+  {
+    file: "artifacts.md",
+    permalink: "/how-to/artifacts",
+    redirectFrom: ["/artifacts"],
+    navPermalink: "/how-to/artifacts",
+  },
+  {
+    file: "testing.md",
+    permalink: "/how-to/testing",
+    redirectFrom: ["/testing"],
+    navPermalink: "/how-to/testing",
+  },
+];
+
+function readPage(name: string): string {
+  return readFileSync(join(DOCS_DIR, name), "utf8");
+}
+
+function frontMatterBlock(source: string): string | null {
+  const m = source.match(/^---\n([\s\S]*?)\n---/);
+  return m ? m[1] : null;
+}
+
+function frontMatterScalar(fm: string, key: string): string | null {
+  const line = fm.split("\n").find((l) => new RegExp(`^${key}\\s*:`).test(l));
+  if (!line) return null;
+  return line.replace(new RegExp(`^${key}\\s*:\\s*`), "").trim().replace(/^['"]|['"]$/g, "");
+}
+
+function frontMatterList(fm: string, key: string): string[] {
+  const lines = fm.split("\n");
+  const startIdx = lines.findIndex((l) => new RegExp(`^${key}\\s*:\\s*$`).test(l));
+  if (startIdx === -1) return [];
+  const out: string[] = [];
+  for (let i = startIdx + 1; i < lines.length; i++) {
+    const m = lines[i].match(/^\s*-\s+(.+)$/);
+    if (!m) break;
+    out.push(m[1].trim().replace(/^['"]|['"]$/g, ""));
+  }
+  return out;
+}
+
+test("task-4: every how-to page declares 'diataxis: how-to' and the expected permalink", () => {
+  for (const page of HOW_TO_PAGES) {
+    const fm = frontMatterBlock(readPage(page.file));
+    assert.ok(fm, `${page.file}: missing front-matter block`);
+    assert.equal(
+      frontMatterScalar(fm!, "diataxis"),
+      "how-to",
+      `${page.file}: must declare 'diataxis: how-to'`,
+    );
+    assert.equal(
+      frontMatterScalar(fm!, "permalink"),
+      page.permalink,
+      `${page.file}: must declare 'permalink: ${page.permalink}'`,
+    );
+  }
+});
+
+test("task-4: every retired permalink is absorbed by the new how-to page's redirect_from", () => {
+  for (const page of HOW_TO_PAGES) {
+    if (page.redirectFrom.length === 0) continue;
+    const fm = frontMatterBlock(readPage(page.file));
+    assert.ok(fm, `${page.file}: missing front-matter block`);
+    const declared = frontMatterList(fm!, "redirect_from");
+    for (const slug of page.redirectFrom) {
+      assert.ok(
+        declared.includes(slug),
+        `${page.file}: redirect_from must include '${slug}' so the retired permalink keeps resolving (declared: ${declared.join(", ") || "<none>"})`,
+      );
+    }
+  }
+});
+
+test("task-4: every how-to page is reachable from the nav exactly once", () => {
+  const nav = readFileSync(NAV_LAYOUT, "utf8");
+  const linkRe = /<a\s+href="\{\{\s*'([^']+)'\s*\|\s*relative_url\s*\}\}"/g;
+  const counts = new Map<string, number>();
+  let m: RegExpExecArray | null;
+  while ((m = linkRe.exec(nav)) !== null) {
+    counts.set(m[1], (counts.get(m[1]) ?? 0) + 1);
+  }
+  for (const page of HOW_TO_PAGES) {
+    const count = counts.get(page.navPermalink) ?? 0;
+    assert.equal(
+      count,
+      1,
+      `nav must link to ${page.navPermalink} exactly once (found ${count})`,
+    );
+  }
+});
+
+test("task-4: agent-auth how-to names every backend credential and the pre-flight error code", () => {
+  // The pre-flight implementation is src/cli/run/preflight-credentials.ts; the
+  // recipe must name every credential it checks plus the stable error code so
+  // a user hitting that error can find the page by searching for the literal.
+  const body = readPage("agent-auth.md");
+  const required = [
+    "ANTHROPIC_API_KEY",
+    "CLAUDE_CODE_OAUTH_TOKEN",
+    "CURSOR_API_KEY",
+    "OPENAI_API_KEY",
+    "E_AGENT_CREDENTIALS",
+  ];
+  for (const literal of required) {
+    assert.ok(
+      body.includes(literal),
+      `agent-auth.md must mention the literal '${literal}' (matches the credential pre-flight in src/cli/run/preflight-credentials.ts)`,
+    );
+  }
+  // Also assert that claude's setup-token instruction is present, since that
+  // is the documented path for obtaining a CLAUDE_CODE_OAUTH_TOKEN.
+  assert.ok(
+    /claude setup-token/.test(body),
+    "agent-auth.md must show `claude setup-token` as the way to obtain CLAUDE_CODE_OAUTH_TOKEN",
+  );
+});
+
+test("task-4: how-to pages stay recipe-shaped (goal → numbered steps → verification)", () => {
+  // A recipe is identifiable by numbered steps and a verification section.
+  // This is a structural sanity check — fail if a page drifted back into
+  // open-ended prose without a verifiable conclusion.
+  for (const page of HOW_TO_PAGES) {
+    const body = readPage(page.file);
+    assert.ok(
+      /^##\s+Verification\b/im.test(body) ||
+        /^##\s+Verify(\b|ication\b)/im.test(body),
+      `${page.file}: how-to recipe must include a 'Verification' (or 'Verify') section`,
+    );
+    assert.ok(
+      /^##\s+\d\.\s+/im.test(body) || /^###\s+\d\.\s+/im.test(body),
+      `${page.file}: how-to recipe must include at least one numbered step heading`,
+    );
+  }
+});
diff --git a/integration/docs-nav-structure-task7.test.ts b/integration/docs-nav-structure-task7.test.ts
new file mode 100644
index 00000000..6ac65210
--- /dev/null
+++ b/integration/docs-nav-structure-task7.test.ts
@@ -0,0 +1,157 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readdirSync, readFileSync } from "node:fs";
+import { join } from "node:path";
+
+// Task 7 acceptance: the docs nav is the Diátaxis spine — every published
+// docs/*.md with a `diataxis:` front-matter value must appear under the
+// matching section exactly once, the five section headings must appear in
+// the documented order, and miscategorisation / duplication / omission is a
+// hard failure. The redirect-coverage and clean-jekyll checks live in
+// docs-structure.test.ts and docs-legacy-quarantine.test.ts respectively; this
+// file owns the section-structure contract alone.
+
+const REPO_ROOT = process.cwd();
+const DOCS_DIR = join(REPO_ROOT, "docs");
+const NAV_LAYOUT = join(DOCS_DIR, "_layouts", "docs.html");
+
+const SECTIONS: Array<{ heading: string; diataxis: string }> = [
+  { heading: "Tutorials", diataxis: "tutorial" },
+  { heading: "How-to guides", diataxis: "how-to" },
+  { heading: "Reference", diataxis: "reference" },
+  { heading: "Explanation", diataxis: "explanation" },
+  { heading: "Contributing", diataxis: "contributor" },
+];
+
+interface Page {
+  file: string;
+  permalink: string;
+  diataxis: string;
+}
+
+function frontMatter(source: string): string | null {
+  const m = source.match(/^---\n([\s\S]*?)\n---/);
+  return m ? m[1] : null;
+}
+
+function scalar(fm: string, key: string): string | null {
+  const line = fm.split("\n").find((l) => new RegExp(`^${key}\\s*:`).test(l));
+  if (!line) return null;
+  return line
+    .replace(new RegExp(`^${key}\\s*:\\s*`), "")
+    .trim()
+    .replace(/^['"]|['"]$/g, "");
+}
+
+function loadPublishedPages(): Page[] {
+  const pages: Page[] = [];
+  for (const entry of readdirSync(DOCS_DIR)) {
+    if (!entry.endsWith(".md")) continue;
+    const src = readFileSync(join(DOCS_DIR, entry), "utf8");
+    const fm = frontMatter(src);
+    if (!fm) continue;
+    const diataxis = scalar(fm, "diataxis");
+    const permalink = scalar(fm, "permalink");
+    if (!diataxis || !permalink) continue;
+    pages.push({ file: entry, permalink, diataxis });
+  }
+  return pages;
+}
+
+interface NavParse {
+  headings: string[];
+  bySection: Map<string, string[]>;
+}
+
+function parseNav(): NavParse {
+  const html = readFileSync(NAV_LAYOUT, "utf8");
+  const itemRe =
+    /<li(?:\s+class="docs-nav-group")?\s*>(?:<a\s+href="\{\{\s*'([^']+)'\s*\|\s*relative_url\s*\}\}"[^>]*>([^<]+)<\/a>|([^<]+))<\/li>/g;
+  const headings: string[] = [];
+  const bySection = new Map<string, string[]>();
+  let currentHeading: string | null = null;
+  let m: RegExpExecArray | null;
+  while ((m = itemRe.exec(html)) !== null) {
+    const isGroup = /class="docs-nav-group"/.test(m[0]);
+    if (isGroup) {
+      currentHeading = (m[3] ?? "").trim();
+      headings.push(currentHeading);
+      bySection.set(currentHeading, []);
+      continue;
+    }
+    const permalink = m[1];
+    if (!permalink || permalink === "/" || currentHeading === null) continue;
+    bySection.get(currentHeading)!.push(permalink);
+  }
+  return { headings, bySection };
+}
+
+test("task-7: nav contains the five Diátaxis section headings in the documented order", () => {
+  const { headings } = parseNav();
+  const expected = SECTIONS.map((s) => s.heading);
+  // Slice to handle the case where the nav adds further <li class="docs-nav-group">
+  // headings in the future; the contract is "these five, in this order, before
+  // anything else". A simple equality is fine today and tightens the contract.
+  assert.deepEqual(
+    headings,
+    expected,
+    `nav section headings must be exactly ${JSON.stringify(expected)} in this order; got ${JSON.stringify(headings)}`,
+  );
+});
+
+test("task-7: every published diataxis page appears under its section exactly once (no miss / no miscategorisation / no dup)", () => {
+  const pages = loadPublishedPages();
+  const { bySection } = parseNav();
+
+  for (const section of SECTIONS) {
+    const links = bySection.get(section.heading) ?? [];
+    const pagesInSection = pages.filter((p) => p.diataxis === section.diataxis);
+    const expectedPermalinks = pagesInSection.map((p) => p.permalink).sort();
+    const actualPermalinks = [...links].sort();
+
+    assert.deepEqual(
+      actualPermalinks,
+      expectedPermalinks,
+      `section "${section.heading}" (diataxis: ${section.diataxis}) members drifted from the set of published pages with that diataxis.\n  expected: ${JSON.stringify(expectedPermalinks)}\n  actual:   ${JSON.stringify(actualPermalinks)}`,
+    );
+
+    // Defensive: assert no duplicate permalinks within the section's own list.
+    const counts = new Map<string, number>();
+    for (const link of links) counts.set(link, (counts.get(link) ?? 0) + 1);
+    for (const [link, n] of counts) {
+      assert.equal(
+        n,
+        1,
+        `section "${section.heading}" lists ${link} ${n} times — every page must appear exactly once`,
+      );
+    }
+  }
+
+  // And cross-section: no permalink may appear under more than one section.
+  const seen = new Map<string, string>();
+  for (const section of SECTIONS) {
+    for (const link of bySection.get(section.heading) ?? []) {
+      const owner = seen.get(link);
+      assert.ok(
+        owner === undefined,
+        `${link} appears under both "${owner}" and "${section.heading}" — pages may only appear in one section`,
+      );
+      seen.set(link, section.heading);
+    }
+  }
+
+  // And every published diataxis page is reachable: nothing landed orphaned
+  // between sections because the section's heading was missing.
+  for (const p of pages) {
+    const section = SECTIONS.find((s) => s.diataxis === p.diataxis);
+    assert.ok(
+      section,
+      `${p.file}: diataxis '${p.diataxis}' has no nav section`,
+    );
+    const links = bySection.get(section!.heading) ?? [];
+    assert.ok(
+      links.includes(p.permalink),
+      `${p.file}: published page ${p.permalink} (diataxis: ${p.diataxis}) is missing from the "${section!.heading}" section`,
+    );
+  }
+});
diff --git a/integration/docs-reference-task5.test.ts b/integration/docs-reference-task5.test.ts
new file mode 100644
index 00000000..eea72afb
--- /dev/null
+++ b/integration/docs-reference-task5.test.ts
@@ -0,0 +1,203 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readFileSync, readdirSync, statSync } from "node:fs";
+import { join } from "node:path";
+
+// Task 5 acceptance: Reference quadrant pages exist as pure lookup pages, the
+// env-var reference is source-parity-pinned against `src/` (drift in either
+// direction fails the test), and reference pages contain no tutorial-shaped
+// prose. These guards fail when the contract is violated — they are
+// independent of the broader docs-lint harness in task 2.
+
+const REPO_ROOT = process.cwd();
+const DOCS_DIR = join(REPO_ROOT, "docs");
+const NAV_LAYOUT = join(DOCS_DIR, "_layouts", "docs.html");
+const SRC_DIR = join(REPO_ROOT, "src");
+
+const REFERENCE_PAGES: Array<{ file: string; permalink: string }> = [
+  { file: "cli.md", permalink: "/reference/cli" },
+  { file: "configuration.md", permalink: "/reference/configuration" },
+  { file: "grammar.md", permalink: "/reference/grammar" },
+  { file: "language.md", permalink: "/reference/language" },
+  { file: "env-vars.md", permalink: "/reference/env-vars" },
+];
+
+function readPage(name: string): string {
+  return readFileSync(join(DOCS_DIR, name), "utf8");
+}
+
+function frontMatterBlock(source: string): string | null {
+  const m = source.match(/^---\n([\s\S]*?)\n---/);
+  return m ? m[1] : null;
+}
+
+function frontMatterScalar(fm: string, key: string): string | null {
+  const line = fm.split("\n").find((l) => new RegExp(`^${key}\\s*:`).test(l));
+  if (!line) return null;
+  return line.replace(new RegExp(`^${key}\\s*:\\s*`), "").trim().replace(/^['"]|['"]$/g, "");
+}
+
+function bodyWithoutFrontMatter(source: string): string {
+  const m = source.match(/^---\n[\s\S]*?\n---\n?/);
+  return m ? source.slice(m[0].length) : source;
+}
+
+function walkSourceFiles(dir: string, out: string[] = []): string[] {
+  for (const entry of readdirSync(dir)) {
+    if (entry === "node_modules" || entry === ".git") continue;
+    const full = join(dir, entry);
+    const st = statSync(full);
+    if (st.isDirectory()) {
+      walkSourceFiles(full, out);
+    } else if (
+      entry.endsWith(".ts") &&
+      !entry.endsWith(".d.ts")
+    ) {
+      out.push(full);
+    }
+  }
+  return out;
+}
+
+function collectJaiphEnvNamesFromSource(): Set<string> {
+  // Source-parity pattern: greppable `<anyIdentifier>env.JAIPH_X` /
+  // `process.env.JAIPH_X` / `process.env["JAIPH_X"]` anywhere under src/.
+  // The leading `[a-zA-Z]*` lets the test catch both `env.JAIPH_*` (the
+  // host-side runner env in `src/cli/run/env.ts`), `process.env.JAIPH_*`
+  // (callers that go through the full Node `process.env` namespace), and
+  // `parentEnv.JAIPH_*` (the runtime's metadata-merge lock checks in
+  // `src/runtime/kernel/node-workflow-runtime.ts`). All three forms are
+  // semantically equivalent reads of the same variable.
+  const PATTERNS = [
+    /[a-zA-Z]*[Ee]nv\.JAIPH_([A-Z_]+)/g,
+    /process\.env\[["']JAIPH_([A-Z_]+)["']\]/g,
+  ];
+  const names = new Set<string>();
+  for (const file of walkSourceFiles(SRC_DIR)) {
+    const text = readFileSync(file, "utf8");
+    for (const re of PATTERNS) {
+      re.lastIndex = 0;
+      let m: RegExpExecArray | null;
+      while ((m = re.exec(text)) !== null) {
+        names.add(`JAIPH_${m[1]}`);
+      }
+    }
+  }
+  return names;
+}
+
+function extractParityNamesFromEnvVarsPage(): Set<string> {
+  const body = bodyWithoutFrontMatter(readPage("env-vars.md"));
+  // The canonical parity-pinned table is delimited by HTML markers so other
+  // sections (installer-only vars, vendor credentials) are not subject to the
+  // strict src-drift gate.
+  const m = body.match(
+    /<!--\s*begin:\s*src-parity\s*-->([\s\S]*?)<!--\s*end:\s*src-parity\s*-->/,
+  );
+  assert.ok(
+    m,
+    "env-vars.md must include a `<!-- begin: src-parity -->` / `<!-- end: src-parity -->` block delimiting the source-parity table",
+  );
+  const block = m![1];
+  // Match every backtick-wrapped `JAIPH_NAME` token in the block — every table
+  // row's first column wraps the variable name in backticks.
+  const names = new Set<string>();
+  const tokenRe = /`(JAIPH_[A-Z_]+)`/g;
+  let mm: RegExpExecArray | null;
+  while ((mm = tokenRe.exec(block)) !== null) {
+    names.add(mm[1]);
+  }
+  return names;
+}
+
+test("task-5: every reference page declares 'diataxis: reference' and the expected permalink", () => {
+  for (const page of REFERENCE_PAGES) {
+    const fm = frontMatterBlock(readPage(page.file));
+    assert.ok(fm, `${page.file}: missing front-matter block`);
+    assert.equal(
+      frontMatterScalar(fm!, "diataxis"),
+      "reference",
+      `${page.file}: must declare 'diataxis: reference'`,
+    );
+    assert.equal(
+      frontMatterScalar(fm!, "permalink"),
+      page.permalink,
+      `${page.file}: must declare 'permalink: ${page.permalink}'`,
+    );
+  }
+});
+
+test("task-5: every reference page is reachable from the nav exactly once", () => {
+  const nav = readFileSync(NAV_LAYOUT, "utf8");
+  const linkRe = /<a\s+href="\{\{\s*'([^']+)'\s*\|\s*relative_url\s*\}\}"/g;
+  const counts = new Map<string, number>();
+  let m: RegExpExecArray | null;
+  while ((m = linkRe.exec(nav)) !== null) {
+    counts.set(m[1], (counts.get(m[1]) ?? 0) + 1);
+  }
+  for (const page of REFERENCE_PAGES) {
+    const count = counts.get(page.permalink) ?? 0;
+    assert.equal(
+      count,
+      1,
+      `nav must link to ${page.permalink} exactly once (found ${count})`,
+    );
+  }
+});
+
+test("task-5: env-vars reference is source-parity-pinned against src/ (drift in either direction fails)", () => {
+  const fromSource = collectJaiphEnvNamesFromSource();
+  const fromPage = extractParityNamesFromEnvVarsPage();
+
+  const missingFromPage = [...fromSource].filter((n) => !fromPage.has(n)).sort();
+  const missingFromSource = [...fromPage].filter((n) => !fromSource.has(n)).sort();
+
+  assert.deepEqual(
+    missingFromPage,
+    [],
+    `env-vars.md must list every JAIPH_* name read in src/. Missing from page: ${missingFromPage.join(", ") || "<none>"}`,
+  );
+  assert.deepEqual(
+    missingFromSource,
+    [],
+    `env-vars.md must not list a JAIPH_* name absent from src/. Page rows without a src reference: ${missingFromSource.join(", ") || "<none>"}`,
+  );
+
+  // A non-empty intersection is the goal; assert the parity table is not empty
+  // so a future "delete every row" regression also trips this guard.
+  assert.ok(
+    fromPage.size > 30,
+    `env-vars.md parity table looks suspiciously short — only ${fromPage.size} rows`,
+  );
+});
+
+test("task-5: reference pages contain no tutorial-shaped numbered walkthroughs", () => {
+  for (const page of REFERENCE_PAGES) {
+    const body = bodyWithoutFrontMatter(readPage(page.file));
+    // Reject numbered ## / ### section headings (the how-to recipe shape).
+    const numberedHeading = /^#{2,4}\s+\d+\.\s+/m;
+    assert.ok(
+      !numberedHeading.test(body),
+      `${page.file}: reference pages must not use numbered '## 1. <step>' / '### 2. <step>' section headings — that shape belongs in a how-to`,
+    );
+    // Reject the how-to recipe's terminal section.
+    assert.ok(
+      !/^#{2,4}\s+(Verification|Verify(?:\s|$))/im.test(body),
+      `${page.file}: reference pages must not include a 'Verification' / 'Verify' section — that shape belongs in a how-to`,
+    );
+    // Reject paragraphs that begin with second-person imperative procedure verbs.
+    const tutorialLeads = /^(You can now|You will|Now you|Now, you|First,? you|Next,? you|Finally,? you)/im;
+    assert.ok(
+      !tutorialLeads.test(body),
+      `${page.file}: reference pages must avoid second-person tutorial prose ('You will…', 'Now you…', etc.)`,
+    );
+    // Heuristic upper bound on second-person pronouns. Reference is allowed
+    // some 'your run dir' / 'your workflow' phrasing, but a high count is a
+    // signal of drifted tutorial content.
+    const pronouns = (body.match(/\b(you|your|yourself)\b/gi) ?? []).length;
+    assert.ok(
+      pronouns <= 12,
+      `${page.file}: too many second-person pronouns (${pronouns}); reference pages should describe the system, not address the reader`,
+    );
+  }
+});
diff --git a/integration/docs-structure.test.ts b/integration/docs-structure.test.ts
new file mode 100644
index 00000000..ac69e2a8
--- /dev/null
+++ b/integration/docs-structure.test.ts
@@ -0,0 +1,348 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { spawnSync } from "node:child_process";
+import { readdirSync, readFileSync } from "node:fs";
+import { join } from "node:path";
+
+const REPO_ROOT = process.cwd();
+const DOCS_DIR = join(REPO_ROOT, "docs");
+const NAV_LAYOUT = join(DOCS_DIR, "_layouts", "docs.html");
+
+const VALID_DIATAXIS = new Set([
+  "tutorial",
+  "how-to",
+  "reference",
+  "explanation",
+  "contributor",
+]);
+
+interface PageInfo {
+  name: string;
+  body: string;
+  permalink: string | null;
+  redirectFrom: string[];
+  diataxis: string | null;
+  anchors: Set<string>;
+}
+
+function stripQuotes(value: string): string {
+  if (
+    (value.startsWith('"') && value.endsWith('"')) ||
+    (value.startsWith("'") && value.endsWith("'"))
+  ) {
+    return value.slice(1, -1);
+  }
+  return value;
+}
+
+// Minimal YAML-ish front-matter parser. Supports `key: scalar` lines and
+// `key:` followed by `  - value` list items, which is everything our docs
+// front-matter uses. Anything more exotic is intentionally out of scope.
+function parseFrontMatter(source: string): {
+  fm: Record<string, string | string[]>;
+  body: string;
+} {
+  const normalized = source.replace(/\r\n/g, "\n");
+  if (!normalized.startsWith("---\n")) {
+    return { fm: {}, body: normalized };
+  }
+  const lines = normalized.split("\n");
+  let end = -1;
+  for (let i = 1; i < lines.length; i++) {
+    if (lines[i].trim() === "---") {
+      end = i;
+      break;
+    }
+  }
+  if (end === -1) return { fm: {}, body: normalized };
+
+  const fm: Record<string, string | string[]> = {};
+  let currentListKey: string | null = null;
+  for (let i = 1; i < end; i++) {
+    const line = lines[i];
+    const trimmed = line.trim();
+    if (!trimmed) continue;
+    if (/^-\s+/.test(trimmed) && currentListKey) {
+      const value = stripQuotes(trimmed.replace(/^-\s+/, ""));
+      (fm[currentListKey] as string[]).push(value);
+      continue;
+    }
+    const m = line.match(/^([a-zA-Z_][a-zA-Z0-9_-]*)\s*:\s*(.*)$/);
+    if (!m) {
+      currentListKey = null;
+      continue;
+    }
+    const key = m[1];
+    const value = m[2].trim();
+    if (value === "") {
+      fm[key] = [];
+      currentListKey = key;
+    } else {
+      fm[key] = stripQuotes(value);
+      currentListKey = null;
+    }
+  }
+  return { fm, body: lines.slice(end + 1).join("\n") };
+}
+
+function slugify(headingText: string): string {
+  // kramdown / GFM heading slug: drop code-span ticks, drop emphasis marks,
+  // lowercase, keep [a-z0-9-], collapse whitespace to dashes.
+  return headingText
+    .replace(/`([^`]*)`/g, "$1")
+    .replace(/[*_~]/g, "")
+    .toLowerCase()
+    .replace(/[^a-z0-9\s-]/g, "")
+    .trim()
+    .replace(/\s+/g, "-");
+}
+
+function extractAnchors(body: string): Set<string> {
+  const anchors = new Set<string>();
+  let inFence = false;
+  for (const line of body.split("\n")) {
+    if (/^```/.test(line)) {
+      inFence = !inFence;
+      continue;
+    }
+    if (inFence) continue;
+    // ATX heading: # ... [{#explicit-id} | {:#explicit-id} | {: #explicit-id}]
+    const h = line.match(/^(#{1,6})\s+(.+?)\s*#*\s*$/);
+    if (h) {
+      const text = h[2].trim();
+      const explicit = text.match(/\{:?\s*#([a-zA-Z0-9_-]+)\}\s*$/);
+      if (explicit) {
+        anchors.add(explicit[1]);
+        anchors.add(slugify(text.replace(/\{:?\s*#[^}]+\}\s*$/, "")));
+      } else {
+        anchors.add(slugify(text));
+      }
+    }
+    // kramdown Inline Attribute List attached to any preceding block:
+    //   {:#anchor}  /  {: #anchor}  on its own line.
+    const ial = line.match(/^\s*\{:\s*#([a-zA-Z0-9_-]+)\s*\}\s*$/);
+    if (ial) anchors.add(ial[1]);
+  }
+  return anchors;
+}
+
+function loadPages(): PageInfo[] {
+  const pages: PageInfo[] = [];
+  for (const entry of readdirSync(DOCS_DIR)) {
+    if (!entry.endsWith(".md")) continue;
+    const source = readFileSync(join(DOCS_DIR, entry), "utf8");
+    const { fm, body } = parseFrontMatter(source);
+    pages.push({
+      name: entry,
+      body,
+      permalink: typeof fm.permalink === "string" ? fm.permalink : null,
+      redirectFrom: Array.isArray(fm.redirect_from) ? fm.redirect_from : [],
+      diataxis: typeof fm.diataxis === "string" ? fm.diataxis : null,
+      anchors: extractAnchors(body),
+    });
+  }
+  return pages;
+}
+
+function extractNavPermalinks(navHtml: string): string[] {
+  // Counts every <a href="{{ '/foo' | relative_url }}"> as exactly one nav entry.
+  const linkPattern = /<a\s+href="\{\{\s*'([^']+)'\s*\|\s*relative_url\s*\}\}"/g;
+  const links: string[] = [];
+  let m: RegExpExecArray | null;
+  while ((m = linkPattern.exec(navHtml)) !== null) {
+    links.push(m[1]);
+  }
+  return links;
+}
+
+function pageByPermalink(pages: PageInfo[]): Map<string, PageInfo> {
+  const map = new Map<string, PageInfo>();
+  for (const p of pages) {
+    if (p.permalink) map.set(p.permalink, p);
+  }
+  return map;
+}
+
+function allKnownRoutes(pages: PageInfo[]): Set<string> {
+  const routes = new Set<string>(["/"]);
+  for (const p of pages) {
+    if (p.permalink) routes.add(p.permalink);
+    for (const r of p.redirectFrom) routes.add(r);
+  }
+  return routes;
+}
+
+function collectHistoricalNavPermalinks(): Set<string> | null {
+  const proc = spawnSync(
+    "git",
+    ["log", "-p", "--all", "--", "docs/_layouts/docs.html"],
+    { cwd: REPO_ROOT, encoding: "utf8", maxBuffer: 64 * 1024 * 1024 },
+  );
+  if (proc.status !== 0) return null;
+  const set = new Set<string>();
+  const re = /'(\/[a-zA-Z0-9_-][a-zA-Z0-9_/-]*)'\s*\|\s*relative_url/g;
+  let m: RegExpExecArray | null;
+  while ((m = re.exec(proc.stdout)) !== null) {
+    set.add(m[1]);
+  }
+  return set;
+}
+
+test("docs-lint: every published docs/*.md has a valid 'diataxis:' front-matter value", () => {
+  const pages = loadPages();
+  assert.ok(pages.length > 0, "expected at least one published doc under docs/");
+  for (const p of pages) {
+    assert.notEqual(
+      p.diataxis,
+      null,
+      `${p.name}: missing 'diataxis:' front-matter (allowed: ${[...VALID_DIATAXIS].join(", ")})`,
+    );
+    assert.ok(
+      VALID_DIATAXIS.has(p.diataxis!),
+      `${p.name}: invalid 'diataxis: ${p.diataxis}' (allowed: ${[...VALID_DIATAXIS].join(", ")})`,
+    );
+  }
+});
+
+test("docs-lint: every nav permalink corresponds to a published page", () => {
+  const nav = readFileSync(NAV_LAYOUT, "utf8");
+  const links = extractNavPermalinks(nav);
+  const pages = loadPages();
+  const byPermalink = pageByPermalink(pages);
+
+  for (const link of links) {
+    if (link === "/" || link === "") continue;
+    assert.ok(
+      byPermalink.has(link),
+      `nav link ${link} has no matching published page (no docs/*.md declares 'permalink: ${link}')`,
+    );
+  }
+});
+
+test("docs-lint: every published page is linked from nav exactly once", () => {
+  const nav = readFileSync(NAV_LAYOUT, "utf8");
+  const links = extractNavPermalinks(nav);
+  const pages = loadPages();
+  const counts = new Map<string, number>();
+  for (const link of links) counts.set(link, (counts.get(link) ?? 0) + 1);
+
+  for (const p of pages) {
+    assert.ok(
+      p.permalink,
+      `${p.name}: published page must declare a 'permalink:' so nav can target it exactly once`,
+    );
+    const count = counts.get(p.permalink!) ?? 0;
+    assert.equal(
+      count,
+      1,
+      `${p.name}: expected exactly one nav entry for ${p.permalink} but found ${count}`,
+    );
+  }
+});
+
+test("docs-lint: every internal markdown link / permalink / redirect_from resolves", () => {
+  const pages = loadPages();
+  const routes = allKnownRoutes(pages);
+  const byPermalink = pageByPermalink(pages);
+  const byName = new Map(pages.map((p) => [p.name, p]));
+
+  // [label](href) but not images (![label](href))
+  const mdLinkRe = /(?<!!)\[([^\]]+)\]\(([^)\s]+)\)/g;
+
+  for (const p of pages) {
+    let m: RegExpExecArray | null;
+    while ((m = mdLinkRe.exec(p.body)) !== null) {
+      const label = m[1];
+      const href = m[2];
+      if (/^(https?:|mailto:|tel:)/i.test(href)) continue;
+      let path = href;
+      let anchor: string | null = null;
+      const hashIdx = path.indexOf("#");
+      if (hashIdx >= 0) {
+        anchor = path.slice(hashIdx + 1);
+        path = path.slice(0, hashIdx);
+      }
+
+      if (!path) {
+        // in-page anchor link
+        assert.ok(
+          anchor !== null && p.anchors.has(anchor),
+          `${p.name}: in-page link [${label}](${href}) has no matching heading`,
+        );
+        continue;
+      }
+
+      let route: string;
+      if (path.startsWith("/")) {
+        route = path.replace(/\/$/, "") || "/";
+      } else if (path.endsWith(".md")) {
+        // Relative file link. jekyll-relative-links rewrites it to the target
+        // page's permalink, so resolve by the target FILE's declared permalink
+        // (basename -> page -> permalink), not a naive "/basename" — pages may
+        // live at nested permalinks (e.g. /tutorials/first-workflow).
+        const targetName = path.split("/").pop()!;
+        const target = byName.get(targetName);
+        assert.ok(
+          target && target.permalink,
+          `${p.name}: link [${label}](${href}) — no published page file '${targetName}'`,
+        );
+        route = target!.permalink!;
+      } else {
+        route = "/" + path.replace(/\/$/, "");
+      }
+
+      assert.ok(
+        routes.has(route),
+        `${p.name}: link [${label}](${href}) — route '${route}' does not resolve to any published page or redirect_from`,
+      );
+
+      // Only verify anchor when the route resolves to a real live page.
+      // If it resolves only via a redirect_from, the target page is a redirect
+      // landing and almost never carries the original section anchor; future
+      // Diátaxis pages will own those anchors.
+      if (anchor) {
+        const target = byPermalink.get(route);
+        if (target) {
+          assert.ok(
+            target.anchors.has(anchor),
+            `${p.name}: link [${label}](${href}) — anchor '#${anchor}' not found in ${target.name}`,
+          );
+        }
+      }
+    }
+
+    // redirect_from must not collide with another page's permalink
+    for (const r of p.redirectFrom) {
+      const owner = byPermalink.get(r);
+      assert.ok(
+        !owner || owner === p,
+        `${p.name}: redirect_from '${r}' collides with permalink of ${owner?.name}`,
+      );
+    }
+  }
+});
+
+test("docs-lint: every historical nav permalink still resolves (via page or redirect_from)", () => {
+  const historical = collectHistoricalNavPermalinks();
+  if (historical === null) {
+    // git unavailable in this sandbox — historical coverage cannot be checked.
+    return;
+  }
+  const pages = loadPages();
+  const routes = allKnownRoutes(pages);
+  for (const link of historical) {
+    if (link === "/" || link === "") continue;
+    assert.ok(
+      routes.has(link),
+      `historical nav permalink '${link}' no longer resolves: add it under 'redirect_from:' on a live page (architecture.md or jaiph-skill.md)`,
+    );
+  }
+});
+
+test("docs-lint: docs/_legacy/ no longer exists (post-redesign cleanup)", () => {
+  const legacy = join(DOCS_DIR, "_legacy");
+  assert.ok(
+    !readdirSync(DOCS_DIR).includes("_legacy"),
+    `docs/_legacy/ must be removed after the Diátaxis redesign; found ${legacy}`,
+  );
+});
diff --git a/integration/docs-tutorials-task6.test.ts b/integration/docs-tutorials-task6.test.ts
new file mode 100644
index 00000000..345609c7
--- /dev/null
+++ b/integration/docs-tutorials-task6.test.ts
@@ -0,0 +1,223 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { spawnSync } from "node:child_process";
+import {
+  existsSync,
+  mkdtempSync,
+  readFileSync,
+  rmSync,
+  writeFileSync,
+} from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+
+// Task 6 acceptance: Tutorials quadrant pages exist, are wired into nav,
+// retire `/getting-started` via redirect_from, and the first-workflow
+// tutorial's `.jh` snippet is *executable* — extracting the first ```jh
+// fenced block and running it with `JAIPH_UNSAFE=true` produces the
+// documented output. This guards against tutorials drifting into
+// aspirational prose where the copy-pasted commands no longer work.
+
+const REPO_ROOT = process.cwd();
+const DOCS_DIR = join(REPO_ROOT, "docs");
+const NAV_LAYOUT = join(DOCS_DIR, "_layouts", "docs.html");
+const JAIPH_BIN = join(REPO_ROOT, "dist", "src", "cli.js");
+
+const TUTORIAL_PAGES: Array<{ file: string; permalink: string }> = [
+  { file: "first-workflow.md", permalink: "/tutorials/first-workflow" },
+  { file: "first-agent-run.md", permalink: "/tutorials/first-agent-run" },
+];
+
+function readPage(name: string): string {
+  return readFileSync(join(DOCS_DIR, name), "utf8");
+}
+
+function frontMatterBlock(source: string): string | null {
+  const m = source.match(/^---\n([\s\S]*?)\n---/);
+  return m ? m[1] : null;
+}
+
+function frontMatterScalar(fm: string, key: string): string | null {
+  const line = fm.split("\n").find((l) => new RegExp(`^${key}\\s*:`).test(l));
+  if (!line) return null;
+  return line.replace(new RegExp(`^${key}\\s*:\\s*`), "").trim().replace(/^['"]|['"]$/g, "");
+}
+
+function frontMatterList(fm: string, key: string): string[] {
+  const lines = fm.split("\n");
+  const startIdx = lines.findIndex((l) => new RegExp(`^${key}\\s*:\\s*$`).test(l));
+  if (startIdx === -1) return [];
+  const out: string[] = [];
+  for (let i = startIdx + 1; i < lines.length; i++) {
+    const m = lines[i].match(/^\s*-\s+(.+)$/);
+    if (!m) break;
+    out.push(m[1].trim().replace(/^['"]|['"]$/g, ""));
+  }
+  return out;
+}
+
+function extractFencedBlocks(body: string, lang: string): string[] {
+  // CommonMark: a fenced block opens with ```<lang> on its own line and
+  // closes on the next line that is exactly ``` (allowing trailing space).
+  // The tutorial deliberately uses single-backtick script bodies so no
+  // nested ``` appears inside ```jh blocks — keep this extractor simple.
+  const lines = body.split("\n");
+  const blocks: string[] = [];
+  let i = 0;
+  while (i < lines.length) {
+    const open = lines[i].match(/^```(\w[\w-]*)\s*$/);
+    if (!open) {
+      i++;
+      continue;
+    }
+    const openLang = open[1];
+    i++;
+    const start = i;
+    while (i < lines.length && !/^```\s*$/.test(lines[i])) i++;
+    if (openLang === lang) {
+      blocks.push(lines.slice(start, i).join("\n"));
+    }
+    i++; // skip the closing fence
+  }
+  return blocks;
+}
+
+function normalizeRunTimings(out: string): string {
+  // Strip per-step and total elapsed times so output comparison is stable.
+  // Matches "(0s)", "(0.2s)", "(123ms)", "(1.5s)".
+  return out.replace(/\(\d+(\.\d+)?(s|ms)\)/g, "(<time>)");
+}
+
+test("task-6: every tutorial page declares 'diataxis: tutorial' and the expected permalink", () => {
+  for (const page of TUTORIAL_PAGES) {
+    const fm = frontMatterBlock(readPage(page.file));
+    assert.ok(fm, `${page.file}: missing front-matter block`);
+    assert.equal(
+      frontMatterScalar(fm!, "diataxis"),
+      "tutorial",
+      `${page.file}: must declare 'diataxis: tutorial'`,
+    );
+    assert.equal(
+      frontMatterScalar(fm!, "permalink"),
+      page.permalink,
+      `${page.file}: must declare 'permalink: ${page.permalink}'`,
+    );
+  }
+});
+
+test("task-6: every tutorial is reachable from the nav exactly once", () => {
+  const nav = readFileSync(NAV_LAYOUT, "utf8");
+  const linkRe = /<a\s+href="\{\{\s*'([^']+)'\s*\|\s*relative_url\s*\}\}"/g;
+  const counts = new Map<string, number>();
+  let m: RegExpExecArray | null;
+  while ((m = linkRe.exec(nav)) !== null) {
+    counts.set(m[1], (counts.get(m[1]) ?? 0) + 1);
+  }
+  for (const page of TUTORIAL_PAGES) {
+    const count = counts.get(page.permalink) ?? 0;
+    assert.equal(
+      count,
+      1,
+      `nav must link to ${page.permalink} exactly once (found ${count})`,
+    );
+  }
+  // The nav must surface a "Tutorials" group label so the two pages render
+  // as a learning quadrant rather than dangling next to How-to / Reference.
+  assert.match(
+    nav,
+    /<li class="docs-nav-group">Tutorials<\/li>/,
+    "nav must include a 'Tutorials' group heading",
+  );
+});
+
+test("task-6: '/getting-started' is absorbed by the first-workflow tutorial's redirect_from", () => {
+  // The retired permalink must be claimed by exactly one live page (the new
+  // tutorial). Any other live page declaring 'permalink: /getting-started'
+  // or duplicating the redirect_from would conflict with jekyll-redirect-from.
+  const fm = frontMatterBlock(readPage("first-workflow.md"));
+  assert.ok(fm, "first-workflow.md: missing front-matter block");
+  const declared = frontMatterList(fm!, "redirect_from");
+  assert.ok(
+    declared.includes("/getting-started"),
+    `first-workflow.md: redirect_from must include '/getting-started' (declared: ${declared.join(", ") || "<none>"})`,
+  );
+  // Defensive: architecture.md previously claimed /getting-started while no
+  // tutorial existed. Once this tutorial owns the slug, the older entry must
+  // be gone so jekyll-redirect-from does not emit two competing stubs.
+  const archFm = frontMatterBlock(readPage("architecture.md"));
+  assert.ok(archFm, "architecture.md: missing front-matter block");
+  const archRedirects = frontMatterList(archFm!, "redirect_from");
+  assert.ok(
+    !archRedirects.includes("/getting-started"),
+    "architecture.md must no longer claim '/getting-started' under redirect_from — the tutorial owns it now",
+  );
+});
+
+test("task-6: first-workflow tutorial's `.jh` snippet runs end-to-end and matches the documented output", () => {
+  const page = readPage("first-workflow.md");
+  const jhBlocks = extractFencedBlocks(page, "jh");
+  assert.ok(
+    jhBlocks.length >= 1,
+    "first-workflow.md: expected at least one ```jh fenced code block",
+  );
+  const textBlocks = extractFencedBlocks(page, "text");
+  assert.ok(
+    textBlocks.length >= 1,
+    "first-workflow.md: expected at least one ```text fenced block (documented output)",
+  );
+
+  const snippet = jhBlocks[0];
+  const expectedOutput = textBlocks[0];
+
+  // The snippet is parameterised with `who`. The tutorial copy-paste invokes
+  // it with "Adam"; pinning the same argument here keeps the contract honest.
+  const args = ["Adam"];
+
+  const tmp = mkdtempSync(join(tmpdir(), "jaiph-tutorial-"));
+  try {
+    const entry = join(tmp, "hello.jh");
+    writeFileSync(entry, snippet);
+
+    assert.ok(
+      existsSync(JAIPH_BIN),
+      `${JAIPH_BIN} not found — run \`npm run build\` first`,
+    );
+
+    const env = {
+      // Clean env: PATH for child shell + script execve, HOME for any
+      // tooling that touches it, JAIPH_UNSAFE so Docker is bypassed in CI,
+      // and TERM so the runtime does not try to render TTY escapes.
+      PATH: process.env.PATH ?? "/usr/bin:/bin",
+      HOME: tmp,
+      JAIPH_UNSAFE: "true",
+      TERM: "dumb",
+      NO_COLOR: "1",
+    };
+
+    const result = spawnSync(
+      process.execPath,
+      [JAIPH_BIN, "run", entry, ...args],
+      { env, encoding: "utf8", cwd: tmp, timeout: 60_000 },
+    );
+
+    assert.equal(
+      result.status,
+      0,
+      `tutorial snippet should exit 0; got status=${result.status}\nstderr:\n${result.stderr}\nstdout:\n${result.stdout}`,
+    );
+
+    const got = normalizeRunTimings(result.stdout.trim());
+    const want = normalizeRunTimings(expectedOutput.trim());
+    assert.equal(
+      got,
+      want,
+      `tutorial documented output drifted from actual run.\n--- got ---\n${got}\n--- want ---\n${want}`,
+    );
+
+    // The artifacts the tutorial points at must exist on disk after a run.
+    const runRoot = join(tmp, ".jaiph", "runs");
+    assert.ok(existsSync(runRoot), ".jaiph/runs/ must exist after a successful run");
+  } finally {
+    rmSync(tmp, { recursive: true, force: true });
+  }
+});
diff --git a/integration/sample-build/build.test.ts b/integration/sample-build/build.test.ts
index 6964f256..e5121aab 100644
--- a/integration/sample-build/build.test.ts
+++ b/integration/sample-build/build.test.ts
@@ -3,8 +3,7 @@ import assert from "node:assert/strict";
 import { existsSync, mkdirSync, mkdtempSync, readFileSync, readdirSync, rmSync, writeFileSync } from "node:fs";
 import { tmpdir } from "node:os";
 import { join } from "node:path";
-import { buildScripts, resolveImportPath } from "../../src/transpiler";
-import { parsejaiph } from "../../src/parser";
+import { buildScripts } from "../../src/transpiler";
 
 import "./helpers";
 
@@ -87,29 +86,6 @@ test("build fails on missing import file", () => {
   }
 });
 
-// Regression: .jaiph/main.jh once imported implement_from_queue.jh which had been
-// renamed to engineer.jh, causing E_IMPORT_NOT_FOUND for every `jaiph test` run
-// in the workspace. `jaiph test` now builds from the test file entrypoint only;
-// this still checks main.jh imports and that the whole `.jaiph` graph builds.
-test(".jaiph/main.jh imports only existing modules", () => {
-  const jaiphDir = join(process.cwd(), ".jaiph");
-  const mainJh = join(jaiphDir, "main.jh");
-  assert.ok(existsSync(mainJh), ".jaiph/main.jh should exist");
-
-  const ast = parsejaiph(readFileSync(mainJh, "utf8"), mainJh);
-  for (const imp of ast.imports) {
-    const resolved = resolveImportPath(mainJh, imp.path, process.cwd());
-    assert.ok(existsSync(resolved), `import "${imp.alias}" resolves to missing file "${resolved}"`);
-  }
-
-  const outDir = join(jaiphDir, ".tmp-build-out");
-  try {
-    assert.doesNotThrow(() => buildScripts(jaiphDir, outDir, process.cwd()));
-  } finally {
-    rmSync(outDir, { recursive: true, force: true });
-  }
-});
-
 test("build rejects command substitution in prompt text", () => {
   const rootSubshell = mkdtempSync(join(tmpdir(), "jaiph-build-prompt-subshell-"));
   try {
diff --git a/integration/sample-build/cli-tree.test.ts b/integration/sample-build/cli-tree.test.ts
index bafc96df..e4ced24f 100644
--- a/integration/sample-build/cli-tree.test.ts
+++ b/integration/sample-build/cli-tree.test.ts
@@ -36,7 +36,7 @@ test("jaiph init creates workspace structure and guidance", () => {
     assert.doesNotMatch(bootstrap, /\$1/);
     assert.equal(statSync(join(root, ".jaiph/bootstrap.jh")).mode & 0o777, 0o755);
     const localSkill = readFileSync(join(root, ".jaiph/SKILL.md"), "utf8");
-    assert.match(localSkill, /Jaiph Bootstrap Skill/);
+    assert.match(localSkill, /Jaiph Skill \(for Agents\)/);
     assert.equal(existsSync(join(root, ".gitignore")), false);
     assert.equal(readFileSync(join(root, ".jaiph", ".gitignore"), "utf8"), "runs\ntmp\n");
     assert.match(initResult.stdout, /Jaiph init/);
@@ -172,7 +172,7 @@ test("jaiph run tree shows workflow params inline when run has key=value args",
       [
         'import "sub.jh" as sub',
         "workflow default() {",
-        '  run sub.default(path="docs/cli.md" mode="strict")',
+        '  run sub.default(path="docs/cli.md", mode="strict")',
         "}",
         "",
       ].join("\n"),
diff --git a/integration/sample-build/recover-handle.test.ts b/integration/sample-build/recover-handle.test.ts
index 32d7e557..2f5e2e72 100644
--- a/integration/sample-build/recover-handle.test.ts
+++ b/integration/sample-build/recover-handle.test.ts
@@ -113,6 +113,105 @@ test("recover: retry limit exhaustion fails the workflow", () => {
   }
 });
 
+test("recover: workflow-level run.recover_limit overrides module-level", () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-recover-workflow-cfg-"));
+  try {
+    writeFileSync(join(root, ".counter"), "0");
+    writeFileSync(
+      join(root, "main.jh"),
+      [
+        "config {",
+        "  run.recover_limit = 50",
+        "}",
+        "",
+        "script bump_and_fail = ```",
+        "count=$(cat .counter)",
+        "echo $(( count + 1 )) > .counter",
+        "exit 1",
+        "```",
+        "workflow failing() {",
+        "  run bump_and_fail()",
+        "}",
+        "workflow default() {",
+        "  config {",
+        "    run.recover_limit = 2",
+        "  }",
+        '  run failing() recover(err) {',
+        '    log "repair attempt"',
+        '  }',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const cliPath = join(process.cwd(), "dist/src/cli.js");
+    const r = spawnSync("node", [cliPath, "run", join(root, "main.jh")], {
+      encoding: "utf8",
+      cwd: root,
+      env: { ...process.env, JAIPH_DOCKER_ENABLED: "false" },
+    });
+    assert.notEqual(r.status, 0, "should fail after retry limit exhausted");
+    const combined = r.stdout + r.stderr;
+    assert.match(combined, /FAIL/);
+    const counter = require("node:fs").readFileSync(join(root, ".counter"), "utf8").trim();
+    // limit=2 means 1 initial attempt + 2 retries = 3 invocations of the failing script.
+    assert.equal(counter, "3", `expected 3 attempts, got ${counter}`);
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("recover: sibling workflow without own config uses module-level run.recover_limit", () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-recover-sibling-cfg-"));
+  try {
+    writeFileSync(join(root, ".counter"), "0");
+    writeFileSync(
+      join(root, "main.jh"),
+      [
+        "config {",
+        "  run.recover_limit = 2",
+        "}",
+        "",
+        "script bump_and_fail = ```",
+        "count=$(cat .counter)",
+        "echo $(( count + 1 )) > .counter",
+        "exit 1",
+        "```",
+        "workflow failing() {",
+        "  run bump_and_fail()",
+        "}",
+        "workflow other_default() {",
+        "  config {",
+        "    run.recover_limit = 50",
+        "  }",
+        '  run failing() recover(err) {',
+        '    log "ignored"',
+        '  }',
+        "}",
+        "workflow default() {",
+        '  run failing() recover(err) {',
+        '    log "repair attempt"',
+        '  }',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const cliPath = join(process.cwd(), "dist/src/cli.js");
+    const r = spawnSync("node", [cliPath, "run", join(root, "main.jh")], {
+      encoding: "utf8",
+      cwd: root,
+      env: { ...process.env, JAIPH_DOCKER_ENABLED: "false" },
+    });
+    assert.notEqual(r.status, 0, "should fail after retry limit exhausted");
+    const combined = r.stdout + r.stderr;
+    assert.match(combined, /FAIL/);
+    const counter = require("node:fs").readFileSync(join(root, ".counter"), "utf8").trim();
+    // Module-level limit=2 → 1 initial + 2 retries = 3 attempts in `default` (no own config).
+    assert.equal(counter, "3", `expected 3 attempts, got ${counter}`);
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
 test("recover: retry limit configurable via config", () => {
   const root = mkdtempSync(join(tmpdir(), "jaiph-recover-limit-"));
   try {
diff --git a/integration/sample-build/run-prompt-agent.test.ts b/integration/sample-build/run-prompt-agent.test.ts
index 6299ed56..e2c61fad 100644
--- a/integration/sample-build/run-prompt-agent.test.ts
+++ b/integration/sample-build/run-prompt-agent.test.ts
@@ -305,6 +305,10 @@ test("jaiph run agent.backend = claude without claude in PATH fails with clear e
       ...process.env,
       JAIPH_DOCKER_ENABLED: "false",
       PATH: `${nodeOnlyBin}:/nonexistent`,
+      // Disable prompt-retry backoff for this single-attempt failure assertion;
+      // otherwise the default schedule (15s → 1m → 10m → 30m → 2h) would
+      // re-run the missing-claude pre-flight five more times.
+      JAIPH_PROMPT_RETRY: "0",
     };
     delete runEnv.JAIPH_AGENT_BACKEND;
     const runResult = spawnSync("node", [cliPath, "run", filePath], {
diff --git a/integration/subcommand-help.test.ts b/integration/subcommand-help.test.ts
new file mode 100644
index 00000000..0c65353e
--- /dev/null
+++ b/integration/subcommand-help.test.ts
@@ -0,0 +1,40 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { spawnSync } from "node:child_process";
+import { join } from "node:path";
+
+const CLI_PATH = join(process.cwd(), "dist/src/cli.js");
+
+const SUBCOMMANDS = ["run", "test", "compile", "format", "init", "install", "use"];
+
+for (const cmd of SUBCOMMANDS) {
+  for (const helpFlag of ["--help", "-h"]) {
+    test(`jaiph ${cmd} ${helpFlag} prints usage to stdout and exits 0`, () => {
+      const result = spawnSync("node", [CLI_PATH, cmd, helpFlag], {
+        encoding: "utf8",
+        stdio: ["ignore", "pipe", "pipe"],
+      });
+      assert.equal(result.status, 0, `expected exit 0, got ${result.status}\nstderr: ${result.stderr}`);
+      assert.ok(
+        result.stdout.includes("Usage"),
+        `stdout should contain "Usage": ${JSON.stringify(result.stdout)}`,
+      );
+      assert.ok(
+        result.stdout.includes(cmd),
+        `stdout should contain subcommand "${cmd}": ${JSON.stringify(result.stdout)}`,
+      );
+    });
+  }
+}
+
+test("jaiph run --help does not attempt to resolve --help as a file", () => {
+  const result = spawnSync("node", [CLI_PATH, "run", "--help"], {
+    encoding: "utf8",
+    stdio: ["ignore", "pipe", "pipe"],
+  });
+  assert.equal(result.status, 0);
+  // Filename resolution would emit ENOENT / "no such file" via the thrown error path.
+  assert.ok(!result.stderr.includes("ENOENT"));
+  assert.ok(!result.stderr.includes("no such file"));
+  assert.ok(!result.stderr.includes("requires a .jh file"));
+});
diff --git a/package-lock.json b/package-lock.json
index 393fb652..69476611 100644
--- a/package-lock.json
+++ b/package-lock.json
@@ -1,12 +1,12 @@
 {
   "name": "jaiph",
-  "version": "0.9.4",
+  "version": "0.10.0",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "jaiph",
-      "version": "0.9.4",
+      "version": "0.10.0",
       "bin": {
         "jaiph": "dist/src/cli.js"
       },
diff --git a/package.json b/package.json
index bd08315e..e538a991 100644
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
   "name": "jaiph",
-  "version": "0.9.4",
+  "version": "0.10.0",
   "description": "jaiph compiler/transpiler",
   "repository": {
     "type": "git",
@@ -16,11 +16,14 @@
   },
   "scripts": {
     "clean": "rm -rf dist",
-    "build": "tsc -p tsconfig.json && node -e \"require('node:fs').cpSync('src/runtime','dist/src/runtime',{recursive:true})\" && node -e \"require('node:fs').cpSync('runtime/overlay-run.sh','dist/src/runtime/overlay-run.sh')\"",
+    "prepare": "node tools/embed-assets.js",
+    "embed-assets": "node tools/embed-assets.js",
+    "build": "npm run embed-assets && tsc -p tsconfig.json && node -e \"require('node:fs').cpSync('src/runtime','dist/src/runtime',{recursive:true})\" && node -e \"require('node:fs').cpSync('runtime/overlay-run.sh','dist/src/runtime/overlay-run.sh')\"",
     "build:standalone": "npm run build && node -e \"const fs=require('node:fs'); fs.cpSync('dist/src/runtime','dist/runtime',{recursive:true});\" && bun build --compile ./src/cli.ts --outfile ./dist/jaiph",
+    "registry:build": "npm run build && node scripts/build-registry.mjs",
     "test:compiler": "npm run build && node --test dist/test-infra/compiler-test-runner.js",
     "test:golden-ast": "npm run build && node --test dist/test-infra/golden-ast-runner.js",
-    "test": "npm run clean && npm run build && JAIPH_UNSAFE=true NODE_OPTIONS='--max-old-space-size=32768 --enable-source-maps' node --test $(find dist/integration -name '*.test.js') $(find dist/src -name '*.test.js' -o -name '*.acceptance.test.js') dist/test-infra/compiler-test-runner.js dist/test-infra/golden-ast-runner.js",
+    "test": "npm run clean && npm run build && JAIPH_UNSAFE=true NODE_OPTIONS='--max-old-space-size=32768 --enable-source-maps' node --test $(find dist/integration -name '*.test.js') $(find dist/src -name '*.test.js' -o -name '*.acceptance.test.js') scripts/build-registry.test.mjs dist/test-infra/compiler-test-runner.js dist/test-infra/golden-ast-runner.js",
     "test:acceptance:compiler": "npm run build && node --test $(find dist/src -name '*.acceptance.test.js')",
     "test:acceptance:runtime": "bash ./e2e/test_all.sh",
     "test:acceptance": "npm run test:acceptance:compiler && npm run test:acceptance:runtime",
diff --git a/scripts/build-registry.mjs b/scripts/build-registry.mjs
new file mode 100644
index 00000000..8c0b4140
--- /dev/null
+++ b/scripts/build-registry.mjs
@@ -0,0 +1,96 @@
+#!/usr/bin/env node
+// Regenerates docs/registry from the upstream jaiphlang/registry index.
+//
+// Usage: node scripts/build-registry.mjs [source]
+//   source defaults to JAIPH_REGISTRY_SOURCE if set, otherwise the upstream
+//   raw URL; argv wins over env.
+//
+// The fetched document is written to a sibling tmp file, validated through
+// the built loadRegistryIndex (imported from dist/ — run `npm run build`
+// first), then renamed onto docs/registry. On any failure (unreachable
+// source, invalid JSON, schema mismatch) the script exits non-zero and
+// leaves docs/registry untouched.
+//
+// Importable: scripts/build-registry.test.mjs imports `buildRegistry` to
+// exercise the contract against local fixtures without spawning a process.
+
+import { readFileSync, renameSync, unlinkSync, writeFileSync } from "node:fs";
+import { fileURLToPath } from "node:url";
+import { dirname, resolve } from "node:path";
+import { createRequire } from "node:module";
+
+const here = dirname(fileURLToPath(import.meta.url));
+const ROOT = resolve(here, "..");
+const OUT_PATH = resolve(ROOT, "docs/registry");
+const DEFAULT_SOURCE = "https://raw.githubusercontent.com/jaiphlang/registry/main/registry.json";
+
+function resolveSource(argv, env) {
+  if (argv.length > 0) return argv[0];
+  if (env.JAIPH_REGISTRY_SOURCE && env.JAIPH_REGISTRY_SOURCE.length > 0) {
+    return env.JAIPH_REGISTRY_SOURCE;
+  }
+  return DEFAULT_SOURCE;
+}
+
+async function readSource(source) {
+  if (source.startsWith("file://")) {
+    return readFileSync(fileURLToPath(source), "utf8");
+  }
+  if (!source.includes("://")) {
+    return readFileSync(source, "utf8");
+  }
+  const res = await fetch(source);
+  if (!res.ok) {
+    throw new Error(`failed to fetch ${source}: HTTP ${res.status}`);
+  }
+  return await res.text();
+}
+
+/**
+ * Fetch `source`, validate via `loadRegistryIndex`, write to `outPath`.
+ * On any failure throws without touching `outPath`.
+ */
+export async function buildRegistry({ source, outPath, loadRegistryIndex }) {
+  const text = await readSource(source);
+  const tmpPath = `${outPath}.tmp-build-${process.pid}-${Date.now()}`;
+  writeFileSync(tmpPath, text);
+  try {
+    await loadRegistryIndex(tmpPath);
+    renameSync(tmpPath, outPath);
+  } catch (err) {
+    try { unlinkSync(tmpPath); } catch {}
+    // Strip the internal tmp path from the validator's message so the user sees
+    // the source they actually passed in.
+    const msg = (err && err.message ? err.message : String(err)).split(tmpPath).join(source);
+    const wrapped = new Error(msg);
+    if (err && err.stack) wrapped.stack = err.stack;
+    throw wrapped;
+  }
+  return { source, outPath, bytes: Buffer.byteLength(text) };
+}
+
+async function main() {
+  const source = resolveSource(process.argv.slice(2), process.env);
+  const require = createRequire(import.meta.url);
+  const distPath = resolve(ROOT, "dist/src/cli/commands/registry.js");
+  let loadRegistryIndex;
+  try {
+    ({ loadRegistryIndex } = require(distPath));
+  } catch (err) {
+    process.stderr.write(
+      `build-registry: cannot load ${distPath} — run \`npm run build\` first (${err.message})\n`,
+    );
+    process.exit(1);
+  }
+  try {
+    const result = await buildRegistry({ source, outPath: OUT_PATH, loadRegistryIndex });
+    process.stdout.write(`wrote ${result.outPath} (${result.bytes} bytes) from ${result.source}\n`);
+  } catch (err) {
+    process.stderr.write(`build-registry: ${err.message}\n`);
+    process.exit(1);
+  }
+}
+
+if (import.meta.url === `file://${process.argv[1]}`) {
+  await main();
+}
diff --git a/scripts/build-registry.test.mjs b/scripts/build-registry.test.mjs
new file mode 100644
index 00000000..f01037a7
--- /dev/null
+++ b/scripts/build-registry.test.mjs
@@ -0,0 +1,90 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { mkdtempSync, readdirSync, readFileSync, rmSync, writeFileSync } from "node:fs";
+import { join } from "node:path";
+import { tmpdir } from "node:os";
+import { buildRegistry } from "./build-registry.mjs";
+import { loadRegistryIndex } from "../dist/src/cli/commands/registry.js";
+
+async function withTmp(body) {
+  const dir = mkdtempSync(join(tmpdir(), "build-registry-"));
+  try {
+    return await body(dir);
+  } finally {
+    rmSync(dir, { recursive: true, force: true });
+  }
+}
+
+test("build-registry: valid local source produces byte-identical docs/registry", async () => {
+  await withTmp(async (dir) => {
+    const srcText = JSON.stringify({
+      libs: {
+        mylib: { url: "https://example.com/mylib.git", description: "demo" },
+      },
+    }, null, 2) + "\n";
+    const srcPath = join(dir, "registry.json");
+    writeFileSync(srcPath, srcText);
+    const outPath = join(dir, "registry");
+    await buildRegistry({ source: srcPath, outPath, loadRegistryIndex });
+    assert.equal(readFileSync(outPath, "utf8"), srcText, "output must be byte-identical to source");
+  });
+});
+
+test("build-registry: invalid JSON rejects and leaves previous output untouched", async () => {
+  await withTmp(async (dir) => {
+    const outPath = join(dir, "registry");
+    const previousText = '{"libs":{"prev":{"url":"https://example.com/prev.git","description":"prev"}}}\n';
+    writeFileSync(outPath, previousText);
+    const srcPath = join(dir, "registry.json");
+    writeFileSync(srcPath, "{ not valid json");
+    await assert.rejects(
+      () => buildRegistry({ source: srcPath, outPath, loadRegistryIndex }),
+      /failed to parse registry/,
+    );
+    assert.equal(readFileSync(outPath, "utf8"), previousText, "previous output must be untouched");
+  });
+});
+
+test("build-registry: schema mismatch leaves previous output untouched", async () => {
+  await withTmp(async (dir) => {
+    const outPath = join(dir, "registry");
+    const previousText = '{"libs":{"prev":{"url":"https://example.com/prev.git","description":"prev"}}}\n';
+    writeFileSync(outPath, previousText);
+    const srcPath = join(dir, "registry.json");
+    // Valid JSON but wrong shape — missing required `description` on the entry.
+    writeFileSync(srcPath, JSON.stringify({ libs: { bad: { url: "https://example.com/x.git" } } }));
+    await assert.rejects(
+      () => buildRegistry({ source: srcPath, outPath, loadRegistryIndex }),
+      /missing string "description"/,
+    );
+    assert.equal(readFileSync(outPath, "utf8"), previousText, "previous output must be untouched");
+  });
+});
+
+test("build-registry: missing source rejects and leaves previous output untouched", async () => {
+  await withTmp(async (dir) => {
+    const outPath = join(dir, "registry");
+    const previousText = '{"libs":{"prev":{"url":"https://example.com/prev.git","description":"prev"}}}\n';
+    writeFileSync(outPath, previousText);
+    const missingSrc = join(dir, "does-not-exist.json");
+    await assert.rejects(
+      () => buildRegistry({ source: missingSrc, outPath, loadRegistryIndex }),
+      /ENOENT|no such file/,
+    );
+    assert.equal(readFileSync(outPath, "utf8"), previousText, "previous output must be untouched");
+  });
+});
+
+test("build-registry: no tmp residue alongside outPath on failure", async () => {
+  await withTmp(async (dir) => {
+    const outPath = join(dir, "registry");
+    const previousText = "previous\n";
+    writeFileSync(outPath, previousText);
+    const srcPath = join(dir, "registry.json");
+    writeFileSync(srcPath, "{ broken");
+    await assert.rejects(() => buildRegistry({ source: srcPath, outPath, loadRegistryIndex }));
+    const stale = readdirSync(dir).filter((n) => n.startsWith("registry.tmp-build-"));
+    assert.deepEqual(stale, [], `stale tmp files left behind: ${stale.join(", ")}`);
+    assert.equal(readFileSync(outPath, "utf8"), previousText);
+  });
+});
diff --git a/src/cli/commands/compile.ts b/src/cli/commands/compile.ts
index a375bfaa..b45f055d 100644
--- a/src/cli/commands/compile.ts
+++ b/src/cli/commands/compile.ts
@@ -1,11 +1,13 @@
-import { existsSync, readFileSync, statSync } from "node:fs";
+import { existsSync, statSync } from "node:fs";
 import { dirname, resolve } from "node:path";
-import { parsejaiph } from "../../parser";
-import { validateReferences } from "../../transpile/validate";
-import { resolveImportPath } from "../../transpile/resolve";
-import { collectTransitiveJhModules, walkjhFiles } from "../../transpile/build";
+import { loadModuleGraph } from "../../transpile/module-graph";
+import { collectDiagnostics } from "../../transpile/validate";
+import { walkjhFiles } from "../../transpile/build";
 import { detectWorkspaceRoot } from "../shared/paths";
-import type { ValidateContext } from "../../transpile/validate";
+import {
+  diagnosticFromThrown as parseThrownDiagnostic,
+  type JaiphDiagnostic,
+} from "../../diagnostics";
 
 export interface CompileDiagnostic {
   file: string;
@@ -17,38 +19,38 @@ export interface CompileDiagnostic {
 
 /** Parse `path:line:col CODE message` from {@link jaiphError} and similar throws. */
 export function diagnosticFromThrown(err: unknown): CompileDiagnostic | null {
-  if (!(err instanceof Error)) return null;
-  const m = err.message.match(/^(.+):(\d+):(\d+) (\S+) (.+)$/s);
-  if (!m) return null;
-  return {
-    file: m[1],
-    line: Number(m[2]),
-    col: Number(m[3]),
-    code: m[4],
-    message: m[5].trimEnd(),
-  };
+  const d = parseThrownDiagnostic(err);
+  return d ? { file: d.file, line: d.line, col: d.col, code: d.code, message: d.message } : null;
 }
 
-function makeValidateContext(workspaceRoot?: string): ValidateContext {
-  return {
-    resolveImportPath,
-    existsSync,
-    readFile: (path: string) => readFileSync(path, "utf8"),
-    parse: parsejaiph,
-    workspaceRoot,
-  };
+function toCompileDiagnostic(d: JaiphDiagnostic): CompileDiagnostic {
+  return { file: d.file, line: d.line, col: d.col, code: d.code, message: d.message };
 }
 
-function printUsage(): void {
-  process.stderr.write(
-    "Usage: jaiph compile [--json] [--workspace <dir>] <file.jh | directory> ...\n\n" +
-      "Parse import closures and run validateReferences only (same compile-time checks as before jaiph run).\n" +
-      "Does not emit scripts/, does not run buildRuntimeGraph, does not spawn the workflow runner.\n" +
-      "With a directory, all non-test *.jh files are used as entrypoints; each file's import closure is validated.\n" +
-      "Pass *.test.jh explicitly to validate a test module.\n\n" +
-      "  --json       Print one JSON array of diagnostics to stdout (empty on success).\n" +
-      "  --workspace  Override workspace root for import resolution for all paths.\n",
-  );
+const COMPILE_USAGE =
+  "Usage: jaiph compile [--json] [--workspace <dir>] <file.jh | directory> ...\n\n" +
+  "Parse import closures and run validateReferences only (same compile-time checks as before jaiph run).\n" +
+  "Does not emit scripts/, does not run buildRuntimeGraph, does not spawn the workflow runner.\n" +
+  "With a directory, all non-test *.jh files are used as entrypoints; each file's import closure is validated.\n" +
+  "Pass *.test.jh explicitly to validate a test module.\n\n" +
+  "  --json             print one JSON array of diagnostics to stdout (empty on success)\n" +
+  "  --workspace <dir>  workspace root for import resolution (default: auto-detect per file)\n" +
+  "  -h, --help         show this help\n\n" +
+  "Example:\n" +
+  "  jaiph compile flow.jh\n";
+
+function printUsageError(): void {
+  process.stderr.write(COMPILE_USAGE);
+}
+
+function writeDiagnostics(json: boolean, diags: CompileDiagnostic[]): void {
+  if (json) {
+    process.stdout.write(JSON.stringify(diags) + "\n");
+    return;
+  }
+  for (const d of diags) {
+    process.stderr.write(`${d.file}:${d.line}:${d.col} ${d.code} ${d.message}\n`);
+  }
 }
 
 export function runCompile(args: string[]): number {
@@ -64,7 +66,7 @@ export function runCompile(args: string[]): number {
     if (args[i] === "--workspace") {
       const w = args[i + 1];
       if (!w) {
-        printUsage();
+        printUsageError();
         return 1;
       }
       workspaceFlag = resolve(w);
@@ -72,18 +74,18 @@ export function runCompile(args: string[]): number {
       continue;
     }
     if (args[i] === "--help" || args[i] === "-h") {
-      printUsage();
+      process.stdout.write(COMPILE_USAGE);
       return 0;
     }
     paths.push(args[i]);
   }
 
   if (paths.length === 0) {
-    printUsage();
+    printUsageError();
     return 1;
   }
 
-  const filesToValidate = new Set<string>();
+  const entries: Array<{ file: string; workspaceRoot: string }> = [];
 
   try {
     for (const p of paths) {
@@ -97,15 +99,11 @@ export function runCompile(args: string[]): number {
           throw new Error(`compile expects .jh files: ${p}`);
         }
         const wr = workspaceFlag ?? detectWorkspaceRoot(dirname(abs));
-        for (const f of collectTransitiveJhModules(abs, wr)) {
-          filesToValidate.add(f);
-        }
+        entries.push({ file: abs, workspaceRoot: wr });
       } else if (st.isDirectory()) {
         const wr = workspaceFlag ?? detectWorkspaceRoot(abs);
         for (const entry of walkjhFiles(abs)) {
-          for (const f of collectTransitiveJhModules(entry, wr)) {
-            filesToValidate.add(f);
-          }
+          entries.push({ file: entry, workspaceRoot: wr });
         }
       } else {
         throw new Error(`not a file or directory: ${p}`);
@@ -113,52 +111,47 @@ export function runCompile(args: string[]): number {
     }
   } catch (err) {
     const d = diagnosticFromThrown(err);
-    if (json) {
-      const fallback: CompileDiagnostic = {
-        file: "",
-        line: 1,
-        col: 1,
-        code: "E_COMPILE",
-        message: err instanceof Error ? err.message : String(err),
-      };
-      process.stdout.write(JSON.stringify(d ? [d] : [fallback]) + "\n");
-    } else {
-      process.stderr.write((err instanceof Error ? err.message : String(err)) + "\n");
-    }
+    const fallback: CompileDiagnostic = {
+      file: "",
+      line: 1,
+      col: 1,
+      code: "E_COMPILE",
+      message: err instanceof Error ? err.message : String(err),
+    };
+    writeDiagnostics(json, [d ?? fallback]);
     return 1;
   }
 
-  const sorted = [...filesToValidate].sort();
+  const collected: CompileDiagnostic[] = [];
   const seen = new Set<string>();
-
-  for (const file of sorted) {
+  for (const { file, workspaceRoot } of entries) {
     if (seen.has(file)) continue;
     seen.add(file);
-    const wr = workspaceFlag ?? detectWorkspaceRoot(dirname(file));
-    const ctx = makeValidateContext(wr);
     try {
-      const ast = parsejaiph(readFileSync(file, "utf8"), file);
-      validateReferences(ast, ctx);
+      const graph = loadModuleGraph(file, workspaceRoot);
+      const diag = collectDiagnostics(graph);
+      for (const d of diag.sorted()) collected.push(toCompileDiagnostic(d));
+      for (const reachable of graph.modules.keys()) seen.add(reachable);
     } catch (err) {
+      // Loader / parser errors are fatal (unrecoverable AST). Surface them
+      // as a single diagnostic; they do not flow through `Diagnostics`.
       const d = diagnosticFromThrown(err);
-      if (json) {
-        const fallback: CompileDiagnostic = {
+      collected.push(
+        d ?? {
           file,
           line: 1,
           col: 1,
           code: "E_COMPILE",
           message: err instanceof Error ? err.message : String(err),
-        };
-        process.stdout.write(JSON.stringify(d ? [d] : [fallback]) + "\n");
-      } else {
-        process.stderr.write((err instanceof Error ? err.message : String(err)) + "\n");
-      }
-      return 1;
+        },
+      );
     }
   }
 
-  if (json) {
-    process.stdout.write("[]\n");
+  if (collected.length === 0) {
+    if (json) process.stdout.write("[]\n");
+    return 0;
   }
-  return 0;
+  writeDiagnostics(json, collected);
+  return 1;
 }
diff --git a/src/cli/commands/format.ts b/src/cli/commands/format.ts
index 05162bef..07293c28 100644
--- a/src/cli/commands/format.ts
+++ b/src/cli/commands/format.ts
@@ -1,9 +1,23 @@
 import { readFileSync, writeFileSync } from "node:fs";
 import { resolve } from "node:path";
-import { parsejaiph } from "../../parser";
+import { parsejaiphWithTrivia } from "../../parser";
 import { emitModule } from "../../format/emit";
+import { hasHelpFlag } from "../shared/usage";
+
+const FORMAT_USAGE =
+  "Usage: jaiph format [--check] [--indent <n>] <file.jh ...>\n\n" +
+  "Rewrite .jh files into canonical style.\n\n" +
+  "  --check         exit non-zero when file(s) need formatting (no writes)\n" +
+  "  --indent <n>    spaces per indent level (default: 2)\n" +
+  "  -h, --help      show this help\n\n" +
+  "Example:\n" +
+  "  jaiph format flow.jh\n";
 
 export function runFormat(args: string[]): number {
+  if (hasHelpFlag(args)) {
+    process.stdout.write(FORMAT_USAGE);
+    return 0;
+  }
   let check = false;
   let indent = 2;
   const files: string[] = [];
@@ -52,16 +66,16 @@ export function runFormat(args: string[]): number {
     const firstLine = source.split(/\r?\n/, 1)[0];
     const shebang = firstLine.startsWith("#!") ? firstLine : null;
 
-    let mod;
+    let parsed;
     try {
-      mod = parsejaiph(source, abs);
+      parsed = parsejaiphWithTrivia(source, abs);
     } catch (err) {
       const msg = err instanceof Error ? err.message : String(err);
       process.stderr.write(`parse error: ${msg}\n`);
       return 1;
     }
 
-    let formatted = emitModule(mod, { indent });
+    let formatted = emitModule(parsed.ast, parsed.trivia, { indent });
     if (shebang) {
       formatted = shebang + "\n\n" + formatted;
     }
diff --git a/src/cli/commands/init.ts b/src/cli/commands/init.ts
index daaef957..6d0949df 100644
--- a/src/cli/commands/init.ts
+++ b/src/cli/commands/init.ts
@@ -1,7 +1,16 @@
 import { chmodSync, existsSync, mkdirSync, readFileSync, statSync, writeFileSync } from "node:fs";
 import { join, resolve } from "node:path";
 import { colorPalette } from "../shared/errors";
-import { resolveInstalledSkillPath } from "../shared/paths";
+import { loadInstalledSkillContent } from "../shared/paths";
+import { hasHelpFlag } from "../shared/usage";
+
+const INIT_USAGE =
+  "Usage: jaiph init [workspace-path]\n\n" +
+  "Initialize a Jaiph workspace under <workspace-path> (defaults to the current\n" +
+  "directory). Writes .jaiph/bootstrap.jh, .jaiph/.gitignore, and .jaiph/SKILL.md.\n\n" +
+  "  -h, --help      show this help\n\n" +
+  "Example:\n" +
+  "  jaiph init\n";
 
 const BOOTSTRAP_TEMPLATE = `#!/usr/bin/env jaiph
 
@@ -34,6 +43,10 @@ workflow default() {
 const JAIPH_DIR_GITIGNORE_TEMPLATE = "runs\ntmp\n";
 
 export function runInit(rest: string[]): number {
+  if (hasHelpFlag(rest)) {
+    process.stdout.write(INIT_USAGE);
+    return 0;
+  }
   const workspaceArg = rest[0] ?? ".";
   const workspaceRoot = resolve(workspaceArg);
   const stats = statSync(workspaceRoot);
@@ -82,12 +95,7 @@ export function runInit(rest: string[]): number {
   }
   chmodSync(bootstrapPath, 0o755);
 
-  const installedSkillPath = resolveInstalledSkillPath();
-  let wroteSkill = false;
-  if (installedSkillPath) {
-    writeFileSync(skillPath, readFileSync(installedSkillPath, "utf8"), "utf8");
-    wroteSkill = true;
-  }
+  writeFileSync(skillPath, loadInstalledSkillContent(), "utf8");
 
   process.stdout.write(`${palette.green}✓ Initialized ${join(".jaiph", "bootstrap.jh")}${palette.reset}\n`);
   if (createdGitignore) {
@@ -100,13 +108,7 @@ export function runInit(rest: string[]): number {
   if (!createdBootstrap) {
     process.stdout.write(`${palette.dim}▸ Note: bootstrap file already existed; left unchanged.${palette.reset}\n`);
   }
-  if (wroteSkill) {
-    process.stdout.write(`${palette.green}✓ Wrote ${join(".jaiph", "SKILL.md")} from installation${palette.reset}\n`);
-  } else {
-    process.stdout.write(
-      `${palette.dim}▸ Note: skill file not found in installation (${join(".jaiph", "SKILL.md")} not written). Set JAIPH_SKILL_PATH and run again.${palette.reset}\n`,
-    );
-  }
+  process.stdout.write(`${palette.green}✓ Wrote ${join(".jaiph", "SKILL.md")} from installation${palette.reset}\n`);
   process.stdout.write("\n");
   process.stdout.write("Try:\n");
   process.stdout.write("  ./.jaiph/bootstrap.jh\n");
diff --git a/src/cli/commands/install.test.ts b/src/cli/commands/install.test.ts
index ad4d1a20..cdcb042e 100644
--- a/src/cli/commands/install.test.ts
+++ b/src/cli/commands/install.test.ts
@@ -1,10 +1,51 @@
 import test from "node:test";
 import assert from "node:assert/strict";
-import { mkdirSync, writeFileSync, rmSync } from "node:fs";
+import { existsSync, mkdirSync, readFileSync, rmSync, writeFileSync } from "node:fs";
 import { join } from "node:path";
 import { execSync } from "node:child_process";
 import { tmpdir } from "node:os";
-import { parseUrlAndVersion } from "./install";
+import { parseUrlAndVersion, runInstall, type CloneRunner, type CloneOutcome, type InstallSpec } from "./install";
+
+/**
+ * Run a body with JAIPH_REGISTRY set to `value`. Restore the prior value
+ * (including absent) on exit. Wraps each registry-dependent test so they can
+ * share the global env without leaking between cases.
+ */
+async function withRegistry<T>(value: string, body: () => Promise<T>): Promise<T> {
+  const prev = process.env.JAIPH_REGISTRY;
+  process.env.JAIPH_REGISTRY = value;
+  try {
+    return await body();
+  } finally {
+    if (prev === undefined) {
+      delete process.env.JAIPH_REGISTRY;
+    } else {
+      process.env.JAIPH_REGISTRY = prev;
+    }
+  }
+}
+
+function writeRegistryFile(dir: string, libs: Record<string, { url: string; description: string }>): string {
+  const path = join(dir, "registry.json");
+  writeFileSync(path, JSON.stringify({ libs }), "utf8");
+  return path;
+}
+
+/** Capture process.stderr writes during `body`. Restores the prior writer on exit. */
+async function captureStderr<T>(body: () => Promise<T>): Promise<{ result: T; stderr: string }> {
+  const chunks: string[] = [];
+  const orig = process.stderr.write;
+  process.stderr.write = ((chunk: string | Uint8Array) => {
+    chunks.push(String(chunk));
+    return true;
+  }) as typeof process.stderr.write;
+  try {
+    const result = await body();
+    return { result, stderr: chunks.join("") };
+  } finally {
+    process.stderr.write = orig;
+  }
+}
 
 const CLI_PATH = join(__dirname, "../../../src/cli.js");
 
@@ -83,3 +124,504 @@ test("install: missing lockfile shows no libs message", () => {
     cleanup(dir);
   }
 });
+
+test("install: missing libraries clone concurrently", async () => {
+  const dir = makeTempProject();
+  try {
+    let active = 0;
+    let maxActive = 0;
+    const cloneRunner: CloneRunner = async (spec: InstallSpec): Promise<CloneOutcome> => {
+      active += 1;
+      maxActive = Math.max(maxActive, active);
+      // Mimic git clone side effect so the lib directory is materialized.
+      // Post-clone hygiene requires at least one .jh file in the tree.
+      mkdirSync(spec.libDir, { recursive: true });
+      writeFileSync(join(spec.libDir, "lib.jh"), "", "utf8");
+      await new Promise((resolve) => setTimeout(resolve, 30));
+      active -= 1;
+      return { spec, ok: true };
+    };
+
+    const code = await runInstall(
+      [
+        "https://example.com/alpha.git",
+        "https://example.com/beta.git",
+        "https://example.com/gamma.git",
+      ],
+      { cwd: dir, cloneRunner, concurrency: 4 },
+    );
+
+    assert.equal(code, 0);
+    assert.ok(maxActive >= 2, `expected overlapping clones; observed peak ${maxActive}`);
+
+    const lock = JSON.parse(readFileSync(join(dir, ".jaiph", "libs.lock"), "utf8")) as {
+      libs: { name: string }[];
+    };
+    assert.deepEqual(
+      lock.libs.map((e) => e.name).sort(),
+      ["alpha", "beta", "gamma"],
+      "all three should land in the lockfile",
+    );
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: explicit warm path skips existing directories without invoking git", async () => {
+  const dir = makeTempProject();
+  try {
+    const libDir = join(dir, ".jaiph", "libs", "alpha");
+    mkdirSync(libDir, { recursive: true });
+    writeFileSync(join(libDir, "sentinel"), "warm\n", "utf8");
+
+    let callCount = 0;
+    const cloneRunner: CloneRunner = async (spec) => {
+      callCount += 1;
+      return { spec, ok: true };
+    };
+
+    const code = await runInstall(["https://example.com/alpha.git"], { cwd: dir, cloneRunner });
+
+    assert.equal(code, 0);
+    assert.equal(callCount, 0, "cloneRunner must not be called when target dir exists and --force is absent");
+    assert.equal(readFileSync(join(libDir, "sentinel"), "utf8"), "warm\n");
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: restore-from-lock warm path skips existing directories without invoking git", async () => {
+  const dir = makeTempProject();
+  try {
+    const lockPath = join(dir, ".jaiph", "libs.lock");
+    mkdirSync(join(dir, ".jaiph"), { recursive: true });
+    writeFileSync(
+      lockPath,
+      JSON.stringify({
+        libs: [
+          { name: "alpha", url: "https://example.com/alpha.git" },
+          { name: "beta", url: "https://example.com/beta.git" },
+        ],
+      }) + "\n",
+      "utf8",
+    );
+    const alphaDir = join(dir, ".jaiph", "libs", "alpha");
+    const betaDir = join(dir, ".jaiph", "libs", "beta");
+    mkdirSync(alphaDir, { recursive: true });
+    mkdirSync(betaDir, { recursive: true });
+    writeFileSync(join(alphaDir, "sentinel"), "alpha-warm\n", "utf8");
+    writeFileSync(join(betaDir, "sentinel"), "beta-warm\n", "utf8");
+
+    let callCount = 0;
+    const cloneRunner: CloneRunner = async (spec) => {
+      callCount += 1;
+      return { spec, ok: true };
+    };
+
+    const code = await runInstall([], { cwd: dir, cloneRunner });
+
+    assert.equal(code, 0);
+    assert.equal(callCount, 0, "cloneRunner must not be called for restore-from-lock warm path");
+    // restore-from-lock with no args must not invent new lock entries; pre-existing two stay.
+    const lock = JSON.parse(readFileSync(lockPath, "utf8")) as { libs: { name: string }[] };
+    assert.deepEqual(lock.libs.map((e) => e.name).sort(), ["alpha", "beta"]);
+    assert.equal(readFileSync(join(alphaDir, "sentinel"), "utf8"), "alpha-warm\n");
+    assert.equal(readFileSync(join(betaDir, "sentinel"), "utf8"), "beta-warm\n");
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: invalid remote/path failure exits non-zero and does not lock the failed lib", async () => {
+  const dir = makeTempProject();
+  try {
+    const bogus = join(dir, "does-not-exist-bogus-remote");
+    const code = await runInstall([bogus], { cwd: dir });
+
+    assert.notEqual(code, 0, "invalid remote/path must exit non-zero");
+    const lockPath = join(dir, ".jaiph", "libs.lock");
+    assert.ok(existsSync(lockPath), "lockfile is written but should not contain failed entries");
+    const lock = JSON.parse(readFileSync(lockPath, "utf8")) as { libs: { name: string }[] };
+    assert.equal(lock.libs.length, 0, "failed clone must not produce a lock entry");
+    assert.ok(
+      !existsSync(join(dir, ".jaiph", "libs", "does-not-exist-bogus-remote")),
+      "no lib directory should remain after a failed clone",
+    );
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: unknown ref failure exits non-zero and does not lock the failed lib", async () => {
+  const dir = makeTempProject();
+  try {
+    // Create a local repo with one commit so clone-from-path is valid, but the ref is not.
+    const remoteDir = join(dir, "remote-repo");
+    mkdirSync(remoteDir, { recursive: true });
+    execSync("git init", { cwd: remoteDir, stdio: "pipe" });
+    writeFileSync(join(remoteDir, "README"), "hi\n", "utf8");
+    execSync("git add README", { cwd: remoteDir, stdio: "pipe" });
+    execSync(
+      `git -c user.email=test@example.com -c user.name=test commit -m init`,
+      { cwd: remoteDir, stdio: "pipe" },
+    );
+
+    const code = await runInstall([`${remoteDir}@nonexistent-ref-xyz`], { cwd: dir });
+
+    assert.notEqual(code, 0, "unknown ref must exit non-zero");
+    const lockPath = join(dir, ".jaiph", "libs.lock");
+    assert.ok(existsSync(lockPath));
+    const lock = JSON.parse(readFileSync(lockPath, "utf8")) as { libs: { name: string }[] };
+    assert.equal(lock.libs.length, 0, "unknown-ref clone must not produce a lock entry");
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: bare registry name installs into .jaiph/libs/<name>/ regardless of url last segment", async () => {
+  const dir = makeTempProject();
+  try {
+    const registryPath = writeRegistryFile(dir, {
+      mylib: { url: "https://example.com/some-other-repo-name.git", description: "demo" },
+    });
+
+    const seen: InstallSpec[] = [];
+    const cloneRunner: CloneRunner = async (spec) => {
+      seen.push(spec);
+      mkdirSync(spec.libDir, { recursive: true });
+      writeFileSync(join(spec.libDir, "lib.jh"), "", "utf8");
+      return { spec, ok: true };
+    };
+
+    const code = await withRegistry(registryPath, () =>
+      runInstall(["mylib"], { cwd: dir, cloneRunner }),
+    );
+
+    assert.equal(code, 0);
+    assert.equal(seen.length, 1);
+    assert.equal(seen[0]!.name, "mylib");
+    assert.equal(seen[0]!.url, "https://example.com/some-other-repo-name.git");
+    assert.equal(seen[0]!.libDir, join(dir, ".jaiph", "libs", "mylib"));
+
+    assert.ok(existsSync(join(dir, ".jaiph", "libs", "mylib")), "lib dir uses registry name, not url segment");
+    const lock = JSON.parse(readFileSync(join(dir, ".jaiph", "libs.lock"), "utf8")) as {
+      libs: { name: string; url: string }[];
+    };
+    assert.equal(lock.libs.length, 1);
+    assert.equal(lock.libs[0]!.name, "mylib");
+    assert.equal(lock.libs[0]!.url, "https://example.com/some-other-repo-name.git");
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: name@version forwards version to clone runner and records it in lock", async () => {
+  const dir = makeTempProject();
+  try {
+    const registryPath = writeRegistryFile(dir, {
+      mylib: { url: "https://example.com/mylib.git", description: "demo" },
+    });
+
+    let observed: InstallSpec | undefined;
+    const cloneRunner: CloneRunner = async (spec) => {
+      observed = spec;
+      mkdirSync(spec.libDir, { recursive: true });
+      writeFileSync(join(spec.libDir, "lib.jh"), "", "utf8");
+      return { spec, ok: true };
+    };
+
+    const code = await withRegistry(registryPath, () =>
+      runInstall(["mylib@v1.2"], { cwd: dir, cloneRunner }),
+    );
+
+    assert.equal(code, 0);
+    assert.equal(observed?.version, "v1.2");
+    const lock = JSON.parse(readFileSync(join(dir, ".jaiph", "libs.lock"), "utf8")) as {
+      libs: { name: string; version?: string }[];
+    };
+    assert.equal(lock.libs[0]!.version, "v1.2");
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: unknown registry name fails with actionable message naming the source", async () => {
+  const dir = makeTempProject();
+  try {
+    const registryPath = writeRegistryFile(dir, {
+      other: { url: "https://example.com/other.git", description: "demo" },
+    });
+
+    const { result: code, stderr } = await captureStderr(() =>
+      withRegistry(registryPath, () => runInstall(["missing"], { cwd: dir })),
+    );
+
+    assert.notEqual(code, 0);
+    assert.ok(
+      stderr.includes(`lib "missing" not found in registry ${registryPath}`),
+      `expected unknown-name error naming the source; got: ${stderr}`,
+    );
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: unreadable registry source fails with message naming source and cause", async () => {
+  const dir = makeTempProject();
+  try {
+    const missingPath = join(dir, "no-such-registry.json");
+
+    const { result: code, stderr } = await captureStderr(() =>
+      withRegistry(missingPath, () => runInstall(["mylib"], { cwd: dir })),
+    );
+
+    assert.notEqual(code, 0);
+    assert.ok(stderr.includes(missingPath), `expected error naming registry source; got: ${stderr}`);
+    assert.ok(stderr.includes("failed to read registry"), `expected read-failure message; got: ${stderr}`);
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: invalid registry JSON fails with message naming source and cause", async () => {
+  const dir = makeTempProject();
+  try {
+    const registryPath = join(dir, "registry.json");
+    writeFileSync(registryPath, "{ not valid json", "utf8");
+
+    const { result: code, stderr } = await captureStderr(() =>
+      withRegistry(registryPath, () => runInstall(["mylib"], { cwd: dir })),
+    );
+
+    assert.notEqual(code, 0);
+    assert.ok(stderr.includes(registryPath), `expected error naming registry source; got: ${stderr}`);
+    assert.ok(stderr.includes("failed to parse registry"), `expected parse-failure message; got: ${stderr}`);
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: restore-from-lock never reads the registry", async () => {
+  const dir = makeTempProject();
+  try {
+    const lockPath = join(dir, ".jaiph", "libs.lock");
+    mkdirSync(join(dir, ".jaiph"), { recursive: true });
+    writeFileSync(
+      lockPath,
+      JSON.stringify({
+        libs: [
+          { name: "alpha", url: "https://example.com/alpha.git" },
+          { name: "beta", url: "https://example.com/beta.git", version: "v2" },
+        ],
+      }) + "\n",
+      "utf8",
+    );
+
+    const seen: InstallSpec[] = [];
+    const cloneRunner: CloneRunner = async (spec) => {
+      seen.push(spec);
+      mkdirSync(spec.libDir, { recursive: true });
+      writeFileSync(join(spec.libDir, "lib.jh"), "", "utf8");
+      return { spec, ok: true };
+    };
+
+    // Point JAIPH_REGISTRY at a path that does not exist. If restore touched
+    // the registry, the load would fail. Restore must succeed regardless.
+    const bogusRegistry = join(dir, "nope-no-registry-here.json");
+    const code = await withRegistry(bogusRegistry, () =>
+      runInstall([], { cwd: dir, cloneRunner }),
+    );
+
+    assert.equal(code, 0, "restore-from-lock must succeed without contacting the registry");
+    assert.equal(seen.length, 2);
+    assert.deepEqual(
+      seen.map((s) => s.name).sort(),
+      ["alpha", "beta"],
+    );
+  } finally {
+    cleanup(dir);
+  }
+});
+
+/**
+ * Build a local git repo at <parent>/<name> usable as a clone source for
+ * tests. `withJh` controls whether the seed commit includes a `*.jh` file
+ * (set false to exercise the "not a jaiph library" path). `tag` optionally
+ * tags the seed commit so the test can `clone --branch <tag>`.
+ */
+function makeFixtureRepo(
+  parent: string,
+  name: string,
+  opts: { withJh?: boolean; tag?: string } = {},
+): string {
+  const repoDir = join(parent, name);
+  mkdirSync(repoDir, { recursive: true });
+  execSync("git init", { cwd: repoDir, stdio: "pipe" });
+  execSync("git config user.email test@example.com", { cwd: repoDir, stdio: "pipe" });
+  execSync("git config user.name test", { cwd: repoDir, stdio: "pipe" });
+  if (opts.withJh !== false) {
+    writeFileSync(join(repoDir, "main.jh"), "workflow default { log \"hi\" }\n", "utf8");
+  } else {
+    writeFileSync(join(repoDir, "README"), "no jh here\n", "utf8");
+  }
+  execSync("git add -A", { cwd: repoDir, stdio: "pipe" });
+  execSync("git commit -m init", { cwd: repoDir, stdio: "pipe" });
+  if (opts.tag) execSync(`git tag ${opts.tag}`, { cwd: repoDir, stdio: "pipe" });
+  return repoDir;
+}
+
+function gitHead(dir: string): string {
+  return execSync("git rev-parse HEAD", { cwd: dir, stdio: ["ignore", "pipe", "pipe"] })
+    .toString()
+    .trim();
+}
+
+test("install: strips .git after clone and records 40-char commit in lockfile", async () => {
+  const dir = makeTempProject();
+  try {
+    const remote = makeFixtureRepo(dir, "remote-alpha");
+    const expectedSha = gitHead(remote);
+
+    const code = await runInstall([remote], { cwd: dir });
+
+    assert.equal(code, 0, "install must succeed");
+    const libDir = join(dir, ".jaiph", "libs", "remote-alpha");
+    assert.ok(existsSync(libDir), "lib dir should exist");
+    assert.ok(
+      !existsSync(join(libDir, ".git")),
+      ".git directory must be removed from installed lib",
+    );
+
+    const lock = JSON.parse(
+      readFileSync(join(dir, ".jaiph", "libs.lock"), "utf8"),
+    ) as { libs: { name: string; commit?: string }[] };
+    assert.equal(lock.libs.length, 1);
+    assert.equal(lock.libs[0]!.name, "remote-alpha");
+    assert.match(
+      lock.libs[0]!.commit ?? "",
+      /^[0-9a-f]{40}$/,
+      "lock entry must record a 40-char commit",
+    );
+    assert.equal(lock.libs[0]!.commit, expectedSha);
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: restore detects moved tag and fails with both SHAs", async () => {
+  const dir = makeTempProject();
+  try {
+    const remote = makeFixtureRepo(dir, "remote-beta", { tag: "v1" });
+    const firstSha = gitHead(remote);
+
+    const firstCode = await runInstall([`${remote}@v1`], { cwd: dir });
+    assert.equal(firstCode, 0, "initial install must succeed");
+
+    const lockPath = join(dir, ".jaiph", "libs.lock");
+    const lockAfterFirst = JSON.parse(readFileSync(lockPath, "utf8")) as {
+      libs: { name: string; commit?: string; version?: string }[];
+    };
+    assert.equal(lockAfterFirst.libs[0]!.commit, firstSha);
+
+    // Move the tag to a new commit in the source repo.
+    writeFileSync(join(remote, "second.jh"), "workflow default { log \"two\" }\n", "utf8");
+    execSync("git add -A", { cwd: remote, stdio: "pipe" });
+    execSync("git commit -m second", { cwd: remote, stdio: "pipe" });
+    execSync("git tag -d v1", { cwd: remote, stdio: "pipe" });
+    execSync("git tag v1", { cwd: remote, stdio: "pipe" });
+    const secondSha = gitHead(remote);
+    assert.notEqual(firstSha, secondSha);
+
+    // Remove the installed copy so restore must re-clone.
+    const libDir = join(dir, ".jaiph", "libs", "remote-beta");
+    rmSync(libDir, { recursive: true, force: true });
+
+    const { result: restoreCode, stderr } = await captureStderr(() =>
+      runInstall([], { cwd: dir }),
+    );
+
+    assert.notEqual(restoreCode, 0, "restore must exit non-zero on commit mismatch");
+    assert.ok(stderr.includes(firstSha), `expected locked SHA in stderr; got: ${stderr}`);
+    assert.ok(stderr.includes(secondSha), `expected cloned SHA in stderr; got: ${stderr}`);
+    assert.ok(!existsSync(libDir), "lib dir must be removed after mismatch");
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: fixture repo with no .jh modules fails and leaves no lib dir or lock entry", async () => {
+  const dir = makeTempProject();
+  try {
+    const remote = makeFixtureRepo(dir, "remote-empty", { withJh: false });
+
+    const { result: code, stderr } = await captureStderr(() =>
+      runInstall([remote], { cwd: dir }),
+    );
+
+    assert.notEqual(code, 0, "install must exit non-zero when no .jh modules are present");
+    assert.ok(
+      stderr.includes('lib "remote-empty" contains no .jh modules — not a jaiph library?'),
+      `expected no-modules error; got: ${stderr}`,
+    );
+    assert.ok(
+      !existsSync(join(dir, ".jaiph", "libs", "remote-empty")),
+      "lib dir must be removed on no-jh failure",
+    );
+    const lockPath = join(dir, ".jaiph", "libs.lock");
+    assert.ok(existsSync(lockPath));
+    const lock = JSON.parse(readFileSync(lockPath, "utf8")) as { libs: { name: string }[] };
+    assert.equal(lock.libs.length, 0, "no lock entry must be written for no-jh failure");
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: legacy lockfile without commit field still restores", async () => {
+  const dir = makeTempProject();
+  try {
+    const remote = makeFixtureRepo(dir, "remote-gamma");
+
+    mkdirSync(join(dir, ".jaiph"), { recursive: true });
+    writeFileSync(
+      join(dir, ".jaiph", "libs.lock"),
+      JSON.stringify({ libs: [{ name: "remote-gamma", url: remote }] }) + "\n",
+      "utf8",
+    );
+
+    const code = await runInstall([], { cwd: dir });
+
+    assert.equal(code, 0, "restore from legacy lockfile (no commit) must succeed");
+    const libDir = join(dir, ".jaiph", "libs", "remote-gamma");
+    assert.ok(existsSync(libDir), "lib dir should be present after restore");
+    assert.ok(!existsSync(join(libDir, ".git")), ".git directory must still be stripped on restore");
+  } finally {
+    cleanup(dir);
+  }
+});
+
+test("install: mixed success and failure locks only the successful libs", async () => {
+  const dir = makeTempProject();
+  try {
+    const cloneRunner: CloneRunner = async (spec) => {
+      if (spec.name === "bad") {
+        return { spec, ok: false, message: "simulated failure" };
+      }
+      mkdirSync(spec.libDir, { recursive: true });
+      writeFileSync(join(spec.libDir, "lib.jh"), "", "utf8");
+      return { spec, ok: true };
+    };
+
+    const code = await runInstall(
+      ["https://example.com/good.git", "https://example.com/bad.git", "https://example.com/also-good.git"],
+      { cwd: dir, cloneRunner, concurrency: 4 },
+    );
+
+    assert.notEqual(code, 0, "any failure must propagate non-zero exit");
+    const lock = JSON.parse(readFileSync(join(dir, ".jaiph", "libs.lock"), "utf8")) as {
+      libs: { name: string }[];
+    };
+    assert.deepEqual(lock.libs.map((e) => e.name).sort(), ["also-good", "good"]);
+  } finally {
+    cleanup(dir);
+  }
+});
diff --git a/src/cli/commands/install.ts b/src/cli/commands/install.ts
index 2c7254ff..2e9af045 100644
--- a/src/cli/commands/install.ts
+++ b/src/cli/commands/install.ts
@@ -1,19 +1,72 @@
-import { existsSync, mkdirSync, readFileSync, rmSync, writeFileSync } from "node:fs";
-import { join, resolve } from "node:path";
-import { execSync } from "node:child_process";
+import { existsSync, mkdirSync, readdirSync, readFileSync, rmSync, writeFileSync } from "node:fs";
+import { join } from "node:path";
+import { execFileSync, spawn } from "node:child_process";
 import { colorPalette } from "../shared/errors";
 import { detectWorkspaceRoot } from "../shared/paths";
+import { hasHelpFlag } from "../shared/usage";
+import {
+  DEFAULT_REGISTRY_URL,
+  isRegistryNameArg,
+  loadRegistryIndex,
+  parseNameArg,
+  registrySource,
+  type RegistryIndex,
+} from "./registry";
+
+const INSTALL_USAGE =
+  "Usage: jaiph install [--force] [<name[@version]> | <repo-url[@version]> ...]\n\n" +
+  "Names are resolved via the registry (JAIPH_REGISTRY env var, else " +
+  `${DEFAULT_REGISTRY_URL}).\n` +
+  "Names match /^[A-Za-z0-9_-]+(@<version>)?$/; anything containing '/' or ':' is\n" +
+  "treated as a git clone URL. Each lib lands in .jaiph/libs/<name>/ and is\n" +
+  "recorded in .jaiph/libs.lock. With no args, restore every library listed in\n" +
+  "the lockfile (the registry is never read on restore).\n\n" +
+  "  --force         delete existing clone and re-clone\n" +
+  "  -h, --help      show this help\n\n" +
+  "Environment:\n" +
+  "  JAIPH_REGISTRY  path or URL of the registry index (default: " +
+  `${DEFAULT_REGISTRY_URL}).\n` +
+  "                  Values without '://' (or with file://) are read from disk.\n\n" +
+  "Examples:\n" +
+  "  jaiph install jaiphlang\n" +
+  "  jaiph install mylib@v1.2\n" +
+  "  jaiph install https://github.com/you/queue-lib.git@v1.0\n";
 
 interface LockEntry {
   name: string;
   url: string;
   version?: string;
+  commit?: string;
 }
 
 interface LockFile {
   libs: LockEntry[];
 }
 
+export interface InstallSpec {
+  name: string;
+  url: string;
+  version?: string;
+  libDir: string;
+  expectedCommit?: string;
+}
+
+export interface CloneOutcome {
+  spec: InstallSpec;
+  ok: boolean;
+  message?: string;
+}
+
+export type CloneRunner = (spec: InstallSpec) => Promise<CloneOutcome>;
+
+export interface RunInstallOptions {
+  cwd?: string;
+  cloneRunner?: CloneRunner;
+  concurrency?: number;
+}
+
+const DEFAULT_CONCURRENCY = 4;
+
 function deriveLibName(url: string): string {
   const lastSegment = url.split("/").pop() ?? url;
   return lastSegment.replace(/\.git$/, "");
@@ -53,80 +106,266 @@ function upsertLockEntry(lock: LockFile, entry: LockEntry): void {
   }
 }
 
-function cloneLib(
-  url: string,
-  version: string | undefined,
-  targetDir: string,
-  force: boolean,
-  palette: ReturnType<typeof colorPalette>,
-): boolean {
-  const name = deriveLibName(url);
-  const libDir = join(targetDir, name);
+function specToLockEntry(spec: InstallSpec, commit?: string): LockEntry {
+  return {
+    name: spec.name,
+    url: spec.url,
+    ...(spec.version ? { version: spec.version } : {}),
+    ...(commit ? { commit } : {}),
+  };
+}
 
-  if (existsSync(libDir)) {
-    if (force) {
-      rmSync(libDir, { recursive: true, force: true });
-    } else {
-      process.stdout.write(`${palette.dim}▸ ${name} already exists, skipping (use --force to re-clone)${palette.reset}\n`);
-      return true;
+/** True if `dir` contains at least one `*.jh` file (recursive, skipping `.git`). */
+function hasJhFileRecursive(dir: string): boolean {
+  const stack: string[] = [dir];
+  while (stack.length > 0) {
+    const d = stack.pop()!;
+    let entries;
+    try {
+      entries = readdirSync(d, { withFileTypes: true });
+    } catch {
+      continue;
+    }
+    for (const ent of entries) {
+      if (ent.name === ".git") continue;
+      if (ent.isDirectory()) {
+        stack.push(join(d, ent.name));
+      } else if (ent.isFile() && ent.name.endsWith(".jh")) {
+        return true;
+      }
     }
   }
+  return false;
+}
 
-  const branchFlag = version ? ` --branch ${version}` : "";
-  const cmd = `git clone --depth 1${branchFlag} ${url} ${libDir}`;
+/** Returns the 40-char HEAD SHA of `libDir`, or undefined when git is unavailable or there is no `.git`. */
+function revParseHead(libDir: string): string | undefined {
   try {
-    execSync(cmd, { stdio: "pipe" });
-    process.stdout.write(`${palette.green}✓ Installed ${name}${version ? ` @ ${version}` : ""}${palette.reset}\n`);
-    return true;
-  } catch (err) {
-    const msg = err instanceof Error ? err.message : String(err);
-    process.stderr.write(`Failed to install ${name}: ${msg}\n`);
-    return false;
+    const out = execFileSync("git", ["-C", libDir, "rev-parse", "HEAD"], {
+      stdio: ["ignore", "pipe", "pipe"],
+    });
+    const sha = out.toString().trim();
+    return /^[0-9a-f]{40}$/.test(sha) ? sha : undefined;
+  } catch {
+    return undefined;
   }
 }
 
-export function runInstall(rest: string[]): number {
+interface PostCloneResult {
+  ok: boolean;
+  commit?: string;
+  message?: string;
+}
+
+/**
+ * Post-clone hygiene: assert the tree contains at least one `.jh` module,
+ * capture the HEAD SHA, strip `.git` so the installed lib is plain files,
+ * and (when a locked commit was passed in via `spec.expectedCommit`) fail
+ * if the cloned commit differs from the recorded one. On any failure the
+ * lib directory is removed so callers never write a lock entry for it.
+ */
+function postCloneHygiene(spec: InstallSpec): PostCloneResult {
+  if (!hasJhFileRecursive(spec.libDir)) {
+    rmSync(spec.libDir, { recursive: true, force: true });
+    return {
+      ok: false,
+      message: `lib "${spec.name}" contains no .jh modules — not a jaiph library?`,
+    };
+  }
+  const gitDir = join(spec.libDir, ".git");
+  let commit: string | undefined;
+  if (existsSync(gitDir)) {
+    commit = revParseHead(spec.libDir);
+    rmSync(gitDir, { recursive: true, force: true });
+  }
+  if (spec.expectedCommit && commit && commit !== spec.expectedCommit) {
+    const versionLabel = spec.version ?? "<ref>";
+    rmSync(spec.libDir, { recursive: true, force: true });
+    return {
+      ok: false,
+      message:
+        `lib "${spec.name}" commit mismatch: locked ${spec.expectedCommit}, cloned ${commit} — ` +
+        `the ref may have moved; re-run \`jaiph install ${spec.name}@${versionLabel}\` ` +
+        `explicitly to accept the new commit`,
+    };
+  }
+  return { ok: true, commit };
+}
+
+/** Default clone runner: `git clone --depth 1 [--branch <ref>] <url> <libDir>` via spawn. */
+function gitCloneRunner(spec: InstallSpec): Promise<CloneOutcome> {
+  return new Promise((done) => {
+    const args = ["clone", "--depth", "1"];
+    if (spec.version) {
+      args.push("--branch", spec.version);
+    }
+    args.push(spec.url, spec.libDir);
+    const child = spawn("git", args, { stdio: ["ignore", "pipe", "pipe"] });
+    let stderr = "";
+    child.stderr.on("data", (chunk: Buffer) => {
+      stderr += chunk.toString();
+    });
+    child.on("error", (err) => {
+      done({ spec, ok: false, message: err.message });
+    });
+    child.on("close", (code) => {
+      if (code === 0) {
+        done({ spec, ok: true });
+      } else {
+        const tail = stderr.trim().split(/\r?\n/).filter(Boolean).pop();
+        done({ spec, ok: false, message: tail ?? `git clone exited with code ${code}` });
+      }
+    });
+  });
+}
+
+async function runWithConcurrency<T, R>(items: T[], limit: number, fn: (item: T) => Promise<R>): Promise<R[]> {
+  const results = new Array<R>(items.length);
+  let next = 0;
+  const worker = async (): Promise<void> => {
+    while (true) {
+      const i = next++;
+      if (i >= items.length) return;
+      results[i] = await fn(items[i]!);
+    }
+  };
+  const workerCount = Math.max(1, Math.min(limit, items.length));
+  await Promise.all(Array.from({ length: workerCount }, () => worker()));
+  return results;
+}
+
+/**
+ * Map raw arg strings to install specs. Args that look like bare registry
+ * names (no `/`, no `:`) are resolved through the registry — loaded at most
+ * once, only when at least one bare-name arg is present. Everything else is
+ * treated as a git clone URL with optional `@version`, matching prior behavior.
+ */
+async function resolveInstallSpecs(args: string[], libsDir: string): Promise<InstallSpec[]> {
+  const hasName = args.some(isRegistryNameArg);
+  let index: RegistryIndex | undefined;
+  let source: string | undefined;
+  if (hasName) {
+    source = registrySource();
+    index = await loadRegistryIndex(source);
+  }
+  const specs: InstallSpec[] = [];
+  for (const arg of args) {
+    if (isRegistryNameArg(arg)) {
+      const { name, version } = parseNameArg(arg);
+      const entry = index!.libs[name];
+      if (!entry) {
+        throw new Error(`lib "${name}" not found in registry ${source}`);
+      }
+      specs.push({ name, url: entry.url, version, libDir: join(libsDir, name) });
+    } else {
+      const { url, version } = parseUrlAndVersion(arg);
+      const name = deriveLibName(url);
+      specs.push({ name, url, version, libDir: join(libsDir, name) });
+    }
+  }
+  return specs;
+}
+
+export async function runInstall(rest: string[], opts: RunInstallOptions = {}): Promise<number> {
+  if (hasHelpFlag(rest)) {
+    process.stdout.write(INSTALL_USAGE);
+    return 0;
+  }
   const palette = colorPalette();
   const force = rest.includes("--force");
   const args = rest.filter((a) => a !== "--force");
-  const workspaceRoot = detectWorkspaceRoot(process.cwd());
+  const cwd = opts.cwd ?? process.cwd();
+  const workspaceRoot = detectWorkspaceRoot(cwd);
   const libsDir = join(workspaceRoot, ".jaiph", "libs");
   const lockPath = join(workspaceRoot, ".jaiph", "libs.lock");
+  const cloneRunner = opts.cloneRunner ?? gitCloneRunner;
+  const concurrency = Math.max(1, opts.concurrency ?? DEFAULT_CONCURRENCY);
 
   mkdirSync(libsDir, { recursive: true });
 
-  // No args: restore from lockfile
-  if (args.length === 0) {
-    const lock = readLockFile(lockPath);
+  const isRestoreFromLock = args.length === 0;
+  let lock: LockFile;
+  let specs: InstallSpec[];
+
+  if (isRestoreFromLock) {
+    lock = readLockFile(lockPath);
     if (lock.libs.length === 0) {
       process.stdout.write("No libs in lockfile.\n");
       return 0;
     }
     process.stdout.write(`\nRestoring ${lock.libs.length} lib(s) from lockfile\n\n`);
-    let ok = true;
-    for (const entry of lock.libs) {
-      if (!cloneLib(entry.url, entry.version, libsDir, force, palette)) {
-        ok = false;
+    specs = lock.libs.map((e) => ({
+      name: e.name,
+      url: e.url,
+      version: e.version,
+      libDir: join(libsDir, e.name),
+      expectedCommit: e.commit,
+    }));
+  } else {
+    process.stdout.write("\n");
+    lock = readLockFile(lockPath);
+    try {
+      specs = await resolveInstallSpecs(args, libsDir);
+    } catch (err) {
+      process.stderr.write(`${(err as Error).message}\n`);
+      return 1;
+    }
+  }
+
+  // Plan phase: skip warm-path libs without invoking the cloner; queue the rest.
+  const skipped: InstallSpec[] = [];
+  const jobs: InstallSpec[] = [];
+  for (const spec of specs) {
+    if (existsSync(spec.libDir)) {
+      if (force) {
+        rmSync(spec.libDir, { recursive: true, force: true });
+        jobs.push(spec);
+      } else {
+        process.stdout.write(`${palette.dim}▸ ${spec.name} already exists, skipping (use --force to re-clone)${palette.reset}\n`);
+        skipped.push(spec);
       }
+    } else {
+      jobs.push(spec);
     }
-    process.stdout.write("\n");
-    return ok ? 0 : 1;
   }
 
-  // Install each specified lib
-  process.stdout.write("\n");
-  const lock = readLockFile(lockPath);
-  let ok = true;
-  for (const arg of args) {
-    const { url, version } = parseUrlAndVersion(arg);
-    const name = deriveLibName(url);
-    if (!cloneLib(url, version, libsDir, force, palette)) {
-      ok = false;
-      continue;
+  const commits = new Map<string, string>();
+  const wrappedRunner: CloneRunner = async (spec) => {
+    const out = await cloneRunner(spec);
+    if (!out.ok) return out;
+    const post = postCloneHygiene(spec);
+    if (!post.ok) {
+      return { spec, ok: false, message: post.message };
+    }
+    if (post.commit) commits.set(spec.name, post.commit);
+    return out;
+  };
+  const outcomes = await runWithConcurrency(jobs, concurrency, wrappedRunner);
+
+  let allOk = true;
+  for (const outcome of outcomes) {
+    if (outcome.ok) {
+      const v = outcome.spec.version ? ` @ ${outcome.spec.version}` : "";
+      process.stdout.write(`${palette.green}✓ Installed ${outcome.spec.name}${v}${palette.reset}\n`);
+    } else {
+      allOk = false;
+      process.stderr.write(`Failed to install ${outcome.spec.name}: ${outcome.message ?? "unknown error"}\n`);
     }
-    upsertLockEntry(lock, { name, url, ...(version ? { version } : {}) });
   }
-  writeLockFile(lockPath, lock);
+
+  if (!isRestoreFromLock) {
+    for (const spec of skipped) {
+      const existing = lock.libs.find((e) => e.name === spec.name);
+      upsertLockEntry(lock, specToLockEntry(spec, existing?.commit));
+    }
+    for (const outcome of outcomes) {
+      if (outcome.ok) {
+        upsertLockEntry(lock, specToLockEntry(outcome.spec, commits.get(outcome.spec.name)));
+      }
+    }
+    writeLockFile(lockPath, lock);
+  }
+
   process.stdout.write("\n");
-  return ok ? 0 : 1;
+  return allOk ? 0 : 1;
 }
diff --git a/src/cli/commands/registry.test.ts b/src/cli/commands/registry.test.ts
new file mode 100644
index 00000000..42abba61
--- /dev/null
+++ b/src/cli/commands/registry.test.ts
@@ -0,0 +1,19 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readFileSync } from "node:fs";
+import { resolve } from "node:path";
+import { loadRegistryIndex } from "./registry";
+
+// Compiled to dist/src/cli/commands/registry.test.js — four levels up lands at repo root.
+const SHIPPED_REGISTRY = resolve(__dirname, "../../../../docs/registry");
+
+test("shipped docs/registry parses through loadRegistryIndex", async () => {
+  const index = await loadRegistryIndex(SHIPPED_REGISTRY);
+  assert.ok(Object.keys(index.libs).length > 0, "shipped registry must list at least one lib");
+});
+
+test("shipped docs/registry has no Jekyll front matter and parses as JSON", () => {
+  const text = readFileSync(SHIPPED_REGISTRY, "utf8");
+  assert.ok(!text.trimStart().startsWith("---"), "docs/registry must not carry Jekyll front matter");
+  assert.doesNotThrow(() => JSON.parse(text), "docs/registry must be valid JSON");
+});
diff --git a/src/cli/commands/registry.ts b/src/cli/commands/registry.ts
new file mode 100644
index 00000000..4dd22815
--- /dev/null
+++ b/src/cli/commands/registry.ts
@@ -0,0 +1,116 @@
+import { readFileSync } from "node:fs";
+import { fileURLToPath } from "node:url";
+
+export const DEFAULT_REGISTRY_URL = "https://jaiph.org/registry";
+
+export const REGISTRY_NAME_REGEX = /^[A-Za-z0-9_-]+$/;
+
+const NAME_ARG_REGEX = /^[A-Za-z0-9_-]+(@[A-Za-z0-9._+/-]+)?$/;
+
+export interface RegistryEntry {
+  url: string;
+  description: string;
+}
+
+export interface RegistryIndex {
+  libs: Record<string, RegistryEntry>;
+}
+
+/** True for `name` or `name@version` (single segment — no `/`, no `:`). */
+export function isRegistryNameArg(arg: string): boolean {
+  if (arg.includes("/") || arg.includes(":")) return false;
+  return NAME_ARG_REGEX.test(arg);
+}
+
+export function parseNameArg(arg: string): { name: string; version?: string } {
+  const at = arg.indexOf("@");
+  if (at > 0) {
+    return { name: arg.slice(0, at), version: arg.slice(at + 1) };
+  }
+  return { name: arg };
+}
+
+/** Pick the registry source: env override wins, else the default URL. */
+export function registrySource(env: NodeJS.ProcessEnv = process.env): string {
+  const override = env.JAIPH_REGISTRY;
+  if (override && override.length > 0) return override;
+  return DEFAULT_REGISTRY_URL;
+}
+
+/**
+ * Load and validate the registry index from `source`. `file://` URLs and any
+ * value without a `://` scheme are read from disk; everything else is fetched
+ * via global `fetch`. Throws `Error` with the source in the message on any
+ * read/parse/shape failure.
+ */
+export async function loadRegistryIndex(source: string): Promise<RegistryIndex> {
+  const text = await readRegistrySource(source);
+  let parsed: unknown;
+  try {
+    parsed = JSON.parse(text);
+  } catch (err) {
+    throw new Error(`failed to parse registry ${source}: ${(err as Error).message}`);
+  }
+  return validateRegistryIndex(parsed, source);
+}
+
+async function readRegistrySource(source: string): Promise<string> {
+  if (source.startsWith("file://")) {
+    const path = fileURLToPath(source);
+    return readDisk(path, source);
+  }
+  if (!source.includes("://")) {
+    return readDisk(source, source);
+  }
+  let res: Response;
+  try {
+    res = await fetch(source);
+  } catch (err) {
+    throw new Error(`failed to fetch registry ${source}: ${(err as Error).message}`);
+  }
+  if (!res.ok) {
+    throw new Error(`failed to fetch registry ${source}: HTTP ${res.status}`);
+  }
+  try {
+    return await res.text();
+  } catch (err) {
+    throw new Error(`failed to fetch registry ${source}: ${(err as Error).message}`);
+  }
+}
+
+function readDisk(path: string, source: string): string {
+  try {
+    return readFileSync(path, "utf8");
+  } catch (err) {
+    throw new Error(`failed to read registry ${source}: ${(err as Error).message}`);
+  }
+}
+
+function validateRegistryIndex(parsed: unknown, source: string): RegistryIndex {
+  if (typeof parsed !== "object" || parsed === null || Array.isArray(parsed)) {
+    throw new Error(`failed to parse registry ${source}: top-level must be an object`);
+  }
+  const libs = (parsed as { libs?: unknown }).libs;
+  if (typeof libs !== "object" || libs === null || Array.isArray(libs)) {
+    throw new Error(`failed to parse registry ${source}: "libs" must be an object`);
+  }
+  const out: Record<string, RegistryEntry> = {};
+  for (const [name, raw] of Object.entries(libs)) {
+    if (!REGISTRY_NAME_REGEX.test(name)) {
+      throw new Error(`failed to parse registry ${source}: invalid name "${name}"`);
+    }
+    if (typeof raw !== "object" || raw === null) {
+      throw new Error(`failed to parse registry ${source}: entry "${name}" must be an object`);
+    }
+    const url = (raw as { url?: unknown }).url;
+    const description = (raw as { description?: unknown }).description;
+    if (typeof url !== "string" || url.length === 0) {
+      throw new Error(`failed to parse registry ${source}: entry "${name}" missing string "url"`);
+    }
+    if (typeof description !== "string") {
+      throw new Error(`failed to parse registry ${source}: entry "${name}" missing string "description"`);
+    }
+    out[name] = { url, description };
+  }
+  return { libs: out };
+}
diff --git a/src/cli/commands/run.test.ts b/src/cli/commands/run.test.ts
new file mode 100644
index 00000000..bfb6940c
--- /dev/null
+++ b/src/cli/commands/run.test.ts
@@ -0,0 +1,210 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { mkdtempSync, writeFileSync, rmSync, mkdirSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { runWorkflow } from "./run";
+import { _dockerExec, _dockerSpawn } from "../../runtime/docker";
+
+const MIN_WORKFLOW = `workflow default() {\n  log "hi"\n}\n`;
+
+function captureStreams(): { restore: () => void; stderr: () => string; stdout: () => string } {
+  let err = "";
+  let out = "";
+  const origErr = process.stderr.write;
+  const origOut = process.stdout.write;
+  process.stderr.write = ((chunk: string | Uint8Array) => {
+    err += String(chunk);
+    return true;
+  }) as typeof process.stderr.write;
+  process.stdout.write = ((chunk: string | Uint8Array) => {
+    out += String(chunk);
+    return true;
+  }) as typeof process.stdout.write;
+  return {
+    restore: () => {
+      process.stderr.write = origErr;
+      process.stdout.write = origOut;
+    },
+    stderr: () => err,
+    stdout: () => out,
+  };
+}
+
+function fenceDockerCalls(): { restore: () => void; calls: () => string[] } {
+  const origExec = _dockerExec.run;
+  const origSpawn = _dockerSpawn.run;
+  const calls: string[] = [];
+  _dockerExec.run = (_args: string[], _opts: object) => {
+    calls.push("exec");
+    throw new Error("docker exec should not be invoked in this test");
+  };
+  _dockerSpawn.run = (_args: string[], _opts: object) => {
+    calls.push("spawn");
+    throw new Error("docker spawn should not be invoked in this test");
+  };
+  return {
+    restore: () => { _dockerExec.run = origExec; _dockerSpawn.run = origSpawn; },
+    calls: () => calls,
+  };
+}
+
+// ---------------------------------------------------------------------------
+// E_FLAG_CONFLICT: --inplace + --unsafe must abort before any container launch
+// ---------------------------------------------------------------------------
+
+test("runWorkflow: --inplace + --unsafe fails with E_FLAG_CONFLICT, no docker exec or spawn invoked", async () => {
+  const ws = mkdtempSync(join(tmpdir(), "jaiph-run-conflict-ws-"));
+  writeFileSync(join(ws, "flow.jh"), MIN_WORKFLOW);
+  const fence = fenceDockerCalls();
+  const cap = captureStreams();
+  let code: number;
+  try {
+    code = await runWorkflow(["--inplace", "--unsafe", join(ws, "flow.jh")]);
+  } finally {
+    cap.restore();
+    fence.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+  assert.equal(code, 1, "must return 1 on flag conflict");
+  assert.match(cap.stderr(), /E_FLAG_CONFLICT/);
+  assert.deepEqual(fence.calls(), [], "no docker exec/spawn must be invoked");
+});
+
+test("runWorkflow: --inplace + env JAIPH_UNSAFE=true also fails with E_FLAG_CONFLICT", async () => {
+  const ws = mkdtempSync(join(tmpdir(), "jaiph-run-conflict-ws-"));
+  writeFileSync(join(ws, "flow.jh"), MIN_WORKFLOW);
+  const fence = fenceDockerCalls();
+  const cap = captureStreams();
+  const savedUnsafe = process.env.JAIPH_UNSAFE;
+  process.env.JAIPH_UNSAFE = "true";
+  let code: number;
+  try {
+    code = await runWorkflow(["--inplace", join(ws, "flow.jh")]);
+  } finally {
+    if (savedUnsafe === undefined) delete process.env.JAIPH_UNSAFE;
+    else process.env.JAIPH_UNSAFE = savedUnsafe;
+    cap.restore();
+    fence.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+  assert.equal(code, 1);
+  assert.match(cap.stderr(), /E_FLAG_CONFLICT/);
+  assert.deepEqual(fence.calls(), []);
+});
+
+// ---------------------------------------------------------------------------
+// --workspace validation: missing value, non-existent dir, file (not dir)
+// ---------------------------------------------------------------------------
+
+test("runWorkflow: --workspace without a value errors and returns 1", async () => {
+  const fence = fenceDockerCalls();
+  const cap = captureStreams();
+  let code: number;
+  try {
+    code = await runWorkflow(["--workspace"]);
+  } finally {
+    cap.restore();
+    fence.restore();
+  }
+  assert.equal(code, 1);
+  assert.match(cap.stderr(), /--workspace requires a directory path/);
+  assert.deepEqual(fence.calls(), []);
+});
+
+test("runWorkflow: --workspace pointing to a non-existent dir errors and returns 1", async () => {
+  const ws = mkdtempSync(join(tmpdir(), "jaiph-run-ws-"));
+  writeFileSync(join(ws, "flow.jh"), MIN_WORKFLOW);
+  const missing = join(ws, "does-not-exist");
+  const fence = fenceDockerCalls();
+  const cap = captureStreams();
+  let code: number;
+  try {
+    code = await runWorkflow(["--workspace", missing, join(ws, "flow.jh")]);
+  } finally {
+    cap.restore();
+    fence.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+  assert.equal(code, 1);
+  assert.match(cap.stderr(), /--workspace path does not exist/);
+  assert.deepEqual(fence.calls(), []);
+});
+
+test("runWorkflow: --workspace pointing to a file (not a directory) errors and returns 1", async () => {
+  const ws = mkdtempSync(join(tmpdir(), "jaiph-run-ws-"));
+  writeFileSync(join(ws, "flow.jh"), MIN_WORKFLOW);
+  const notDir = join(ws, "notadir.txt");
+  writeFileSync(notDir, "");
+  const fence = fenceDockerCalls();
+  const cap = captureStreams();
+  let code: number;
+  try {
+    code = await runWorkflow(["--workspace", notDir, join(ws, "flow.jh")]);
+  } finally {
+    cap.restore();
+    fence.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+  assert.equal(code, 1);
+  assert.match(cap.stderr(), /--workspace path is not a directory/);
+  assert.deepEqual(fence.calls(), []);
+});
+
+// ---------------------------------------------------------------------------
+// --raw applies sandbox flags too: flag conflict aborts before runner spawn
+// ---------------------------------------------------------------------------
+
+test("runWorkflow --raw: --inplace + --unsafe fails with E_FLAG_CONFLICT", async () => {
+  const ws = mkdtempSync(join(tmpdir(), "jaiph-run-raw-conflict-ws-"));
+  writeFileSync(join(ws, "flow.jh"), MIN_WORKFLOW);
+  const fence = fenceDockerCalls();
+  const cap = captureStreams();
+  let code: number;
+  try {
+    code = await runWorkflow(["--raw", "--inplace", "--unsafe", join(ws, "flow.jh")]);
+  } finally {
+    cap.restore();
+    fence.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+  assert.equal(code, 1);
+  assert.match(cap.stderr(), /E_FLAG_CONFLICT/);
+  // --raw never goes through docker anyway, but assert fence still untouched.
+  assert.deepEqual(fence.calls(), []);
+});
+
+// ---------------------------------------------------------------------------
+// --workspace explicit path wins over auto-detect: even when the .jh file
+// lives under a perfectly-good auto-detected workspace, the explicit path
+// is consulted (and rejected as missing) before any fallback applies.
+// ---------------------------------------------------------------------------
+
+test("runWorkflow: --workspace bypasses detectWorkspaceRoot — explicit-missing wins over auto-detectable", async () => {
+  // A workspace-shaped dir (has .git) that would be auto-detected.
+  const autoDetected = mkdtempSync(join(tmpdir(), "jaiph-run-ws-auto-"));
+  mkdirSync(join(autoDetected, ".git"), { recursive: true });
+  const flowPath = join(autoDetected, "flow.jh");
+  writeFileSync(flowPath, MIN_WORKFLOW);
+  const explicitMissing = join(autoDetected, "no-such-explicit-workspace");
+  const fence = fenceDockerCalls();
+  const cap = captureStreams();
+  let code: number;
+  try {
+    code = await runWorkflow(["--workspace", explicitMissing, flowPath]);
+  } finally {
+    cap.restore();
+    fence.restore();
+    rmSync(autoDetected, { recursive: true, force: true });
+  }
+  // If --workspace were ignored, detectWorkspaceRoot would happily find
+  // `autoDetected` and the run would proceed past workspace validation.
+  // The explicit-missing error proves the flag is consulted first.
+  assert.equal(code, 1);
+  assert.match(cap.stderr(), /--workspace path does not exist/);
+  assert.ok(
+    cap.stderr().includes(explicitMissing),
+    `error must name the explicit --workspace path; got: ${cap.stderr()}`,
+  );
+  assert.deepEqual(fence.calls(), []);
+});
diff --git a/src/cli/commands/run.ts b/src/cli/commands/run.ts
index c741b8f5..5f143e54 100644
--- a/src/cli/commands/run.ts
+++ b/src/cli/commands/run.ts
@@ -10,7 +10,8 @@ import { tmpdir } from "node:os";
 import { dirname, join, resolve, extname } from "node:path";
 import { basename } from "node:path";
 import { parsejaiph } from "../../parser";
-import { buildScripts } from "../../transpiler";
+import { buildScripts, buildScriptsFromGraph } from "../../transpiler";
+import { loadModuleGraph, writeModuleGraph } from "../../transpile/module-graph";
 import { metadataToConfig } from "../../config";
 import { buildStepDisplayParamPairs, formatNamedParamsForDisplay } from "./format-params.js";
 import {
@@ -21,9 +22,26 @@ import {
   failedStepArtifactPaths,
   discoverDockerRunDir,
   remapContainerPath,
+  formatDockerTimeoutMessage,
 } from "../shared/errors";
 import { detectWorkspaceRoot } from "../shared/paths";
-import { parseArgs } from "../shared/usage";
+import { hasHelpFlag, parseArgs } from "../shared/usage";
+
+const RUN_USAGE =
+  "Usage: jaiph run [--target <dir>] [--raw] [--workspace <dir>] [--inplace] [--unsafe] [--yes|-y] <file.jh> [--] [args...]\n\n" +
+  "Parse, validate, and run a Jaiph workflow file. Requires a `workflow default` entrypoint.\n\n" +
+  "  --target <dir>     keep emitted scripts and run metadata under <dir>\n" +
+  "  --raw              skip banner, progress tree, hooks, and failure footer; inherited stdio\n" +
+  "  --workspace <dir>  workspace root for import resolution (default: auto-detect from the .jh file)\n" +
+  "  --inplace          bind-mount the host workspace rw so edits land live (sets JAIPH_INPLACE=1 for this run)\n" +
+  "  --unsafe           run on the host with no sandbox (sets JAIPH_UNSAFE=true for this run)\n" +
+  "  -y, --yes          skip the in-place confirmation prompt (sets JAIPH_INPLACE_YES=1 for this run)\n" +
+  "  --                 end of jaiph flags; remaining args go to workflow default\n" +
+  "  -h, --help         show this help\n\n" +
+  "Note: these flags only affect `jaiph run`; the corresponding env vars also apply to other entry points.\n\n" +
+  "Examples:\n" +
+  "  jaiph run ./flows/review.jh \"review this diff\"\n" +
+  "  jaiph run --inplace --workspace ./app ./flows/fix.jh\n";
 import {
   spawnRunProcess,
   setupRunSignalHandlers,
@@ -35,17 +53,20 @@ import {
   prepareImage,
   spawnDockerProcess,
   cleanupDocker,
+  withDockerExitGuard,
   resolveDockerHostRunsRoot,
   selectSandboxMode,
   type SandboxMode,
 } from "../../runtime/docker";
+import { confirmInplaceRun } from "../../runtime/docker-inplace";
 import {
   styleKeywordLabel,
   formatElapsedDuration,
   formatRunningBottomLine,
 } from "../run/progress";
 import { loadMergedHooks, registerHooksSubscriber } from "../run/hooks";
-import { resolveRuntimeEnv } from "../run/env";
+import { resolveRuntimeEnv, applySandboxFlags } from "../run/env";
+import { preflightAgentCredentials } from "../run/preflight-credentials";
 import { colorize, formatJaiphRunningBannerLines } from "../run/display";
 import { createRunEmitter } from "../run/emitter";
 import {
@@ -59,7 +80,18 @@ import {
 } from "../run/stderr-handler";
 
 export async function runWorkflow(rest: string[]): Promise<number> {
-  const { target, raw, positional } = parseArgs(rest);
+  if (hasHelpFlag(rest)) {
+    process.stdout.write(RUN_USAGE);
+    return 0;
+  }
+  let parsed: ReturnType<typeof parseArgs>;
+  try {
+    parsed = parseArgs(rest);
+  } catch (err) {
+    process.stderr.write(`${err instanceof Error ? err.message : String(err)}\n`);
+    return 1;
+  }
+  const { target, raw, workspace, inplace, unsafe, yes, positional } = parsed;
   const input = positional[0];
   const runArgs = positional.slice(1);
   if (!input) {
@@ -67,7 +99,17 @@ export async function runWorkflow(rest: string[]): Promise<number> {
     return 1;
   }
   const inputAbs = resolve(input);
-  const workspaceRoot = detectWorkspaceRoot(dirname(inputAbs));
+  const workspaceRoot = workspace ? resolve(workspace) : detectWorkspaceRoot(dirname(inputAbs));
+  if (workspace) {
+    if (!existsSync(workspaceRoot)) {
+      process.stderr.write(`--workspace path does not exist: ${workspaceRoot}\n`);
+      return 1;
+    }
+    if (!statSync(workspaceRoot).isDirectory()) {
+      process.stderr.write(`--workspace path is not a directory: ${workspaceRoot}\n`);
+      return 1;
+    }
+  }
   const inputStat = statSync(inputAbs);
   const ext = extname(inputAbs);
   if (!inputStat.isFile() || ext !== ".jh") {
@@ -75,12 +117,14 @@ export async function runWorkflow(rest: string[]): Promise<number> {
     return 1;
   }
 
+  const sandboxFlags = { inplace, unsafe, yes };
   if (raw) {
-    return runWorkflowRaw(inputAbs, workspaceRoot, target, runArgs);
+    return runWorkflowRaw(inputAbs, workspaceRoot, target, runArgs, sandboxFlags);
   }
 
   const hooksConfig = loadMergedHooks(workspaceRoot);
-  const mod = parsejaiph(readFileSync(inputAbs, "utf8"), inputAbs);
+  const graph = loadModuleGraph(inputAbs, workspaceRoot);
+  const mod = graph.modules.get(inputAbs)!.ast;
   const effectiveConfig = metadataToConfig(mod.metadata);
 
   const outDir = target ? resolve(target) : mkdtempSync(join(tmpdir(), "jaiph-run-"));
@@ -94,12 +138,40 @@ export async function runWorkflow(rest: string[]): Promise<number> {
     runtimeEnv.JAIPH_SOURCE_ABS = inputAbs;
     const runId = randomUUID();
     runtimeEnv.JAIPH_RUN_ID = runId;
+    try {
+      applySandboxFlags(runtimeEnv, sandboxFlags);
+    } catch (err) {
+      process.stderr.write(`${err instanceof Error ? err.message : String(err)}\n`);
+      return 1;
+    }
     const dockerConfigForBanner = resolveDockerConfig(mod.metadata?.runtime, runtimeEnv);
+    const credPreflight = preflightAgentCredentials({
+      mod,
+      inputAbs,
+      runtimeEnv,
+      dockerEnabled: dockerConfigForBanner.enabled,
+    });
+    for (const w of credPreflight.warnings) {
+      process.stderr.write(`${w}\n`);
+    }
+    if (credPreflight.errors.length > 0) {
+      for (const e of credPreflight.errors) {
+        process.stderr.write(`${e}\n`);
+      }
+      return 1;
+    }
     if (dockerConfigForBanner.enabled) {
       checkDockerAvailable();
       prepareImage(dockerConfigForBanner);
     }
     const sandboxModeForBanner = dockerConfigForBanner.enabled ? selectSandboxMode(runtimeEnv) : null;
+    if (sandboxModeForBanner === "inplace") {
+      const proceed = await confirmInplaceRun(workspaceRoot, runtimeEnv, isTTY);
+      if (!proceed) {
+        process.stderr.write("jaiph in-place mode: aborted by user.\n");
+        return 1;
+      }
+    }
 
     writeBanner(
       mod,
@@ -111,8 +183,18 @@ export async function runWorkflow(rest: string[]): Promise<number> {
       dockerConfigForBanner.enabled,
       sandboxModeForBanner,
     );
-    const { scriptsDir } = buildScripts(inputAbs, outDir, workspaceRoot);
+    const { scriptsDir } = buildScriptsFromGraph(graph, outDir);
     runtimeEnv.JAIPH_SCRIPTS = scriptsDir;
+    // Serialized module graph consumed by the spawned runner so the runtime
+    // graph reuses these ASTs instead of re-parsing every reachable module.
+    // Docker mounts the workspace read-only, so place the cache under outDir,
+    // which the host already arranges for the container side via its existing
+    // sandbox layout. For local runs the runner reads the path directly.
+    const graphFile = join(outDir, ".jaiph-module-graph.json");
+    writeModuleGraph(graphFile, graph);
+    if (!dockerConfigForBanner.enabled) {
+      runtimeEnv.JAIPH_MODULE_GRAPH_FILE = graphFile;
+    }
     const metaFile = join(outDir, `.jaiph-run-meta-${Date.now()}-${process.pid}.txt`);
 
     const emitter = createRunEmitter();
@@ -147,40 +229,36 @@ export async function runWorkflow(rest: string[]): Promise<number> {
       forceKillAfterMs: 1500,
       onSignalCleanup,
     });
-    const exitGuard = dockerResult
-      ? (): void => { cleanupDocker(dockerResult); }
-      : undefined;
-    if (exitGuard) process.on("exit", exitGuard);
-
-    if (isTTY) {
-      ttyCtx.runningInterval = setInterval(() => {
-        const elapsedSec = (Date.now() - startedAt) / 1000;
-        process.stdout.write("\r" + formatRunningBottomLine("default", elapsedSec) + "\u001b[K");
-      }, 1000);
-    } else {
-      const hbMs = nonTTYHeartbeatTickMs();
-      ttyCtx.nonTTYHeartbeatInterval = setInterval(() => {
-        tickNonTTYHeartbeat(ttyCtx);
-      }, hbMs);
-    }
+    const childExit = await withDockerExitGuard(dockerResult, async () => {
+      if (isTTY) {
+        ttyCtx.runningInterval = setInterval(() => {
+          const elapsedSec = (Date.now() - startedAt) / 1000;
+          process.stdout.write("\r" + formatRunningBottomLine("default", elapsedSec) + "\u001b[K");
+        }, 1000);
+      } else {
+        const hbMs = nonTTYHeartbeatTickMs();
+        ttyCtx.nonTTYHeartbeatInterval = setInterval(() => {
+          tickNonTTYHeartbeat(ttyCtx);
+        }, hbMs);
+      }
 
-    const onLine = createStderrParser(emitter);
-    const buf: StreamBuffers = { stdout: "", stderr: "" };
+      const onLine = createStderrParser(emitter);
+      const buf: StreamBuffers = { stdout: "", stderr: "" };
 
-    wireStreams(execResult, onLine, buf, ttyCtx);
-    const childExit = await waitForRunExit(execResult, () => signalHandlers.remove());
-    drainBuffers(onLine, buf, ttyCtx);
+      wireStreams(execResult, onLine, buf, ttyCtx);
+      const exit = await waitForRunExit(execResult, () => signalHandlers.remove());
+      drainBuffers(onLine, buf, ttyCtx);
 
-    if (dockerResult) {
-      const timedOut = dockerResult.timeoutTimer === undefined && activeDockerConfig.timeoutSeconds > 0
-        ? false
-        : (Date.now() - startedAt) >= activeDockerConfig.timeoutSeconds * 1000;
-      if (timedOut && childExit.status !== 0) {
-        runState.capturedStderr += "E_TIMEOUT container execution exceeded timeout\n";
+      if (dockerResult) {
+        const timedOut = dockerResult.timeoutTimer === undefined && activeDockerConfig.timeoutSeconds > 0
+          ? false
+          : (Date.now() - startedAt) >= activeDockerConfig.timeoutSeconds * 1000;
+        if (timedOut && exit.status !== 0) {
+          runState.capturedStderr += `${formatDockerTimeoutMessage(activeDockerConfig.timeoutSeconds)}\n`;
+        }
       }
-      cleanupDocker(dockerResult);
-      if (exitGuard) process.removeListener("exit", exitGuard);
-    }
+      return exit;
+    });
 
     if (childExit.signal && runState.capturedStderr.trim().length === 0) {
       runState.capturedStderr = `Process terminated by signal ${childExit.signal}`;
@@ -219,6 +297,7 @@ async function runWorkflowRaw(
   workspaceRoot: string,
   target: string | undefined,
   runArgs: string[],
+  sandboxFlags: { inplace?: boolean; unsafe?: boolean; yes?: boolean },
 ): Promise<number> {
   const mod = parsejaiph(readFileSync(inputAbs, "utf8"), inputAbs);
   const effectiveConfig = metadataToConfig(mod.metadata);
@@ -227,6 +306,12 @@ async function runWorkflowRaw(
   try {
     const runtimeEnv = resolveRuntimeEnv(effectiveConfig, workspaceRoot, inputAbs);
     runtimeEnv.JAIPH_SOURCE_ABS = inputAbs;
+    try {
+      applySandboxFlags(runtimeEnv, sandboxFlags);
+    } catch (err) {
+      process.stderr.write(`${err instanceof Error ? err.message : String(err)}\n`);
+      return 1;
+    }
     const { scriptsDir } = buildScripts(inputAbs, outDir, workspaceRoot);
     runtimeEnv.JAIPH_SCRIPTS = scriptsDir;
     const metaFile = join(outDir, `.jaiph-run-meta-${Date.now()}-${process.pid}.txt`);
@@ -455,7 +540,10 @@ function reportResult(
     return 0;
   }
 
-  const failureDetails = resolveFailureDetails(capturedStderr, summaryFile);
+  const failureDetails = resolveFailureDetails(capturedStderr, summaryFile, {
+    code: exitStatus,
+    runDir,
+  });
   process.stderr.write("\n");
   process.stderr.write(
     `${palette.red}\u2717 FAIL${palette.reset} workflow default ${palette.dim}(${elapsedLabel})${palette.reset}\n`,
diff --git a/src/cli/commands/test.ts b/src/cli/commands/test.ts
index 340e7c88..07d81441 100644
--- a/src/cli/commands/test.ts
+++ b/src/cli/commands/test.ts
@@ -1,20 +1,32 @@
 import {
   mkdtempSync,
-  readFileSync,
   rmSync,
   statSync,
 } from "node:fs";
 import { tmpdir } from "node:os";
 import { dirname, join, resolve, extname } from "node:path";
 import { basename } from "node:path";
-import { buildScripts, walkTestFiles } from "../../transpiler";
-import { parsejaiph } from "../../parser";
+import { buildScriptsFromGraph, walkTestFiles } from "../../transpiler";
+import { loadModuleGraph } from "../../transpile/module-graph";
 import { jaiphError } from "../../errors";
 import { detectWorkspaceRoot } from "../shared/paths";
-import { parseArgs } from "../shared/usage";
+import { hasHelpFlag, parseArgs } from "../shared/usage";
 import { runTestFile } from "../../runtime/kernel/node-test-runner";
 
+const TEST_USAGE =
+  "Usage: jaiph test [path]\n\n" +
+  "Run *.test.jh modules. With no path, discovers every *.test.jh under the workspace\n" +
+  "root. With a directory, runs every *.test.jh underneath (recursive). With a single\n" +
+  "*.test.jh file, runs only that file.\n\n" +
+  "  -h, --help      show this help\n\n" +
+  "Example:\n" +
+  "  jaiph test ./e2e/say_hello.test.jh\n";
+
 export async function runTest(rest: string[]): Promise<number> {
+  if (hasHelpFlag(rest)) {
+    process.stdout.write(TEST_USAGE);
+    return 0;
+  }
   const { positional } = parseArgs(rest);
   const input = positional[0];
   const runArgs = positional.slice(1);
@@ -23,8 +35,8 @@ export async function runTest(rest: string[]): Promise<number> {
     const workspaceRoot = detectWorkspaceRoot(process.cwd());
     const testFiles = walkTestFiles(workspaceRoot);
     if (testFiles.length === 0) {
-      process.stderr.write("jaiph test: no *.test.jh files found\n");
-      return 1;
+      process.stderr.write("jaiph test: no *.test.jh files found (nothing to do)\n");
+      return 0;
     }
     let exitCode = 0;
     for (const testFile of testFiles) {
@@ -41,8 +53,8 @@ export async function runTest(rest: string[]): Promise<number> {
   if (inputStat.isDirectory()) {
     const testFiles = walkTestFiles(inputAbs);
     if (testFiles.length === 0) {
-      process.stderr.write(`jaiph test: no *.test.jh files in ${input}\n`);
-      return 1;
+      process.stderr.write("jaiph test: no *.test.jh files found (nothing to do)\n");
+      return 0;
     }
     const workspaceRoot = detectWorkspaceRoot(inputAbs);
     let exitCode = 0;
@@ -76,7 +88,8 @@ export async function runSingleTestFile(
   workspaceRoot: string,
   _runArgs: string[],
 ): Promise<number> {
-  const ast = parsejaiph(readFileSync(testFileAbs, "utf8"), testFileAbs);
+  const graph = loadModuleGraph(testFileAbs, workspaceRoot);
+  const ast = graph.modules.get(graph.entryFile)!.ast;
   if (!ast.tests || ast.tests.length === 0) {
     throw jaiphError(ast.filePath, 1, 1, "E_PARSE", "test file must contain at least one test block");
   }
@@ -85,8 +98,8 @@ export async function runSingleTestFile(
   const outDir = mkdtempSync(join(tmpdir(), "jaiph-test-"));
   try {
     /** Only compile the test module and its imports — not every `.jh` under the workspace. */
-    const { scriptsDir } = buildScripts(testFileAbs, outDir, workspaceRoot);
-    return await runTestFile(testFileAbs, workspaceRoot, scriptsDir, ast.tests);
+    const { scriptsDir } = buildScriptsFromGraph(graph, outDir);
+    return await runTestFile(graph, workspaceRoot, scriptsDir, ast.tests);
   } finally {
     rmSync(outDir, { recursive: true, force: true });
   }
diff --git a/src/cli/commands/use.ts b/src/cli/commands/use.ts
index f575fad4..72f5a719 100644
--- a/src/cli/commands/use.ts
+++ b/src/cli/commands/use.ts
@@ -1,4 +1,12 @@
 import { spawnSync } from "node:child_process";
+import { hasHelpFlag } from "../shared/usage";
+
+const USE_USAGE =
+  "Usage: jaiph use <version|nightly>\n\n" +
+  "Reinstall the jaiph CLI at a specific version tag, or 'nightly'.\n\n" +
+  "  -h, --help      show this help\n\n" +
+  "Example:\n" +
+  "  jaiph use nightly\n";
 
 function toInstallRef(version: string): string | undefined {
   const trimmed = version.trim();
@@ -12,9 +20,13 @@ function toInstallRef(version: string): string | undefined {
 }
 
 export function runUse(rest: string[]): number {
+  if (hasHelpFlag(rest)) {
+    process.stdout.write(USE_USAGE);
+    return 0;
+  }
   const version = rest[0];
   if (!version) {
-    process.stderr.write("jaiph use requires a version (e.g. 0.9.4) or 'nightly'\n");
+    process.stderr.write("jaiph use requires a version (e.g. X.Y.Z) or 'nightly'\n");
     return 1;
   }
   const ref = toInstallRef(version);
diff --git a/src/cli/index.test.ts b/src/cli/index.test.ts
new file mode 100644
index 00000000..7ecdcc1b
--- /dev/null
+++ b/src/cli/index.test.ts
@@ -0,0 +1,107 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { existsSync, readFileSync } from "node:fs";
+import { dirname, join } from "node:path";
+import { main } from "./index";
+import { WORKFLOW_RUNNER_ARG } from "../runtime/kernel/node-workflow-runner";
+import { printUsage } from "./shared/usage";
+import { VERSION } from "../version";
+
+function findRepoRoot(): string {
+  let cur = __dirname;
+  while (cur !== dirname(cur)) {
+    if (existsSync(join(cur, "package.json")) && existsSync(join(cur, "tsconfig.json"))) {
+      return cur;
+    }
+    cur = dirname(cur);
+  }
+  throw new Error("could not locate repo root for version test");
+}
+
+interface StreamCapture {
+  text: string;
+  restore: () => void;
+}
+
+function captureStream(stream: NodeJS.WriteStream): StreamCapture {
+  const original = stream.write.bind(stream);
+  const buf: string[] = [];
+  (stream.write as unknown) = (chunk: string | Uint8Array): boolean => {
+    buf.push(typeof chunk === "string" ? chunk : Buffer.from(chunk).toString("utf8"));
+    return true;
+  };
+  return {
+    get text() {
+      return buf.join("");
+    },
+    restore() {
+      stream.write = original;
+    },
+  };
+}
+
+test(`main dispatches ${WORKFLOW_RUNNER_ARG} to the runner instead of falling through to "Unknown command"`, async () => {
+  const err = captureStream(process.stderr);
+  try {
+    // No positional args after the marker — runner's parser must reject this
+    // before the dispatch can route anywhere else.
+    const code = await main(["node", "cli.js", WORKFLOW_RUNNER_ARG]);
+    assert.equal(code, 1);
+  } finally {
+    err.restore();
+  }
+  assert.match(err.text, /node-workflow-runner requires meta file and source file/);
+  assert.doesNotMatch(err.text, /Unknown command/);
+});
+
+test(`printUsage never mentions the internal ${WORKFLOW_RUNNER_ARG} marker`, () => {
+  const out = captureStream(process.stdout);
+  try {
+    printUsage();
+  } finally {
+    out.restore();
+  }
+  assert.doesNotMatch(out.text, new RegExp(WORKFLOW_RUNNER_ARG));
+});
+
+test("--help output never mentions the internal __workflow-runner marker", async () => {
+  const out = captureStream(process.stdout);
+  let code: number;
+  try {
+    code = await main(["node", "cli.js", "--help"]);
+  } finally {
+    out.restore();
+  }
+  assert.equal(code, 0);
+  assert.doesNotMatch(out.text, /__workflow-runner/);
+});
+
+test("--version prints 'jaiph <version>' where <version> equals package.json", async () => {
+  const repoRoot = findRepoRoot();
+  const pkg = JSON.parse(readFileSync(join(repoRoot, "package.json"), "utf8"));
+  assert.equal(typeof pkg.version, "string");
+  assert.equal(VERSION, pkg.version, "src/version.ts VERSION drifted from package.json — rerun `npm run build` (or `npm run embed-assets`)");
+  const out = captureStream(process.stdout);
+  let code: number;
+  try {
+    code = await main(["node", "cli.js", "--version"]);
+  } finally {
+    out.restore();
+  }
+  assert.equal(code, 0);
+  assert.equal(out.text, `jaiph ${pkg.version}\n`);
+});
+
+test("-v prints the same single-sourced version as --version", async () => {
+  const repoRoot = findRepoRoot();
+  const pkg = JSON.parse(readFileSync(join(repoRoot, "package.json"), "utf8"));
+  const out = captureStream(process.stdout);
+  let code: number;
+  try {
+    code = await main(["node", "cli.js", "-v"]);
+  } finally {
+    out.restore();
+  }
+  assert.equal(code, 0);
+  assert.equal(out.text, `jaiph ${pkg.version}\n`);
+});
diff --git a/src/cli/index.ts b/src/cli/index.ts
index 3248529e..4fc3ffc1 100644
--- a/src/cli/index.ts
+++ b/src/cli/index.ts
@@ -8,15 +8,30 @@ import { runUse } from "./commands/use";
 import { runFormat } from "./commands/format";
 import { runInstall } from "./commands/install";
 import { runCompile } from "./commands/compile";
+import { runWorkflowRunner, WORKFLOW_RUNNER_ARG } from "../runtime/kernel/node-workflow-runner";
+import { VERSION } from "../version";
 
 export async function main(argv: string[]): Promise<number> {
   const [, , cmd, ...rest] = argv;
+  // Internal self-spawn dispatch: the bun-compiled binary spawns itself with
+  // `__workflow-runner` to enter the workflow leader. Must run before help,
+  // version, or file-shorthand checks so the reserved marker never leaks into
+  // user-visible paths. Excluded from `printUsage` for the same reason.
+  if (cmd === WORKFLOW_RUNNER_ARG) {
+    try {
+      return await runWorkflowRunner(rest);
+    } catch (error) {
+      const message = error instanceof Error ? error.message : String(error);
+      process.stderr.write(`jaiph node runner: ${message}\n`);
+      return 1;
+    }
+  }
   if (!cmd || cmd === "--help" || cmd === "-h") {
     printUsage();
     return 0;
   }
   if (cmd === "--version" || cmd === "-v") {
-    process.stdout.write("jaiph 0.9.4\n");
+    process.stdout.write(`jaiph ${VERSION}\n`);
     return 0;
   }
   try {
@@ -42,7 +57,7 @@ export async function main(argv: string[]): Promise<number> {
       return runFormat(rest);
     }
     if (cmd === "install") {
-      return runInstall(rest);
+      return await runInstall(rest);
     }
     if (cmd === "compile") {
       return runCompile(rest);
diff --git a/src/cli/run/display.test.ts b/src/cli/run/display.test.ts
index 0226d8b6..da8306b7 100644
--- a/src/cli/run/display.test.ts
+++ b/src/cli/run/display.test.ts
@@ -26,6 +26,15 @@ test("formatJaiphRunningBannerLines: Docker copy shows tmp workspace (no color)"
   assert.equal(s, "\nJaiph: Running say_hello.jh (Docker sandbox, tmp workspace)\n\n");
 });
 
+test("formatJaiphRunningBannerLines: Docker inplace shows live host edits, distinct from overlay/copy", () => {
+  const sInplace = formatJaiphRunningBannerLines("say_hello.jh", true, "inplace", false);
+  const sOverlay = formatJaiphRunningBannerLines("say_hello.jh", true, "overlay", false);
+  const sCopy = formatJaiphRunningBannerLines("say_hello.jh", true, "copy", false);
+  assert.equal(sInplace, "\nJaiph: Running say_hello.jh (Docker sandbox, in-place (live host edits))\n\n");
+  assert.notEqual(sInplace, sOverlay);
+  assert.notEqual(sInplace, sCopy);
+});
+
 test("formatJaiphRunningBannerLines: banner is the same in CI and locally (no obfuscation)", () => {
   const prev = process.env.CI;
   process.env.CI = "true";
diff --git a/src/cli/run/display.ts b/src/cli/run/display.ts
index 84984baf..802e7074 100644
--- a/src/cli/run/display.ts
+++ b/src/cli/run/display.ts
@@ -18,8 +18,12 @@ export function formatJaiphRunningBannerLines(
   let parenInner: string;
   if (!dockerEnabled) {
     parenInner = "no sandbox";
+  } else if (sandboxMode === "overlay") {
+    parenInner = "Docker sandbox, fusefs";
+  } else if (sandboxMode === "inplace") {
+    parenInner = "Docker sandbox, in-place (live host edits)";
   } else {
-    parenInner = sandboxMode === "overlay" ? "Docker sandbox, fusefs" : "Docker sandbox, tmp workspace";
+    parenInner = "Docker sandbox, tmp workspace";
   }
   const dimParen = colorize(` (${parenInner})`, "dim", colorEnabled);
   return `\nJaiph: Running ${fileBasename}${dimParen}\n\n`;
diff --git a/src/cli/run/env.ts b/src/cli/run/env.ts
index 687ab3bc..b5eb4b07 100644
--- a/src/cli/run/env.ts
+++ b/src/cli/run/env.ts
@@ -1,6 +1,48 @@
 import { basename, resolve } from "node:path";
 import type { JaiphConfig } from "../../config";
 
+/**
+ * Boolean sandbox flags from `jaiph run`'s CLI surface. These are an ergonomic
+ * front-end for the corresponding env vars: each flag turns the env var ON for
+ * this run only. Both enabling paths (flag or env) agree, so the env layer
+ * stays the single source of truth that `resolveDockerConfig` / `selectSandboxMode`
+ * consume — no parameter threading through the docker layer.
+ */
+export interface SandboxFlags {
+  inplace?: boolean;
+  unsafe?: boolean;
+  yes?: boolean;
+}
+
+/**
+ * Apply sandbox flags to a runtime env map by mutating it in place.
+ *
+ * Mutate the local `env` only — never `process.env`, which would leak flag
+ * choices into every child process globally. `resolveRuntimeEnv` always
+ * returns a fresh spread of `process.env`, so callers can safely mutate it.
+ *
+ * Fails fast with `E_FLAG_CONFLICT` when `--inplace` / `JAIPH_INPLACE` and
+ * `--unsafe` / `JAIPH_UNSAFE` are both truthy: one keeps the sandbox on,
+ * the other turns it off.
+ */
+export function applySandboxFlags(
+  env: Record<string, string | undefined>,
+  flags: SandboxFlags,
+): void {
+  if (flags.inplace) env.JAIPH_INPLACE = "1";
+  if (flags.unsafe) env.JAIPH_UNSAFE = "true";
+  if (flags.yes) env.JAIPH_INPLACE_YES = "1";
+
+  const inplaceOn = env.JAIPH_INPLACE === "1" || env.JAIPH_INPLACE === "true";
+  const unsafeOn = env.JAIPH_UNSAFE === "true";
+  if (inplaceOn && unsafeOn) {
+    throw new Error(
+      "E_FLAG_CONFLICT --inplace / JAIPH_INPLACE and --unsafe / JAIPH_UNSAFE are mutually exclusive: " +
+        "in-place mode keeps the sandbox on with the host workspace bind-mounted rw, while unsafe disables the sandbox entirely.",
+    );
+  }
+}
+
 const LOCKED_ENV_KEYS = [
   "JAIPH_AGENT_MODEL",
   "JAIPH_AGENT_COMMAND",
diff --git a/src/cli/run/preflight-credentials.test.ts b/src/cli/run/preflight-credentials.test.ts
new file mode 100644
index 00000000..45c5b577
--- /dev/null
+++ b/src/cli/run/preflight-credentials.test.ts
@@ -0,0 +1,454 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import {
+  preflightAgentCredentials,
+  E_AGENT_CREDENTIALS,
+} from "./preflight-credentials";
+import type {
+  jaiphModule,
+  WorkflowDef,
+  WorkflowMetadata,
+  WorkflowStepDef,
+} from "../../types";
+
+function emptyModule(filePath: string, metadata?: WorkflowMetadata): jaiphModule {
+  return {
+    filePath,
+    metadata,
+    imports: [],
+    channels: [],
+    exports: [],
+    rules: [],
+    scripts: [],
+    workflows: [],
+  };
+}
+
+function workflow(
+  name: string,
+  metadata?: WorkflowMetadata,
+  steps: WorkflowStepDef[] = [],
+): WorkflowDef {
+  return {
+    name,
+    params: [],
+    comments: [],
+    steps,
+    metadata,
+    loc: { line: 1, col: 1 },
+  };
+}
+
+/** A trivial `const r = prompt "..."` step — used to make the entry file "use prompt". */
+function promptStep(): WorkflowStepDef {
+  return {
+    type: "const",
+    name: "r",
+    value: { kind: "prompt", raw: "\"hi\"", loc: { line: 1, col: 1 } },
+    loc: { line: 1, col: 1 },
+  };
+}
+
+const ENTRY = "/proj/main.jh";
+
+/**
+ * Realistic runtimeEnv shape. `resolveRuntimeEnv` populates JAIPH_AGENT_BACKEND
+ * from module-level config when the user has not set the env var themselves, so
+ * by the time pre-flight runs the env already reflects the module-level backend.
+ */
+function envFor(moduleBackend: string | undefined, extra: Record<string, string> = {}): Record<string, string | undefined> {
+  return moduleBackend
+    ? { JAIPH_AGENT_BACKEND: moduleBackend, ...extra }
+    : { ...extra };
+}
+
+// ---------------------------------------------------------------------------
+// AC1: Docker + claude + no creds → hard error with E_AGENT_CREDENTIALS
+// ---------------------------------------------------------------------------
+
+test("claude under Docker with no creds → E_AGENT_CREDENTIALS error", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "claude" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude"),
+    dockerEnabled: true,
+  });
+  assert.equal(r.errors.length, 1);
+  assert.equal(r.warnings.length, 0);
+  assert.ok(r.errors[0].startsWith(E_AGENT_CREDENTIALS + ":"));
+  assert.ok(r.errors[0].includes("claude"));
+});
+
+// ---------------------------------------------------------------------------
+// AC2: Host + claude + no creds → warn but no error
+// ---------------------------------------------------------------------------
+
+test("claude on host with no creds → warning, no error (CLI login may work)", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "claude" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude"),
+    dockerEnabled: false,
+  });
+  assert.equal(r.errors.length, 0);
+  assert.equal(r.warnings.length, 1);
+  assert.ok(r.warnings[0].toLowerCase().includes("warning"));
+  assert.ok(r.warnings[0].includes("claude"));
+});
+
+// ---------------------------------------------------------------------------
+// Unsafe mode: the credential pre-flight is skipped entirely
+// ---------------------------------------------------------------------------
+
+test("unsafe mode (JAIPH_UNSAFE=true): claude with no creds → no warning, no error", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "claude" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude", { JAIPH_UNSAFE: "true" }),
+    dockerEnabled: false,
+  });
+  assert.equal(r.errors.length, 0);
+  assert.equal(r.warnings.length, 0);
+});
+
+test("unsafe mode (JAIPH_UNSAFE=true): codex with no OPENAI_API_KEY → no hard error", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "codex" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("codex", { JAIPH_UNSAFE: "true" }),
+    dockerEnabled: false,
+  });
+  assert.equal(r.errors.length, 0);
+  assert.equal(r.warnings.length, 0);
+});
+
+// ---------------------------------------------------------------------------
+// AC3: cursor host/Docker split + codex always-hard
+// ---------------------------------------------------------------------------
+
+test("cursor under Docker with no CURSOR_API_KEY → hard error", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "cursor" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("cursor"),
+    dockerEnabled: true,
+  });
+  assert.equal(r.errors.length, 1);
+  assert.ok(r.errors[0].includes("CURSOR_API_KEY"));
+  assert.ok(r.errors[0].startsWith(E_AGENT_CREDENTIALS + ":"));
+});
+
+test("cursor on host with no CURSOR_API_KEY → warning, no error", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "cursor" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("cursor"),
+    dockerEnabled: false,
+  });
+  assert.equal(r.errors.length, 0);
+  assert.equal(r.warnings.length, 1);
+  assert.ok(r.warnings[0].includes("CURSOR_API_KEY"));
+});
+
+test("codex on host with no OPENAI_API_KEY → hard error", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "codex" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("codex"),
+    dockerEnabled: false,
+  });
+  assert.equal(r.errors.length, 1);
+  assert.ok(r.errors[0].includes("OPENAI_API_KEY"));
+  assert.ok(r.errors[0].startsWith(E_AGENT_CREDENTIALS + ":"));
+});
+
+test("codex under Docker with no OPENAI_API_KEY → hard error", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "codex" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("codex"),
+    dockerEnabled: true,
+  });
+  assert.equal(r.errors.length, 1);
+  assert.ok(r.errors[0].includes("OPENAI_API_KEY"));
+});
+
+// ---------------------------------------------------------------------------
+// AC4: Message content — backend name, model (when set), file path, scope
+// ---------------------------------------------------------------------------
+
+test("message contains backend, model, entry file path, and 'module config' scope", () => {
+  const mod = emptyModule(ENTRY, {
+    agent: { backend: "claude", defaultModel: "sonnet-4" },
+  });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude"),
+    dockerEnabled: true,
+  });
+  const msg = r.errors[0];
+  assert.ok(msg.includes("claude"), `missing backend name: ${msg}`);
+  assert.ok(msg.includes("sonnet-4"), `missing model string: ${msg}`);
+  assert.ok(msg.includes(ENTRY), `missing entry file path: ${msg}`);
+  assert.ok(msg.includes("module config"), `missing scope label: ${msg}`);
+});
+
+test("message reports 'workflow <name>' scope when backend is set at workflow level", () => {
+  const mod = emptyModule(ENTRY);
+  mod.workflows = [
+    workflow("review", {
+      agent: { backend: "claude", defaultModel: "opus-4" },
+    }),
+  ];
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    // No module-level backend, so the env reflects the system default.
+    runtimeEnv: {},
+    dockerEnabled: true,
+  });
+  // Errors: claude (workflow review) + cursor (default, no CURSOR_API_KEY).
+  const claudeErr = r.errors.find((e) => e.includes("claude"));
+  assert.ok(claudeErr, "expected a claude error");
+  assert.ok(claudeErr.includes("opus-4"));
+  assert.ok(claudeErr.includes(ENTRY));
+  assert.ok(claudeErr.includes("workflow review"), `missing 'workflow review' scope: ${claudeErr}`);
+});
+
+test("warning message also names backend/model/file/scope", () => {
+  const mod = emptyModule(ENTRY, {
+    agent: { backend: "claude", defaultModel: "haiku-4" },
+  });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude"),
+    dockerEnabled: false,
+  });
+  const msg = r.warnings[0];
+  assert.ok(msg.includes("claude"));
+  assert.ok(msg.includes("haiku-4"));
+  assert.ok(msg.includes(ENTRY));
+  assert.ok(msg.includes("module config"));
+});
+
+test("message includes Docker forwarding remedy hint when Docker is on", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "claude" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude"),
+    dockerEnabled: true,
+  });
+  assert.ok(
+    r.errors[0].toLowerCase().includes("docker"),
+    `expected Docker remedy hint: ${r.errors[0]}`,
+  );
+});
+
+// ---------------------------------------------------------------------------
+// AC5: With creds → silent (no false positives), including single-of-two for claude
+// ---------------------------------------------------------------------------
+
+test("claude under Docker with ANTHROPIC_API_KEY only → silent", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "claude" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude", { ANTHROPIC_API_KEY: "sk-xxx" }),
+    dockerEnabled: true,
+  });
+  assert.deepEqual(r, { errors: [], warnings: [] });
+});
+
+test("claude under Docker with CLAUDE_CODE_OAUTH_TOKEN only → silent", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "claude" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude", { CLAUDE_CODE_OAUTH_TOKEN: "tok-yyy" }),
+    dockerEnabled: true,
+  });
+  assert.deepEqual(r, { errors: [], warnings: [] });
+});
+
+test("cursor with CURSOR_API_KEY set → silent (both modes)", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "cursor" } });
+  for (const dockerEnabled of [true, false]) {
+    const r = preflightAgentCredentials({
+      mod,
+      inputAbs: ENTRY,
+      runtimeEnv: envFor("cursor", { CURSOR_API_KEY: "k" }),
+      dockerEnabled,
+    });
+    assert.deepEqual(r, { errors: [], warnings: [] }, `dockerEnabled=${dockerEnabled}`);
+  }
+});
+
+test("codex on host with OPENAI_API_KEY set → silent", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "codex" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("codex", { OPENAI_API_KEY: "sk" }),
+    dockerEnabled: false,
+  });
+  assert.deepEqual(r, { errors: [], warnings: [] });
+});
+
+test("empty-value env vars do not satisfy the check", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "cursor" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("cursor", { CURSOR_API_KEY: "" }),
+    dockerEnabled: true,
+  });
+  assert.equal(r.errors.length, 1);
+});
+
+// ---------------------------------------------------------------------------
+// AC6: No in-file backend config, cursor default, host run → warn-only, no fail
+// ---------------------------------------------------------------------------
+
+test("no backend, no prompt — silent (no false positives, contract holds)", () => {
+  // AC: "A workflow with no `prompt` step / no agent backend configured beyond
+  // the default and `cursor` default on host does not hard-fail solely due to a
+  // missing key (host warn-only contract holds)." No errors, no warnings either —
+  // the pre-flight skips entirely when nothing demands credentials.
+  const mod = emptyModule(ENTRY);
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: {},
+    dockerEnabled: false,
+  });
+  assert.equal(r.errors.length, 0, `expected no hard errors, got: ${r.errors.join("\n")}`);
+  assert.equal(r.warnings.length, 0);
+});
+
+test("no agent.backend configured, cursor default on host, no CURSOR_API_KEY, prompt used → warn only", () => {
+  // When the workflow actually uses prompt, the warn-only contract activates.
+  const mod = emptyModule(ENTRY);
+  mod.workflows = [workflow("default", undefined, [promptStep()])];
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: {},
+    dockerEnabled: false,
+  });
+  assert.equal(r.errors.length, 0, `expected no hard errors, got: ${r.errors.join("\n")}`);
+  assert.equal(r.warnings.length, 1);
+  assert.ok(r.warnings[0].includes("cursor"));
+});
+
+test("no agent.backend configured, cursor default on host, CURSOR_API_KEY set, prompt used → silent", () => {
+  const mod = emptyModule(ENTRY);
+  mod.workflows = [workflow("default", undefined, [promptStep()])];
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: { CURSOR_API_KEY: "k" },
+    dockerEnabled: false,
+  });
+  assert.deepEqual(r, { errors: [], warnings: [] });
+});
+
+test("explicit backend in config but no prompt step → still checks (user committed to backend)", () => {
+  // AC1 envisions a workflow whose entry file sets `agent.backend = "claude"`.
+  // Even if no prompt step exists, the explicit declaration is a commitment
+  // we honor by running the check.
+  const mod = emptyModule(ENTRY, { agent: { backend: "claude" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude"),
+    dockerEnabled: true,
+  });
+  assert.equal(r.errors.length, 1);
+  assert.ok(r.errors[0].includes("claude"));
+});
+
+// ---------------------------------------------------------------------------
+// AC7: Pre-flight checks post-forwarding env (non-allowlisted vars treated as missing)
+// ---------------------------------------------------------------------------
+
+test("codex under Docker: OPENAI_API_KEY present on host but not allowlisted → treated as missing", () => {
+  // OPENAI_API_KEY is not on the ENV_ALLOW_PREFIXES list, so isEnvAllowed
+  // strips it before forwarding. The pre-flight must mirror that.
+  const mod = emptyModule(ENTRY, { agent: { backend: "codex" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("codex", { OPENAI_API_KEY: "sk-set-on-host" }),
+    dockerEnabled: true,
+  });
+  assert.equal(r.errors.length, 1);
+  assert.ok(r.errors[0].includes("OPENAI_API_KEY"));
+});
+
+test("codex on host: OPENAI_API_KEY present → silent (no allowlist filter outside Docker)", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "codex" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("codex", { OPENAI_API_KEY: "sk-set-on-host" }),
+    dockerEnabled: false,
+  });
+  assert.deepEqual(r, { errors: [], warnings: [] });
+});
+
+test("claude under Docker: ANTHROPIC_API_KEY is allowlisted (ANTHROPIC_ prefix)", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "claude" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude", { ANTHROPIC_API_KEY: "sk" }),
+    dockerEnabled: true,
+  });
+  assert.deepEqual(r, { errors: [], warnings: [] });
+});
+
+// ---------------------------------------------------------------------------
+// Distinct backends in entry file: each gets its own check
+// ---------------------------------------------------------------------------
+
+test("module-level claude + workflow-level cursor under Docker → claude and cursor errors", () => {
+  const mod = emptyModule(ENTRY, { agent: { backend: "claude" } });
+  mod.workflows = [
+    workflow("legacy", { agent: { backend: "cursor" } }),
+  ];
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude"),
+    dockerEnabled: true,
+  });
+  // claude (module config) + cursor (workflow legacy).
+  assert.equal(r.errors.length, 2);
+  const joined = r.errors.join("\n");
+  assert.ok(joined.includes("claude") && joined.includes("module config"));
+  assert.ok(joined.includes("cursor") && joined.includes("workflow legacy"));
+});
+
+test("module config matches the effective env default → no duplicate check", () => {
+  // realistic flow: resolveRuntimeEnv sets JAIPH_AGENT_BACKEND from module config,
+  // so module-level "claude" and the default backend resolve to the same value.
+  const mod = emptyModule(ENTRY, { agent: { backend: "claude" } });
+  const r = preflightAgentCredentials({
+    mod,
+    inputAbs: ENTRY,
+    runtimeEnv: envFor("claude"),
+    dockerEnabled: true,
+  });
+  assert.equal(r.errors.length, 1, `expected exactly one error, got: ${r.errors.join("\n")}`);
+});
diff --git a/src/cli/run/preflight-credentials.ts b/src/cli/run/preflight-credentials.ts
new file mode 100644
index 00000000..c4f8d177
--- /dev/null
+++ b/src/cli/run/preflight-credentials.ts
@@ -0,0 +1,238 @@
+import type {
+  CatchBody,
+  Expr,
+  jaiphModule,
+  WorkflowStepDef,
+} from "../../types";
+import { isEnvAllowed } from "../../runtime/docker";
+
+export const E_AGENT_CREDENTIALS = "E_AGENT_CREDENTIALS";
+
+type Backend = "cursor" | "claude" | "codex";
+
+interface BackendUsage {
+  backend: Backend;
+  /** Human-readable scope: "module config" | "workflow <name>" | "default" | "JAIPH_AGENT_BACKEND env". */
+  scope: string;
+  /** Model from the same scope, falling back to module-level model. */
+  model?: string;
+}
+
+export interface PreflightResult {
+  errors: string[];
+  warnings: string[];
+}
+
+export interface PreflightArgs {
+  mod: jaiphModule;
+  inputAbs: string;
+  runtimeEnv: Record<string, string | undefined>;
+  dockerEnabled: boolean;
+}
+
+/**
+ * Collect each distinct backend declared in the entry file plus the effective
+ * default backend. Order: module-level (if set), workflow-level (in source order,
+ * skipping duplicates), then the effective default (skipped if already seen).
+ *
+ * Deeper per-import-module backend overrides resolved at runtime are out of scope
+ * here — entry-file scan is the documented contract for this pre-flight.
+ */
+function collectBackendUsages(
+  mod: jaiphModule,
+  runtimeEnv: Record<string, string | undefined>,
+): BackendUsage[] {
+  const seen = new Map<Backend, BackendUsage>();
+  const moduleBackend = mod.metadata?.agent?.backend;
+  const moduleModel = mod.metadata?.agent?.defaultModel;
+  if (moduleBackend) {
+    seen.set(moduleBackend, {
+      backend: moduleBackend,
+      scope: "module config",
+      model: moduleModel,
+    });
+  }
+  for (const wf of mod.workflows) {
+    const wfBackend = wf.metadata?.agent?.backend;
+    if (!wfBackend || seen.has(wfBackend)) continue;
+    const wfModel = wf.metadata?.agent?.defaultModel ?? moduleModel;
+    seen.set(wfBackend, {
+      backend: wfBackend,
+      scope: `workflow ${wf.name}`,
+      model: wfModel,
+    });
+  }
+  const envBackendRaw = runtimeEnv.JAIPH_AGENT_BACKEND;
+  const defaultBackend = (envBackendRaw || "cursor") as Backend;
+  if (!seen.has(defaultBackend)) {
+    const scope = envBackendRaw ? "JAIPH_AGENT_BACKEND env" : "default";
+    seen.set(defaultBackend, { backend: defaultBackend, scope, model: moduleModel });
+  }
+  return [...seen.values()];
+}
+
+/**
+ * True when `key` is set to a non-empty value in the env that will actually
+ * reach the agent. When Docker is on, the host-side allowlist (`isEnvAllowed`)
+ * runs first — a credential present on the host but not on the allowlist is
+ * treated as missing because the container will never see it.
+ */
+function hasCredential(
+  env: Record<string, string | undefined>,
+  key: string,
+  dockerEnabled: boolean,
+): boolean {
+  if (dockerEnabled && !isEnvAllowed(key)) return false;
+  const v = env[key];
+  return typeof v === "string" && v.length > 0;
+}
+
+function formatHeader(usage: BackendUsage, inputAbs: string): string {
+  const modelPart = usage.model ? ` (model "${usage.model}")` : "";
+  return `agent.backend "${usage.backend}"${modelPart} selected by ${usage.scope} in ${inputAbs}`;
+}
+
+function dockerSuffix(dockerEnabled: boolean): string {
+  return dockerEnabled
+    ? " (Docker is on — set the env var on the host so it is forwarded into the container.)"
+    : "";
+}
+
+function checkClaude(
+  usage: BackendUsage,
+  args: PreflightArgs,
+  out: PreflightResult,
+): void {
+  const ok =
+    hasCredential(args.runtimeEnv, "ANTHROPIC_API_KEY", args.dockerEnabled) ||
+    hasCredential(args.runtimeEnv, "CLAUDE_CODE_OAUTH_TOKEN", args.dockerEnabled);
+  if (ok) return;
+  const header = formatHeader(usage, args.inputAbs);
+  const remedy =
+    "Run `claude setup-token` and export CLAUDE_CODE_OAUTH_TOKEN, or set ANTHROPIC_API_KEY.";
+  if (args.dockerEnabled) {
+    out.errors.push(
+      `${E_AGENT_CREDENTIALS}: ${header} — neither ANTHROPIC_API_KEY nor CLAUDE_CODE_OAUTH_TOKEN is set. ${remedy}${dockerSuffix(true)}`,
+    );
+  } else {
+    out.warnings.push(
+      `jaiph: warning: ${header} — neither ANTHROPIC_API_KEY nor CLAUDE_CODE_OAUTH_TOKEN is set. ${remedy} A stored Claude CLI login may still work.`,
+    );
+  }
+}
+
+function checkCursor(
+  usage: BackendUsage,
+  args: PreflightArgs,
+  out: PreflightResult,
+): void {
+  if (hasCredential(args.runtimeEnv, "CURSOR_API_KEY", args.dockerEnabled)) return;
+  const header = formatHeader(usage, args.inputAbs);
+  const remedy =
+    "Set CURSOR_API_KEY (or run `cursor-agent login` for host runs).";
+  if (args.dockerEnabled) {
+    out.errors.push(
+      `${E_AGENT_CREDENTIALS}: ${header} — CURSOR_API_KEY is not set. ${remedy}${dockerSuffix(true)}`,
+    );
+  } else {
+    out.warnings.push(
+      `jaiph: warning: ${header} — CURSOR_API_KEY is not set. ${remedy} A stored cursor-agent login may still work.`,
+    );
+  }
+}
+
+function checkCodex(
+  usage: BackendUsage,
+  args: PreflightArgs,
+  out: PreflightResult,
+): void {
+  if (hasCredential(args.runtimeEnv, "OPENAI_API_KEY", args.dockerEnabled)) return;
+  const header = formatHeader(usage, args.inputAbs);
+  const remedy = "Set OPENAI_API_KEY to your OpenAI API key.";
+  out.errors.push(
+    `${E_AGENT_CREDENTIALS}: ${header} — OPENAI_API_KEY is not set. ${remedy}${dockerSuffix(args.dockerEnabled)}`,
+  );
+}
+
+function exprIsPrompt(e: Expr): boolean {
+  return e.kind === "prompt";
+}
+
+function catchBodyHasPrompt(c: CatchBody): boolean {
+  if ("single" in c) return stepHasPrompt(c.single);
+  return c.block.some(stepHasPrompt);
+}
+
+function stepHasPrompt(s: WorkflowStepDef): boolean {
+  switch (s.type) {
+    case "exec":
+      if (exprIsPrompt(s.body)) return true;
+      if (s.catch && catchBodyHasPrompt(s.catch)) return true;
+      if (s.recover && catchBodyHasPrompt(s.recover)) return true;
+      return false;
+    case "const":
+      return exprIsPrompt(s.value);
+    case "return":
+      return exprIsPrompt(s.value);
+    case "send":
+      return exprIsPrompt(s.value);
+    case "say":
+      return exprIsPrompt(s.message);
+    case "if":
+      return s.body.some(stepHasPrompt) || (s.elseBody?.some(stepHasPrompt) ?? false);
+    case "for_lines":
+      return s.body.some(stepHasPrompt);
+    case "trivia":
+      return false;
+  }
+}
+
+/** True when any workflow or rule in the entry file contains a `prompt` step. */
+function entryFileUsesPrompt(mod: jaiphModule): boolean {
+  for (const wf of mod.workflows) {
+    if (wf.steps.some(stepHasPrompt)) return true;
+  }
+  for (const rule of mod.rules) {
+    if (rule.steps.some(stepHasPrompt)) return true;
+  }
+  return false;
+}
+
+/** True when the entry file declares an agent backend at any config scope. */
+function entryFileHasExplicitBackend(mod: jaiphModule): boolean {
+  if (mod.metadata?.agent?.backend) return true;
+  return mod.workflows.some((wf) => Boolean(wf.metadata?.agent?.backend));
+}
+
+/**
+ * Host-side credential check, keyed to the backend(s) the entry file selects.
+ *
+ * Rules per task spec:
+ *  - codex   → hard error on host AND Docker (no CLI-login fallback).
+ *  - claude  → Docker: hard error; host: warn only (stored CLI login may work).
+ *  - cursor  → Docker: hard error; host: warn only.
+ *
+ * Skip entirely when the entry file neither declares an explicit backend nor
+ * uses any `prompt` step — there is nothing the runtime would credential against,
+ * so a warning would be a false positive.
+ *
+ * Also skip entirely in unsafe mode (`JAIPH_UNSAFE` / `--unsafe`): that is the
+ * explicit "run on the host, trust my environment" escape hatch, so neither the
+ * host warnings nor the codex hard error should fire — a logged-in agent CLI
+ * works, and the runtime backend guards remain as a backstop.
+ */
+export function preflightAgentCredentials(args: PreflightArgs): PreflightResult {
+  const out: PreflightResult = { errors: [], warnings: [] };
+  if (args.runtimeEnv.JAIPH_UNSAFE === "true") {
+    return out;
+  }
+  if (!entryFileHasExplicitBackend(args.mod) && !entryFileUsesPrompt(args.mod)) {
+    return out;
+  }
+  for (const usage of collectBackendUsages(args.mod, args.runtimeEnv)) {
+    if (usage.backend === "codex") checkCodex(usage, args, out);
+    else if (usage.backend === "claude") checkClaude(usage, args, out);
+    else if (usage.backend === "cursor") checkCursor(usage, args, out);
+  }
+  return out;
+}
diff --git a/src/cli/run/progress.test.ts b/src/cli/run/progress.test.ts
index 92ab843a..6b29c01c 100644
--- a/src/cli/run/progress.test.ts
+++ b/src/cli/run/progress.test.ts
@@ -11,19 +11,15 @@ import {
   styleYellow,
   styleBold,
 } from "./progress";
-import type { jaiphModule } from "../../types";
-
-function minimalModule(overrides?: Partial<jaiphModule>): jaiphModule {
-  return {
-    filePath: "test.jh",
-    imports: [],
-    channels: [],
-    exports: [],
-    rules: [],
-    scripts: [],
-    workflows: [],
-    ...overrides,
-  };
+import { parsejaiph } from "../../parser";
+
+/**
+ * Fixtures are built by parsing real Jaiph source so test data flows through
+ * the same producer as production — no hand-written AST shapes to keep in
+ * sync with the type definitions.
+ */
+function modFor(source: string) {
+  return parsejaiph(source, "test.jh");
 }
 
 // --- parseLabel ---
@@ -71,22 +67,21 @@ test("formatElapsedDuration: handles sub-second", () => {
 // --- collectWorkflowChildren ---
 
 test("collectWorkflowChildren: returns empty for unknown workflow", () => {
-  const mod = minimalModule();
+  const mod = modFor(`workflow default() {
+  log "hi"
+}`);
   assert.deepStrictEqual(collectWorkflowChildren(mod, "missing"), []);
 });
 
-test("collectWorkflowChildren: collects run steps", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run", workflow: { value: "deploy", loc: { line: 2, col: 3 } } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+test("collectWorkflowChildren: collects run step as workflow row", () => {
+  const mod = modFor([
+    "workflow default() {",
+    "  run deploy()",
+    "}",
+    "workflow deploy() {",
+    "  log \"d\"",
+    "}",
+  ].join("\n"));
   const items = collectWorkflowChildren(mod, "default");
   assert.equal(items.length, 1);
   assert.equal(items[0].label, "workflow deploy");
@@ -94,1407 +89,175 @@ test("collectWorkflowChildren: collects run steps", () => {
 });
 
 test("collectWorkflowChildren: collects async run with prefix", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run", workflow: { value: "bg_task", loc: { line: 2, col: 3 } }, async: true },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items[0].label, "async workflow bg_task");
-});
-
-test("collectWorkflowChildren: collects ensure steps", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "ensure", ref: { value: "check_passes", loc: { line: 2, col: 3 } } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 1);
-  assert.equal(items[0].label, "rule check_passes");
-});
-
-test("collectWorkflowChildren: collects prompt steps", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "prompt", raw: 'prompt "hello world"', loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 1);
-  assert.match(items[0].label, /^prompt "hello world"/);
-});
-
-test("collectWorkflowChildren: collects log steps", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "log", message: "starting", loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items[0].label, "ℹ starting");
-});
-
-test("collectWorkflowChildren: collects logerr steps", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "logerr", message: "bad thing", loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items[0].label, "! bad thing");
-});
-
-test("collectWorkflowChildren: collects send steps", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "send", channel: "notify", rhs: { kind: "literal", token: "hello" }, loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items[0].label, "notify <- send");
-});
-
-test("collectWorkflowChildren: collects fail steps", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "fail", message: "broken", loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items[0].label, "fail broken");
-});
-
-test("collectWorkflowChildren: collects const steps", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "const", name: "x", value: { kind: "expr", bashRhs: "1" }, loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items[0].label, "const x");
-});
-
-
-test("collectWorkflowChildren: collects return steps", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "return", value: '"done"', loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+  const mod = modFor([
+    "workflow default() {",
+    "  run async deploy()",
+    "}",
+    "workflow deploy() {",
+    "  log \"d\"",
+    "}",
+  ].join("\n"));
   const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items[0].label, 'return "done"');
-});
-
-test("collectWorkflowChildren: collects shell steps with truncation", () => {
-  const longCmd = "a".repeat(60);
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "shell", command: longCmd, loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.match(items[0].label, /^\$ .{53}\.\.\./);
-});
-
-test("collectWorkflowChildren: skips comment steps", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "comment", text: "# note", loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 0);
-});
-
-test("collectWorkflowChildren: collects channel-level route declarations", () => {
-  const mod = minimalModule({
-    channels: [{
-      name: "events",
-      routes: [
-        { value: "handler1", loc: { line: 1, col: 20 } },
-        { value: "handler2", loc: { line: 1, col: 30 } },
-      ],
-      loc: { line: 1, col: 9 },
-    }],
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [],
-      loc: { line: 3, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 1);
-  assert.equal(items[0].label, "events -> handler1, handler2");
-});
-
-// --- buildRunTreeRows ---
-
-test("buildRunTreeRows: root row is first", () => {
-  const mod = minimalModule({
-    workflows: [{ name: "default", comments: [], params: [], steps: [], loc: { line: 1, col: 1 } }],
-  });
-  const rows = buildRunTreeRows(mod);
-  assert.equal(rows.length, 1);
-  assert.equal(rows[0].rawLabel, "workflow default");
-  assert.equal(rows[0].isRoot, true);
-});
-
-test("buildRunTreeRows: includes nested steps", () => {
-  const mod = minimalModule({
-    workflows: [
-      {
-        name: "default",
-        comments: [],
-        params: [],
-        steps: [
-          { type: "run", workflow: { value: "sub", loc: { line: 2, col: 3 } } },
-        ],
-        loc: { line: 1, col: 1 },
-      },
-      {
-        name: "sub",
-        comments: [],
-        params: [],
-        steps: [
-          { type: "log", message: "hello", loc: { line: 5, col: 3 } },
-        ],
-        loc: { line: 4, col: 1 },
-      },
-    ],
-  });
-  const rows = buildRunTreeRows(mod);
-  assert.equal(rows.length, 3);
-  assert.equal(rows[0].rawLabel, "workflow default");
-  assert.equal(rows[1].rawLabel, "workflow sub");
-  assert.equal(rows[2].rawLabel, "ℹ hello");
-});
-
-test("buildRunTreeRows: does not re-expand visited workflows", () => {
-  const mod = minimalModule({
-    workflows: [
-      {
-        name: "default",
-        comments: [],
-        params: [],
-        steps: [
-          { type: "run", workflow: { value: "shared", loc: { line: 2, col: 3 } } },
-          { type: "run", workflow: { value: "other", loc: { line: 3, col: 3 } } },
-        ],
-        loc: { line: 1, col: 1 },
-      },
-      {
-        name: "shared",
-        comments: [],
-        params: [],
-        steps: [
-          { type: "log", message: "in shared", loc: { line: 6, col: 3 } },
-        ],
-        loc: { line: 5, col: 1 },
-      },
-      {
-        name: "other",
-        comments: [],
-        params: [],
-        steps: [
-          { type: "run", workflow: { value: "shared", loc: { line: 9, col: 3 } } },
-        ],
-        loc: { line: 8, col: 1 },
-      },
-    ],
-  });
-  const rows = buildRunTreeRows(mod);
-  const sharedRows = rows.filter((r) => r.rawLabel === "workflow shared");
-  // "shared" appears twice in the tree (once expanded, once not re-expanded)
-  assert.equal(sharedRows.length, 2);
-  // But "in shared" log only appears once (not re-expanded from "other")
-  const logRows = rows.filter((r) => r.rawLabel === "ℹ in shared");
-  assert.equal(logRows.length, 1);
-});
-
-// --- formatElapsedDuration (additional) ---
-
-test("formatElapsedDuration: zero milliseconds", () => {
-  assert.equal(formatElapsedDuration(0), "0s");
-});
-
-test("formatElapsedDuration: sub-second precision", () => {
-  assert.equal(formatElapsedDuration(50), "0.1s");
-  assert.equal(formatElapsedDuration(999), "1s");
-});
-
-// --- formatRunningBottomLine ---
-
-test("formatRunningBottomLine: contains RUNNING and workflow name", () => {
-  // In non-TTY test env, style functions return plain text
-  const result = formatRunningBottomLine("default", 1.5);
-  assert.ok(result.includes("RUNNING"), "should contain RUNNING");
-  assert.ok(result.includes("workflow"), "should contain 'workflow'");
-  assert.ok(result.includes("default"), "should contain workflow name");
-  assert.ok(result.includes("1.5s"), "should contain elapsed time");
-});
-
-test("formatRunningBottomLine: formats elapsed with one decimal", () => {
-  const result = formatRunningBottomLine("deploy", 10.0);
-  assert.ok(result.includes("10.0s"), "should show one decimal place");
-});
-
-// --- collectWorkflowChildren: catch blocks ---
-
-test("collectWorkflowChildren: run step with single catch includes recovery items", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        {
-          type: "run",
-          workflow: { value: "deploy", loc: { line: 2, col: 3 } },
-          catch: {
-            single: { type: "log", message: "recovering", loc: { line: 3, col: 5 } },
-            bindings: { failure: "err" },
-          },
-        },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+  assert.equal(items[0].label, "async workflow deploy");
+});
+
+test("collectWorkflowChildren: collects ensure step as rule row", () => {
+  const mod = modFor([
+    "rule gate() {",
+    "  return \"ok\"",
+    "}",
+    "workflow default() {",
+    "  ensure gate()",
+    "}",
+  ].join("\n"));
   const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 2);
-  assert.equal(items[0].label, "workflow deploy");
-  assert.equal(items[1].label, "ℹ recovering");
+  assert.equal(items[0].label, "rule gate");
 });
 
-test("collectWorkflowChildren: run step with block catch includes all recovery items", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        {
-          type: "run",
-          workflow: { value: "deploy", loc: { line: 2, col: 3 } },
-          catch: {
-            block: [
-              { type: "log", message: "retrying", loc: { line: 3, col: 5 } },
-              { type: "run", workflow: { value: "fallback", loc: { line: 4, col: 5 } } },
-            ],
-            bindings: { failure: "err" },
-          },
-        },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+test("collectWorkflowChildren: collects prompt step with preview", () => {
+  const mod = modFor([
+    "workflow default() {",
+    '  prompt "Pick one"',
+    "}",
+  ].join("\n"));
   const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 3);
-  assert.equal(items[0].label, "workflow deploy");
-  assert.equal(items[1].label, "ℹ retrying");
-  assert.equal(items[2].label, "workflow fallback");
+  assert.equal(items[0].label, 'prompt "Pick one"');
 });
 
-test("collectWorkflowChildren: ensure step with single catch includes recovery items", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        {
-          type: "ensure",
-          ref: { value: "check", loc: { line: 2, col: 3 } },
-          catch: {
-            single: { type: "run", workflow: { value: "fix_it", loc: { line: 3, col: 5 } } },
-            bindings: { failure: "err" },
-          },
-        },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+test("collectWorkflowChildren: collects log / logerr / fail (say) rows", () => {
+  const mod = modFor([
+    "workflow default() {",
+    '  log "ok"',
+    '  logerr "err"',
+    '  fail "boom"',
+    "}",
+  ].join("\n"));
   const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 2);
-  assert.equal(items[0].label, "rule check");
-  assert.equal(items[1].label, "workflow fix_it");
-});
-
-test("collectWorkflowChildren: ensure step with block catch includes all recovery items", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        {
-          type: "ensure",
-          ref: { value: "check", loc: { line: 2, col: 3 } },
-          catch: {
-            block: [
-              { type: "log", message: "check failed", loc: { line: 3, col: 5 } },
-              { type: "fail", message: "unrecoverable", loc: { line: 4, col: 5 } },
-            ],
-            bindings: { failure: "err" },
-          },
-        },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+  assert.ok(items.some((i) => i.label.startsWith("ℹ ")));
+  assert.ok(items.some((i) => i.label.startsWith("! ")));
+  assert.ok(items.some((i) => i.label.startsWith("fail ")));
+});
+
+test("collectWorkflowChildren: collects send step", () => {
+  const mod = modFor([
+    "channel ch",
+    "workflow default() {",
+    '  ch <- "hi"',
+    "}",
+  ].join("\n"));
   const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 3);
-  assert.equal(items[0].label, "rule check");
-  assert.equal(items[1].label, "ℹ check failed");
-  assert.equal(items[2].label, "fail unrecoverable");
-});
-
-// --- buildRunTreeRows: self-recursive workflows ---
-
-test("buildRunTreeRows: self-recursive workflow expands limited depth", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "log", message: "iteration", loc: { line: 2, col: 3 } },
-        { type: "run", workflow: { value: "default", loc: { line: 3, col: 3 } } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const rows = buildRunTreeRows(mod);
-  // Should have root + children, with limited recursion (not infinite)
-  assert.ok(rows.length >= 3, "should expand self-recursive workflow at least once");
-  assert.ok(rows.length < 50, "should not expand infinitely");
-  // First row is root
-  assert.equal(rows[0].rawLabel, "workflow default");
-  assert.equal(rows[0].isRoot, true);
-  // Should contain "ℹ iteration" at least once
-  const logRows = rows.filter((r) => r.rawLabel === "ℹ iteration");
-  assert.ok(logRows.length >= 1, "should show log from recursive workflow");
-});
-
-test("buildRunTreeRows: workflow with two self-recursive sites", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run", workflow: { value: "default", loc: { line: 2, col: 3 } } },
-        { type: "log", message: "middle", loc: { line: 3, col: 3 } },
-        { type: "run", workflow: { value: "default", loc: { line: 4, col: 3 } } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const rows = buildRunTreeRows(mod);
-  // Should terminate without infinite expansion
-  assert.ok(rows.length >= 3, "should produce tree rows");
-  assert.ok(rows.length < 100, "should not expand infinitely");
+  assert.ok(items.some((i) => i.label === "ch <- send"));
 });
 
-// --- collectWorkflowChildren: match_expr with run/ensure arms ---
-
-test("collectWorkflowChildren: const with match_expr containing run arm", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        {
-          type: "const",
-          name: "result",
-          value: {
-            kind: "match_expr",
-            match: {
-              subject: "x",
-              arms: [
-                { pattern: { kind: "string_literal", value: "a" }, body: 'run deploy("a")' },
-                { pattern: { kind: "wildcard" }, body: '"fallback"' },
-              ],
-              loc: { line: 3, col: 10 },
-            },
-          },
-          loc: { line: 3, col: 3 },
-        },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+test("collectWorkflowChildren: collects const and return rows", () => {
+  const mod = modFor([
+    "workflow default() {",
+    '  const x = "hi"',
+    "  return x",
+    "}",
+  ].join("\n"));
   const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 2);
-  assert.equal(items[0].label, "const result");
-  assert.equal(items[1].label, "workflow deploy");
-  assert.equal(items[1].nested, "deploy");
+  assert.ok(items.some((i) => i.label === "const x"));
+  assert.ok(items.some((i) => i.label.startsWith("return ")));
 });
 
-test("collectWorkflowChildren: const with match_expr containing ensure arm", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        {
-          type: "const",
-          name: "status",
-          value: {
-            kind: "match_expr",
-            match: {
-              subject: "x",
-              arms: [
-                { pattern: { kind: "string_literal", value: "check" }, body: 'ensure gate()' },
-                { pattern: { kind: "wildcard" }, body: '"skip"' },
-              ],
-              loc: { line: 3, col: 10 },
-            },
-          },
-          loc: { line: 3, col: 3 },
-        },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+test("collectWorkflowChildren: collects inline script as 'script (inline)'", () => {
+  const mod = modFor([
+    "workflow default() {",
+    "  run `echo hi`()",
+    "}",
+  ].join("\n"));
   const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 2);
-  assert.equal(items[0].label, "const status");
-  assert.equal(items[1].label, "rule gate");
-  assert.equal(items[1].nested, "gate");
+  assert.ok(items.some((i) => i.label === "script (inline)"));
 });
 
-test("collectWorkflowChildren: const with match_expr arm with no run/ensure", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        {
-          type: "const",
-          name: "val",
-          value: {
-            kind: "match_expr",
-            match: {
-              subject: "x",
-              arms: [
-                { pattern: { kind: "string_literal", value: "a" }, body: '"hello"' },
-                { pattern: { kind: "wildcard" }, body: '"default"' },
-              ],
-              loc: { line: 3, col: 10 },
-            },
-          },
-          loc: { line: 3, col: 3 },
-        },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+test("collectWorkflowChildren: collects shell step with $ prefix", () => {
+  const mod = modFor([
+    "workflow default() {",
+    "  echo hello",
+    "}",
+  ].join("\n"));
   const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 1);
-  assert.equal(items[0].label, "const val");
+  assert.ok(items.some((i) => i.label.startsWith("$ ")));
 });
 
-// --- collectWorkflowChildren: run_inline_script ---
-
-test("collectWorkflowChildren: collects run_inline_script steps", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run_inline_script", body: "echo hello", loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+test("collectWorkflowChildren: skips trivia (comments / blank lines)", () => {
+  const mod = modFor([
+    "workflow default() {",
+    "  # comment",
+    "",
+    '  log "hi"',
+    "}",
+  ].join("\n"));
   const items = collectWorkflowChildren(mod, "default");
   assert.equal(items.length, 1);
-  assert.equal(items[0].label, "script (inline)");
-});
-
-// --- buildRunTreeRows: prefix/indentation ---
-
-test("buildRunTreeRows: grandchild rows are more indented than children", () => {
-  const mod = minimalModule({
-    workflows: [
-      {
-        name: "default",
-        comments: [],
-        params: [],
-        steps: [
-          { type: "run", workflow: { value: "sub", loc: { line: 2, col: 3 } } },
-        ],
-        loc: { line: 1, col: 1 },
-      },
-      {
-        name: "sub",
-        comments: [],
-        params: [],
-        steps: [
-          { type: "log", message: "hello", loc: { line: 5, col: 3 } },
-        ],
-        loc: { line: 4, col: 1 },
-      },
-    ],
-  });
-  const rows = buildRunTreeRows(mod);
-  // Root and direct children share empty prefix; grandchildren are indented
-  assert.equal(rows[0].prefix, "", "root should have empty prefix");
-  assert.equal(rows[1].prefix, "", "direct child inherits root prefix");
-  assert.ok(rows[2].prefix.length > rows[1].prefix.length, "grandchild should be more indented than child");
-});
-
-// --- buildRunTreeRows: cross-module imported workflows ---
-
-test("buildRunTreeRows: cross-module workflows are expanded from importedModules", () => {
-  const mainMod = minimalModule({
-    imports: [{ path: "lib.jh", alias: "lib", loc: { line: 1, col: 1 } }],
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run", workflow: { value: "lib.greet", loc: { line: 3, col: 3 } } },
-      ],
-      loc: { line: 2, col: 1 },
-    }],
-  });
-  const libMod = minimalModule({
-    filePath: "lib.jh",
-    workflows: [{
-      name: "greet",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "log", message: "hello from lib", loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const importedModules = new Map([["lib", libMod]]);
-  const rows = buildRunTreeRows(mainMod, undefined, importedModules);
-  // Should contain the imported workflow's children
-  const libLogRows = rows.filter((r) => r.rawLabel === "ℹ hello from lib");
-  assert.equal(libLogRows.length, 1, "should expand imported workflow children");
-});
-
-// --- formatElapsedDuration: exact boundary ---
-
-test("formatElapsedDuration: exactly 60000ms uses minute format", () => {
-  assert.equal(formatElapsedDuration(60000), "1m 0s");
-});
-
-test("formatElapsedDuration: just under 60000ms uses seconds format", () => {
-  assert.equal(formatElapsedDuration(59999), "60s");
-});
-
-// --- collectWorkflowChildren: stepFunc with symbols ---
-
-test("collectWorkflowChildren: run step with dotted ref populates stepFunc from symbols", () => {
-  const mod = minimalModule({
-    imports: [{ path: "lib.jh", alias: "lib", loc: { line: 1, col: 1 } }],
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run", workflow: { value: "lib.deploy", loc: { line: 3, col: 3 } } },
-      ],
-      loc: { line: 2, col: 1 },
-    }],
-  });
-  const symbols = new Map([["lib", "mylib"]]);
-  const items = collectWorkflowChildren(mod, "default", symbols);
-  assert.equal(items.length, 1);
-  assert.equal(items[0].stepFunc, "mylib::deploy");
-});
-
-test("collectWorkflowChildren: run step with dotted ref falls back to alias when symbol missing", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run", workflow: { value: "lib.deploy", loc: { line: 2, col: 3 } } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const symbols = new Map<string, string>();
-  const items = collectWorkflowChildren(mod, "default", symbols);
-  assert.equal(items[0].stepFunc, "lib::deploy");
-});
-
-test("collectWorkflowChildren: run step with currentSymbol populates stepFunc", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run", workflow: { value: "helper", loc: { line: 2, col: 3 } } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default", undefined, "main_mod");
-  assert.equal(items[0].stepFunc, "main_mod::helper");
-});
-
-test("collectWorkflowChildren: ensure step with dotted ref populates stepFunc from symbols", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "ensure", ref: { value: "lib.check", loc: { line: 2, col: 3 } } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const symbols = new Map([["lib", "mylib"]]);
-  const items = collectWorkflowChildren(mod, "default", symbols);
-  assert.equal(items[0].stepFunc, "mylib::check");
-});
-
-test("collectWorkflowChildren: ensure step with currentSymbol populates stepFunc", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "ensure", ref: { value: "gate", loc: { line: 2, col: 3 } } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default", undefined, "main_mod");
-  assert.equal(items[0].stepFunc, "main_mod::gate");
-});
-
-test("collectWorkflowChildren: prompt step always has jaiph::prompt stepFunc", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "prompt", raw: 'prompt "test"', loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+  assert.ok(items[0].label.startsWith("ℹ "));
+});
+
+test("collectWorkflowChildren: const = match expression walks arms for run/ensure targets", () => {
+  const mod = modFor([
+    "rule gate() {",
+    "  return \"ok\"",
+    "}",
+    "workflow other() {",
+    "  log \"o\"",
+    "}",
+    "workflow default(name) {",
+    "  const result = match name {",
+    '    "x" => run other()',
+    '    _ => ensure gate()',
+    "  }",
+    "}",
+  ].join("\n"));
   const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items[0].stepFunc, "jaiph::prompt");
+  // const row + workflow other row + rule gate row
+  assert.ok(items.some((i) => i.label === "const result"));
+  assert.ok(items.some((i) => i.label.startsWith("workflow other")));
+  assert.ok(items.some((i) => i.label.startsWith("rule gate")));
 });
 
-// --- buildRunTreeRows: self-recursion depth gating ---
+// --- buildRunTreeRows ---
 
-test("buildRunTreeRows: self-recursive workflow with three sites limits expansion", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run", workflow: { value: "default", loc: { line: 2, col: 3 } } },
-        { type: "log", message: "a", loc: { line: 3, col: 3 } },
-        { type: "run", workflow: { value: "default", loc: { line: 4, col: 3 } } },
-        { type: "log", message: "b", loc: { line: 5, col: 3 } },
-        { type: "run", workflow: { value: "default", loc: { line: 6, col: 3 } } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
+test("buildRunTreeRows: includes root and children", () => {
+  const mod = modFor([
+    "workflow default() {",
+    "  run deploy()",
+    "}",
+    "workflow deploy() {",
+    "  log \"d\"",
+    "}",
+  ].join("\n"));
   const rows = buildRunTreeRows(mod);
-  // Should terminate without infinite expansion
-  assert.ok(rows.length >= 3, "should produce tree rows");
-  assert.ok(rows.length < 200, "should not expand infinitely");
-  // Root is first
+  assert.ok(rows.length >= 2);
   assert.equal(rows[0].rawLabel, "workflow default");
-  assert.equal(rows[0].isRoot, true);
-});
-
-// --- collectWorkflowChildren: prompt label formatting ---
-
-test("collectWorkflowChildren: prompt with escaped quotes in raw", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "prompt", raw: 'prompt "say \\"hello\\""', loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  // The escaped quotes in raw should be handled: \" → " in content, then re-escaped for display
-  assert.match(items[0].label, /^prompt "/);
 });
 
-test("collectWorkflowChildren: prompt with no quotes in raw", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "prompt", raw: "prompt myVar", loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  // No quote found, preview is empty → label is just 'prompt ""'
-  assert.equal(items[0].label, 'prompt ""');
-});
-
-// --- styleKeywordLabel / styleDim / styleYellow / styleBold ---
-// In test env (non-TTY), these return plain text. We verify the non-TTY path.
-
-test("styleKeywordLabel: returns plain 'kind name' in non-TTY", () => {
-  const result = styleKeywordLabel("workflow deploy");
-  assert.equal(result, "workflow deploy");
-});
-
-test("styleKeywordLabel: handles single-word label", () => {
-  const result = styleKeywordLabel("wait");
-  assert.equal(result, "step wait");
-});
-
-test("styleDim: returns plain text in non-TTY", () => {
-  assert.equal(styleDim("hello"), "hello");
-});
-
-test("styleYellow: returns plain text in non-TTY", () => {
-  assert.equal(styleYellow("warning"), "warning");
-});
-
-test("styleBold: returns plain text in non-TTY", () => {
-  assert.equal(styleBold("title"), "title");
-});
-
-test("collectWorkflowChildren: prompt with long text truncated at 24 chars", () => {
-  const longText = "A".repeat(30);
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "prompt", raw: `prompt "${longText}"`, loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.ok(items[0].label.includes("A".repeat(24) + "..."), "should truncate at 24 chars");
-  assert.ok(!items[0].label.includes("A".repeat(25)), "should not contain more than 24 chars");
-});
-
-// --- buildRunTreeRows: rootDir parameter ---
-
-test("buildRunTreeRows: rootDir populates symbols for imported modules", () => {
-  const mainMod = minimalModule({
-    filePath: "/project/main.jh",
-    imports: [{ path: "lib.jh", alias: "lib", loc: { line: 1, col: 1 } }],
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run", workflow: { value: "lib.greet", loc: { line: 3, col: 3 } } },
-      ],
-      loc: { line: 2, col: 1 },
-    }],
-  });
-  const libMod = minimalModule({
-    filePath: "/project/lib.jh",
-    workflows: [{
-      name: "greet",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "log", message: "hello", loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const importedModules = new Map([["lib", libMod]]);
-  const rows = buildRunTreeRows(mainMod, undefined, importedModules, "/project");
-  // With rootDir, symbols should be resolved; the run step should have a stepFunc
-  const runRow = rows.find((r) => r.rawLabel === "workflow lib.greet");
-  assert.ok(runRow, "should have the imported workflow row");
-  assert.ok(runRow!.stepFunc, "stepFunc should be populated when rootDir is given");
-});
-
-// --- buildRunTreeRows: custom rootLabel ---
-
-test("buildRunTreeRows: custom rootLabel appears in root row", () => {
-  const mod = minimalModule({
-    workflows: [{ name: "deploy", comments: [], params: [], steps: [], loc: { line: 1, col: 1 } }],
-  });
-  const rows = buildRunTreeRows(mod, "workflow deploy");
-  assert.equal(rows.length, 1);
-  assert.equal(rows[0].rawLabel, "workflow deploy");
-  assert.equal(rows[0].isRoot, true);
-});
-
-test("buildRunTreeRows: custom rootLabel with rule kind", () => {
-  const mod = minimalModule({
-    workflows: [{ name: "check", comments: [], params: [], steps: [], loc: { line: 1, col: 1 } }],
-  });
-  const rows = buildRunTreeRows(mod, "rule check");
-  assert.equal(rows[0].rawLabel, "rule check");
-  assert.equal(rows[0].isRoot, true);
-});
-
-test("buildRunTreeRows: custom rootLabel preserves tree children", () => {
-  const mod = minimalModule({
-    workflows: [
-      {
-        name: "default",
-        comments: [],
-        params: [],
-        steps: [
-          { type: "log", message: "hello", loc: { line: 2, col: 3 } },
-        ],
-        loc: { line: 1, col: 1 },
-      },
-    ],
-  });
-  const rows = buildRunTreeRows(mod, "workflow main_entry");
-  assert.equal(rows.length, 2);
-  assert.equal(rows[0].rawLabel, "workflow main_entry");
-  assert.equal(rows[1].rawLabel, "ℹ hello");
-});
-
-// --- formatRunningBottomLine: edge cases ---
-
-test("formatRunningBottomLine: zero elapsed time", () => {
-  const result = formatRunningBottomLine("test", 0.0);
-  assert.ok(result.includes("RUNNING"), "should contain RUNNING");
-  assert.ok(result.includes("0.0s"), "should show zero time");
-});
-
-test("formatRunningBottomLine: large elapsed time", () => {
-  const result = formatRunningBottomLine("deploy", 999.9);
-  assert.ok(result.includes("999.9s"), "should show large time");
-});
-
-// --- collectWorkflowChildren: shell command truncation boundary ---
-
-test("collectWorkflowChildren: shell command at exactly 56 chars is not truncated", () => {
-  const cmd = "a".repeat(56);
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "shell", command: cmd, loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items[0].label, `$ ${cmd}`, "56-char command should not be truncated");
-  assert.ok(!items[0].label.includes("..."), "should not have ellipsis");
-});
-
-test("collectWorkflowChildren: shell command at 57 chars is truncated", () => {
-  const cmd = "b".repeat(57);
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "shell", command: cmd, loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.ok(items[0].label.includes("..."), "57-char command should be truncated");
-  assert.equal(items[0].label, `$ ${"b".repeat(53)}...`);
-});
-
-test("collectWorkflowChildren: shell command at 1 char is not truncated", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "shell", command: "x", loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items[0].label, "$ x");
-});
-
-// --- style functions: TTY and NO_COLOR paths ---
-
-test("styleKeywordLabel: returns ANSI bold kind when TTY and no NO_COLOR", () => {
-  const origIsTTY = process.stdout.isTTY;
-  const origNoColor = process.env.NO_COLOR;
-  try {
-    Object.defineProperty(process.stdout, "isTTY", { value: true, writable: true, configurable: true });
-    delete process.env.NO_COLOR;
-    const result = styleKeywordLabel("workflow deploy");
-    assert.ok(result.includes("\u001b[1mworkflow\u001b[0m"), "kind should be bold in TTY mode");
-    assert.ok(result.includes("deploy"), "name should be present");
-  } finally {
-    Object.defineProperty(process.stdout, "isTTY", { value: origIsTTY, writable: true, configurable: true });
-    if (origNoColor !== undefined) process.env.NO_COLOR = origNoColor;
-    else delete process.env.NO_COLOR;
-  }
-});
-
-test("styleKeywordLabel: returns plain text when NO_COLOR is set", () => {
-  const origIsTTY = process.stdout.isTTY;
-  const origNoColor = process.env.NO_COLOR;
-  try {
-    Object.defineProperty(process.stdout, "isTTY", { value: true, writable: true, configurable: true });
-    process.env.NO_COLOR = "1";
-    const result = styleKeywordLabel("workflow deploy");
-    assert.equal(result, "workflow deploy", "should return plain text with NO_COLOR");
-    assert.ok(!result.includes("\u001b["), "should not contain ANSI codes");
-  } finally {
-    Object.defineProperty(process.stdout, "isTTY", { value: origIsTTY, writable: true, configurable: true });
-    if (origNoColor !== undefined) process.env.NO_COLOR = origNoColor;
-    else delete process.env.NO_COLOR;
-  }
-});
-
-test("styleDim: returns ANSI dim when TTY and no NO_COLOR", () => {
-  const origIsTTY = process.stdout.isTTY;
-  const origNoColor = process.env.NO_COLOR;
-  try {
-    Object.defineProperty(process.stdout, "isTTY", { value: true, writable: true, configurable: true });
-    delete process.env.NO_COLOR;
-    const result = styleDim("hello");
-    assert.equal(result, "\u001b[2mhello\u001b[0m", "should wrap in dim ANSI");
-  } finally {
-    Object.defineProperty(process.stdout, "isTTY", { value: origIsTTY, writable: true, configurable: true });
-    if (origNoColor !== undefined) process.env.NO_COLOR = origNoColor;
-    else delete process.env.NO_COLOR;
-  }
-});
-
-test("styleDim: returns plain text when NO_COLOR is set", () => {
-  const origIsTTY = process.stdout.isTTY;
-  const origNoColor = process.env.NO_COLOR;
-  try {
-    Object.defineProperty(process.stdout, "isTTY", { value: true, writable: true, configurable: true });
-    process.env.NO_COLOR = "";
-    const result = styleDim("hello");
-    assert.equal(result, "hello", "should return plain text with NO_COLOR");
-  } finally {
-    Object.defineProperty(process.stdout, "isTTY", { value: origIsTTY, writable: true, configurable: true });
-    if (origNoColor !== undefined) process.env.NO_COLOR = origNoColor;
-    else delete process.env.NO_COLOR;
-  }
-});
-
-test("styleYellow: returns ANSI yellow when TTY and no NO_COLOR", () => {
-  const origIsTTY = process.stdout.isTTY;
-  const origNoColor = process.env.NO_COLOR;
-  try {
-    Object.defineProperty(process.stdout, "isTTY", { value: true, writable: true, configurable: true });
-    delete process.env.NO_COLOR;
-    const result = styleYellow("warning");
-    assert.equal(result, "\u001b[33mwarning\u001b[0m", "should wrap in yellow ANSI");
-  } finally {
-    Object.defineProperty(process.stdout, "isTTY", { value: origIsTTY, writable: true, configurable: true });
-    if (origNoColor !== undefined) process.env.NO_COLOR = origNoColor;
-    else delete process.env.NO_COLOR;
-  }
-});
-
-test("styleYellow: returns plain text when NO_COLOR is set", () => {
-  const origIsTTY = process.stdout.isTTY;
-  const origNoColor = process.env.NO_COLOR;
-  try {
-    Object.defineProperty(process.stdout, "isTTY", { value: true, writable: true, configurable: true });
-    process.env.NO_COLOR = "1";
-    const result = styleYellow("warning");
-    assert.equal(result, "warning", "should return plain text with NO_COLOR");
-  } finally {
-    Object.defineProperty(process.stdout, "isTTY", { value: origIsTTY, writable: true, configurable: true });
-    if (origNoColor !== undefined) process.env.NO_COLOR = origNoColor;
-    else delete process.env.NO_COLOR;
-  }
-});
+// --- style helpers (no-color paths) ---
 
-test("styleBold: returns ANSI bold when TTY and no NO_COLOR", () => {
-  const origIsTTY = process.stdout.isTTY;
-  const origNoColor = process.env.NO_COLOR;
+test("styleKeywordLabel: returns plain text when no TTY", () => {
+  const prev = process.stdout.isTTY;
+  Object.defineProperty(process.stdout, "isTTY", { value: false, configurable: true });
   try {
-    Object.defineProperty(process.stdout, "isTTY", { value: true, writable: true, configurable: true });
-    delete process.env.NO_COLOR;
-    const result = styleBold("title");
-    assert.equal(result, "\u001b[1mtitle\u001b[0m", "should wrap in bold ANSI");
+    assert.equal(styleKeywordLabel("workflow default"), "workflow default");
   } finally {
-    Object.defineProperty(process.stdout, "isTTY", { value: origIsTTY, writable: true, configurable: true });
-    if (origNoColor !== undefined) process.env.NO_COLOR = origNoColor;
-    else delete process.env.NO_COLOR;
+    Object.defineProperty(process.stdout, "isTTY", { value: prev, configurable: true });
   }
 });
 
-test("styleBold: returns plain text when not TTY", () => {
-  const origIsTTY = process.stdout.isTTY;
-  const origNoColor = process.env.NO_COLOR;
+test("styleDim / styleYellow / styleBold: no-color when not TTY", () => {
+  const prev = process.stdout.isTTY;
+  Object.defineProperty(process.stdout, "isTTY", { value: false, configurable: true });
   try {
-    Object.defineProperty(process.stdout, "isTTY", { value: false, writable: true, configurable: true });
-    delete process.env.NO_COLOR;
-    const result = styleBold("title");
-    assert.equal(result, "title", "should return plain text when not TTY");
+    assert.equal(styleDim("x"), "x");
+    assert.equal(styleYellow("x"), "x");
+    assert.equal(styleBold("x"), "x");
   } finally {
-    Object.defineProperty(process.stdout, "isTTY", { value: origIsTTY, writable: true, configurable: true });
-    if (origNoColor !== undefined) process.env.NO_COLOR = origNoColor;
-    else delete process.env.NO_COLOR;
+    Object.defineProperty(process.stdout, "isTTY", { value: prev, configurable: true });
   }
 });
 
-// --- buildRunTreeRows: selfRecursiveRunSiteCount returns 0 for missing workflow ---
-
-test("buildRunTreeRows: non-existent nested workflow reference is handled gracefully", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run", workflow: { value: "nonexistent", loc: { line: 2, col: 3 } } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const rows = buildRunTreeRows(mod);
-  // Should have root + the run step reference, but no children expanded since workflow doesn't exist
-  assert.equal(rows.length, 2);
-  assert.equal(rows[0].rawLabel, "workflow default");
-  assert.equal(rows[1].rawLabel, "workflow nonexistent");
-});
-
-test("collectWorkflowChildren: returns empty for workflow with no matching name", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "other",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "log", message: "hello", loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "nonexistent");
-  assert.deepStrictEqual(items, []);
-});
-
-// --- collectWorkflowChildren: prompt with multiline whitespace raw ---
-
-test("collectWorkflowChildren: prompt with triple-quoted raw (no double quote) returns empty preview", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "prompt", raw: 'prompt """\nHello\n"""', loc: { line: 2, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const items = collectWorkflowChildren(mod, "default");
-  assert.equal(items.length, 1);
-  // The promptPreviewFromRaw picks up text between the first pair of double quotes
-  // In triple-quote form, first " starts at index 7, second " is immediately after → empty content
-  // Then third " triggers break → empty preview
-  assert.match(items[0].label, /^prompt "/);
-});
-
-// --- buildRunTreeRows: channels without routes don't produce tree nodes ---
-
-test("buildRunTreeRows: channel without routes adds no tree rows", () => {
-  const mod = minimalModule({
-    channels: [{
-      name: "events",
-      loc: { line: 1, col: 9 },
-    }],
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [{ type: "log", message: "ok", loc: { line: 3, col: 3 } }],
-      loc: { line: 2, col: 1 },
-    }],
-  });
-  const rows = buildRunTreeRows(mod);
-  assert.equal(rows.length, 2); // root + log
-  assert.equal(rows[0].rawLabel, "workflow default");
-  assert.equal(rows[1].rawLabel, "ℹ ok");
-});
-
-// --- buildRunTreeRows: imported module not found falls through gracefully ---
-
-test("buildRunTreeRows: imported module alias not in importedModules map is not expanded", () => {
-  const mainMod = minimalModule({
-    imports: [{ path: "lib.jh", alias: "lib", loc: { line: 1, col: 1 } }],
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "run", workflow: { value: "lib.greet", loc: { line: 3, col: 3 } } },
-      ],
-      loc: { line: 2, col: 1 },
-    }],
-  });
-  // Pass empty importedModules — alias "lib" not resolved
-  const importedModules = new Map<string, jaiphModule>();
-  const rows = buildRunTreeRows(mainMod, undefined, importedModules);
-  // Should still have root + the run step reference, but not expanded
-  assert.equal(rows.length, 2);
-  assert.equal(rows[0].rawLabel, "workflow default");
-  assert.equal(rows[1].rawLabel, "workflow lib.greet");
-});
-
-// --- buildRunTreeRows: match_expr arm expansion ---
-
-test("buildRunTreeRows: match arm with run body expands nested workflow", () => {
-  const mod = minimalModule({
-    workflows: [
-      {
-        name: "default",
-        comments: [],
-        params: [],
-        steps: [
-          {
-            type: "const",
-            name: "result",
-            value: {
-              kind: "match_expr",
-              match: {
-                subject: "x",
-                arms: [
-                  { pattern: { kind: "string_literal", value: "a" }, body: 'run deploy("a")' },
-                  { pattern: { kind: "wildcard" }, body: '"fallback"' },
-                ],
-                loc: { line: 3, col: 3 },
-              },
-            },
-            loc: { line: 2, col: 3 },
-          },
-        ],
-        loc: { line: 1, col: 1 },
-      },
-      {
-        name: "deploy",
-        comments: [],
-        params: [],
-        steps: [
-          { type: "log", message: "deploying", loc: { line: 8, col: 3 } },
-        ],
-        loc: { line: 7, col: 1 },
-      },
-    ],
-  });
-  const rows = buildRunTreeRows(mod);
-  // root + const result + workflow deploy (from match arm) + log deploying (expanded)
-  assert.equal(rows[0].rawLabel, "workflow default");
-  assert.equal(rows[1].rawLabel, "const result");
-  assert.equal(rows[2].rawLabel, "workflow deploy");
-  assert.equal(rows[3].rawLabel, "ℹ deploying");
-  assert.equal(rows.length, 4);
-});
-
-test("buildRunTreeRows: match arm with ensure body shows rule in tree", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        {
-          type: "const",
-          name: "status",
-          value: {
-            kind: "match_expr",
-            match: {
-              subject: "mode",
-              arms: [
-                { pattern: { kind: "string_literal", value: "strict" }, body: 'ensure gate()' },
-                { pattern: { kind: "wildcard" }, body: '"skip"' },
-              ],
-              loc: { line: 3, col: 3 },
-            },
-          },
-          loc: { line: 2, col: 3 },
-        },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const rows = buildRunTreeRows(mod);
-  assert.equal(rows[0].rawLabel, "workflow default");
-  assert.equal(rows[1].rawLabel, "const status");
-  assert.equal(rows[2].rawLabel, "rule gate");
-  assert.equal(rows.length, 3);
-});
-
-// --- buildRunTreeRows: mixed step types in tree ---
-
-test("buildRunTreeRows: workflow with multiple step types produces correct tree", () => {
-  const mod = minimalModule({
-    workflows: [{
-      name: "default",
-      comments: [],
-      params: [],
-      steps: [
-        { type: "log", message: "starting", loc: { line: 2, col: 3 } },
-        { type: "run", workflow: { value: "helper", loc: { line: 3, col: 3 } } },
-        { type: "ensure", ref: { value: "check", loc: { line: 4, col: 3 } } },
-        { type: "send", channel: "events", rhs: { kind: "literal", token: '"data"' }, loc: { line: 5, col: 3 } },
-        { type: "fail", message: '"reason"', loc: { line: 6, col: 3 } },
-      ],
-      loc: { line: 1, col: 1 },
-    }],
-  });
-  const rows = buildRunTreeRows(mod);
-  assert.equal(rows[0].rawLabel, "workflow default");
-  assert.equal(rows[1].rawLabel, "ℹ starting");
-  assert.equal(rows[2].rawLabel, "workflow helper");
-  assert.equal(rows[3].rawLabel, "rule check");
-  assert.equal(rows[4].rawLabel, "events <- send");
-  assert.equal(rows[5].rawLabel, 'fail "reason"');
-  assert.equal(rows.length, 6);
-});
-
-// --- buildRunTreeRows: run with catch block in tree ---
-
-test("buildRunTreeRows: run with catch block shows recovery steps in tree", () => {
-  const mod = minimalModule({
-    workflows: [
-      {
-        name: "default",
-        comments: [],
-        params: [],
-        steps: [
-          {
-            type: "run",
-            workflow: { value: "risky", loc: { line: 2, col: 3 } },
-            catch: {
-              bindings: { failure: "err" },
-              block: [
-                { type: "log", message: "recovering", loc: { line: 4, col: 5 } },
-                { type: "run", workflow: { value: "fallback", loc: { line: 5, col: 5 } } },
-              ],
-            },
-          },
-        ],
-        loc: { line: 1, col: 1 },
-      },
-      {
-        name: "risky",
-        comments: [],
-        params: [],
-        steps: [{ type: "log", message: "trying", loc: { line: 8, col: 3 } }],
-        loc: { line: 7, col: 1 },
-      },
-    ],
-  });
-  const rows = buildRunTreeRows(mod);
-  // root + workflow risky + log trying (expanded) + log recovering (catch) + workflow fallback (catch)
-  assert.equal(rows[0].rawLabel, "workflow default");
-  assert.equal(rows[1].rawLabel, "workflow risky");
-  // risky is expanded since it has children
-  assert.equal(rows[2].rawLabel, "ℹ trying");
-  // catch block children
-  assert.equal(rows[3].rawLabel, "ℹ recovering");
-  assert.equal(rows[4].rawLabel, "workflow fallback");
-  assert.equal(rows.length, 5);
+test("formatRunningBottomLine: renders status with elapsed", () => {
+  const line = formatRunningBottomLine("default", 1.5);
+  assert.ok(line.includes("default"));
+  assert.ok(line.includes("1.5s"));
 });
diff --git a/src/cli/run/progress.ts b/src/cli/run/progress.ts
index 86aeaaa3..546c7aac 100644
--- a/src/cli/run/progress.ts
+++ b/src/cli/run/progress.ts
@@ -1,5 +1,5 @@
 import { resolve } from "node:path";
-import { jaiphModule, type WorkflowStepDef } from "../../types";
+import { jaiphModule, type Expr, type WorkflowStepDef } from "../../types";
 import { workflowSymbolForFile } from "../../transpiler";
 
 export type TreeRow = {
@@ -44,7 +44,7 @@ function selfRecursiveRunSiteCount(mod: jaiphModule, workflowName: string): numb
   }
   let count = 0;
   for (const step of workflow.steps) {
-    if (step.type === "run" && step.workflow.value === workflowName) {
+    if (step.type === "exec" && step.body.kind === "call" && step.body.callee.value === workflowName) {
       count += 1;
       continue;
     }
@@ -52,6 +52,18 @@ function selfRecursiveRunSiteCount(mod: jaiphModule, workflowName: string): numb
   return count;
 }
 
+/** Short surface label for an Expr value (used in `return` / `const` rows). */
+function exprLabel(expr: Expr): string {
+  if (expr.kind === "literal") return expr.raw;
+  if (expr.kind === "call") return `run ${expr.callee.value}(...)`;
+  if (expr.kind === "ensure_call") return `ensure ${expr.callee.value}(...)`;
+  if (expr.kind === "inline_script") return "run `...`(...)";
+  if (expr.kind === "prompt") return `prompt ${expr.raw}`;
+  if (expr.kind === "match") return `match ${expr.match.subject}`;
+  if (expr.kind === "shell") return expr.command;
+  return expr.ref.value;
+}
+
 export function collectWorkflowChildren(
   mod: jaiphModule,
   workflowName: string,
@@ -63,81 +75,77 @@ export function collectWorkflowChildren(
     return [];
   }
   const items: Array<{ label: string; nested?: string; stepFunc?: string }> = [];
+  const refStepFunc = (ref: string): string | undefined =>
+    symbols && ref.includes(".")
+      ? (() => {
+          const dot = ref.indexOf(".");
+          const alias = ref.slice(0, dot);
+          const name = ref.slice(dot + 1);
+          return `${symbols.get(alias) ?? alias}::${name}`;
+        })()
+      : currentSymbol
+        ? `${currentSymbol}::${ref}`
+        : undefined;
   const stepToItems = (s: WorkflowStepDef): Array<{ label: string; nested?: string; stepFunc?: string }> => {
-    if (s.type === "run") {
-      const wf = s.workflow.value;
-      const asyncPrefix = s.async ? "async " : "";
-      const stepFunc =
-        symbols && wf.includes(".")
-          ? (() => {
-              const dot = wf.indexOf(".");
-              const alias = wf.slice(0, dot);
-              const name = wf.slice(dot + 1);
-              return `${symbols.get(alias) ?? alias}::${name}`;
-            })()
-          : currentSymbol
-            ? `${currentSymbol}::${wf}`
-            : undefined;
-      const arr: Array<{ label: string; nested?: string; stepFunc?: string }> = [
-        { label: `${asyncPrefix}workflow ${wf}`, nested: wf, stepFunc },
-      ];
-      if (s.recover) {
-        const steps = "single" in s.recover ? [s.recover.single] : s.recover.block;
-        for (const r of steps) {
-          arr.push(...stepToItems(r));
-        }
-      } else if (s.catch) {
-        const steps = "single" in s.catch ? [s.catch.single] : s.catch.block;
-        for (const r of steps) {
-          arr.push(...stepToItems(r));
+    if (s.type === "exec") {
+      const body = s.body;
+      if (body.kind === "call") {
+        const wf = body.callee.value;
+        const asyncPrefix = body.async ? "async " : "";
+        const arr: Array<{ label: string; nested?: string; stepFunc?: string }> = [
+          { label: `${asyncPrefix}workflow ${wf}`, nested: wf, stepFunc: refStepFunc(wf) },
+        ];
+        if (s.recover) {
+          const steps = "single" in s.recover ? [s.recover.single] : s.recover.block;
+          for (const r of steps) arr.push(...stepToItems(r));
+        } else if (s.catch) {
+          const steps = "single" in s.catch ? [s.catch.single] : s.catch.block;
+          for (const r of steps) arr.push(...stepToItems(r));
         }
+        return arr;
       }
-      return arr;
-    }
-    if (s.type === "ensure") {
-      const ref = s.ref.value;
-      const stepFunc =
-        symbols && ref.includes(".")
-          ? (() => {
-              const dot = ref.indexOf(".");
-              const alias = ref.slice(0, dot);
-              const name = ref.slice(dot + 1);
-              return `${symbols.get(alias) ?? alias}::${name}`;
-            })()
-          : currentSymbol
-            ? `${currentSymbol}::${ref}`
-            : undefined;
-      const arr: Array<{ label: string; nested?: string; stepFunc?: string }> = [
-        { label: `rule ${ref}`, stepFunc },
-      ];
-      if (s.catch) {
-        const steps = "single" in s.catch ? [s.catch.single] : s.catch.block;
-        for (const r of steps) {
-          arr.push(...stepToItems(r));
+      if (body.kind === "ensure_call") {
+        const ref = body.callee.value;
+        const arr: Array<{ label: string; nested?: string; stepFunc?: string }> = [
+          { label: `rule ${ref}`, stepFunc: refStepFunc(ref) },
+        ];
+        if (s.catch) {
+          const steps = "single" in s.catch ? [s.catch.single] : s.catch.block;
+          for (const r of steps) arr.push(...stepToItems(r));
         }
+        return arr;
       }
-      return arr;
-    }
-    if (s.type === "prompt") {
-      return [{ label: formatPromptLabel(s.raw), stepFunc: "jaiph::prompt" }];
-    }
-    if (s.type === "log") {
-      return [{ label: `ℹ ${s.message}` }];
+      if (body.kind === "prompt") {
+        return [{ label: formatPromptLabel(body.raw), stepFunc: "jaiph::prompt" }];
+      }
+      if (body.kind === "inline_script") {
+        return [{ label: "script (inline)" }];
+      }
+      if (body.kind === "shell") {
+        const t = body.command.trim();
+        const label = t.length > 56 ? `${t.slice(0, 53)}...` : t;
+        return [{ label: `$ ${label}` }];
+      }
+      if (body.kind === "match") {
+        // standalone match — no nested rendering
+        return [];
+      }
+      return [];
     }
-    if (s.type === "logerr") {
-      return [{ label: `! ${s.message}` }];
+    if (s.type === "say") {
+      const msg = exprLabel(s.message);
+      if (s.level === "log") return [{ label: `ℹ ${msg}` }];
+      if (s.level === "logerr") return [{ label: `! ${msg}` }];
+      return [{ label: `fail ${msg}` }];
     }
     if (s.type === "send") {
       return [{ label: `${s.channel} <- send` }];
     }
-    if (s.type === "fail") {
-      return [{ label: `fail ${s.message}` }];
-    }
     if (s.type === "const") {
       const constItems: Array<{ label: string; nested?: string; stepFunc?: string }> = [
         { label: `const ${s.name}` },
       ];
-      if (s.value.kind === "match_expr") {
+      if (s.value.kind === "match") {
         for (const arm of s.value.match.arms) {
           const body = arm.body.trimStart();
           const runM = body.match(/^run\s+([A-Za-z_][A-Za-z0-9_.]*)\(/);
@@ -154,19 +162,11 @@ export function collectWorkflowChildren(
       return constItems;
     }
     if (s.type === "return") {
-      return [{ label: `return ${s.value}` }];
+      return [{ label: `return ${exprLabel(s.value)}` }];
     }
-    if (s.type === "comment") {
+    if (s.type === "trivia") {
       return [];
     }
-    if (s.type === "run_inline_script") {
-      return [{ label: "script (inline)" }];
-    }
-    if (s.type === "shell") {
-      const t = s.command.trim();
-      const label = t.length > 56 ? `${t.slice(0, 53)}...` : t;
-      return [{ label: `$ ${label}` }];
-    }
     return [];
   };
 
@@ -179,68 +179,7 @@ export function collectWorkflowChildren(
   }
 
   for (const step of workflow.steps) {
-    if (step.type === "ensure") {
-      items.push(...stepToItems(step));
-      continue;
-    }
-    if (step.type === "run") {
-      const wf = step.workflow.value;
-      const asyncPrefix = step.async ? "async " : "";
-      const stepFunc =
-        symbols && wf.includes(".")
-          ? (() => {
-              const dot = wf.indexOf(".");
-              const alias = wf.slice(0, dot);
-              const name = wf.slice(dot + 1);
-              return `${symbols.get(alias) ?? alias}::${name}`;
-            })()
-          : currentSymbol
-            ? `${currentSymbol}::${wf}`
-            : undefined;
-      items.push(...stepToItems(step));
-      continue;
-    }
-    if (step.type === "run_inline_script") {
-      items.push({ label: "script (inline)" });
-      continue;
-    }
-    if (step.type === "prompt") {
-      items.push({ label: formatPromptLabel(step.raw), stepFunc: "jaiph::prompt" });
-      continue;
-    }
-    if (step.type === "log") {
-      items.push({ label: `ℹ ${step.message}` });
-      continue;
-    }
-    if (step.type === "logerr") {
-      items.push({ label: `! ${step.message}` });
-      continue;
-    }
-    if (step.type === "send") {
-      items.push({ label: `${step.channel} <- send` });
-      continue;
-    }
-    if (step.type === "fail") {
-      items.push({ label: `fail ${step.message}` });
-      continue;
-    }
-    if (step.type === "const") {
-      items.push(...stepToItems(step));
-      continue;
-    }
-    if (step.type === "return") {
-      items.push({ label: `return ${step.value}` });
-      continue;
-    }
-    if (step.type === "comment") {
-      continue;
-    }
-    if (step.type === "shell") {
-      const t = step.command.trim();
-      const label = t.length > 56 ? `${t.slice(0, 53)}...` : t;
-      items.push({ label: `$ ${label}` });
-      continue;
-    }
+    items.push(...stepToItems(step));
   }
   return items;
 }
diff --git a/src/cli/run/sandbox-flags.test.ts b/src/cli/run/sandbox-flags.test.ts
new file mode 100644
index 00000000..8aa07080
--- /dev/null
+++ b/src/cli/run/sandbox-flags.test.ts
@@ -0,0 +1,149 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { applySandboxFlags } from "./env";
+import { resolveDockerConfig, selectSandboxMode } from "../../runtime/docker";
+import { confirmInplaceRun, _inplacePrompt } from "../../runtime/docker-inplace";
+import { mkdtempSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+
+function stubPrompt(): { restore: () => void; callCount: () => number } {
+  const orig = _inplacePrompt.ask;
+  let calls = 0;
+  _inplacePrompt.ask = async (_q: string) => {
+    calls += 1;
+    return true;
+  };
+  return {
+    restore: () => { _inplacePrompt.ask = orig; },
+    callCount: () => calls,
+  };
+}
+
+// ---------------------------------------------------------------------------
+// applySandboxFlags: each flag normalizes into the runtime env map
+// ---------------------------------------------------------------------------
+
+test("applySandboxFlags: --inplace sets JAIPH_INPLACE=1", () => {
+  const env: Record<string, string | undefined> = {};
+  applySandboxFlags(env, { inplace: true });
+  assert.equal(env.JAIPH_INPLACE, "1");
+  assert.equal(env.JAIPH_UNSAFE, undefined);
+  assert.equal(env.JAIPH_INPLACE_YES, undefined);
+});
+
+test("applySandboxFlags: --unsafe sets JAIPH_UNSAFE=true", () => {
+  const env: Record<string, string | undefined> = {};
+  applySandboxFlags(env, { unsafe: true });
+  assert.equal(env.JAIPH_UNSAFE, "true");
+  assert.equal(env.JAIPH_INPLACE, undefined);
+});
+
+test("applySandboxFlags: --yes sets JAIPH_INPLACE_YES=1", () => {
+  const env: Record<string, string | undefined> = {};
+  applySandboxFlags(env, { yes: true });
+  assert.equal(env.JAIPH_INPLACE_YES, "1");
+});
+
+test("applySandboxFlags: no flags leaves env unchanged", () => {
+  const env: Record<string, string | undefined> = { JAIPH_DEBUG: "true" };
+  applySandboxFlags(env, {});
+  assert.deepEqual(env, { JAIPH_DEBUG: "true" });
+});
+
+test("applySandboxFlags: pre-existing env values agree with flag (no conflict)", () => {
+  const env: Record<string, string | undefined> = { JAIPH_INPLACE: "1" };
+  applySandboxFlags(env, { inplace: true });
+  assert.equal(env.JAIPH_INPLACE, "1");
+});
+
+test("applySandboxFlags: env-only path (no flags) still respected by callers — flag missing leaves env alone", () => {
+  const env: Record<string, string | undefined> = { JAIPH_INPLACE: "1" };
+  applySandboxFlags(env, {});
+  assert.equal(env.JAIPH_INPLACE, "1");
+});
+
+// ---------------------------------------------------------------------------
+// E_FLAG_CONFLICT: --inplace + --unsafe is contradictory
+// ---------------------------------------------------------------------------
+
+test("applySandboxFlags: --inplace + --unsafe both set → E_FLAG_CONFLICT", () => {
+  const env: Record<string, string | undefined> = {};
+  assert.throws(
+    () => applySandboxFlags(env, { inplace: true, unsafe: true }),
+    /E_FLAG_CONFLICT/,
+  );
+});
+
+test("applySandboxFlags: --inplace flag + JAIPH_UNSAFE=true env → E_FLAG_CONFLICT", () => {
+  const env: Record<string, string | undefined> = { JAIPH_UNSAFE: "true" };
+  assert.throws(
+    () => applySandboxFlags(env, { inplace: true }),
+    /E_FLAG_CONFLICT/,
+  );
+});
+
+test("applySandboxFlags: --unsafe flag + JAIPH_INPLACE=1 env → E_FLAG_CONFLICT", () => {
+  const env: Record<string, string | undefined> = { JAIPH_INPLACE: "1" };
+  assert.throws(
+    () => applySandboxFlags(env, { unsafe: true }),
+    /E_FLAG_CONFLICT/,
+  );
+});
+
+test("applySandboxFlags: JAIPH_INPLACE=true (string) + JAIPH_UNSAFE=true env → E_FLAG_CONFLICT", () => {
+  const env: Record<string, string | undefined> = { JAIPH_INPLACE: "true", JAIPH_UNSAFE: "true" };
+  assert.throws(
+    () => applySandboxFlags(env, {}),
+    /E_FLAG_CONFLICT/,
+  );
+});
+
+// ---------------------------------------------------------------------------
+// End-to-end: flag-normalized env is consumed by the unmodified docker layer
+// ---------------------------------------------------------------------------
+
+test("--inplace alone (no env) → selectSandboxMode returns 'inplace'", () => {
+  const env: Record<string, string | undefined> = {};
+  applySandboxFlags(env, { inplace: true });
+  assert.equal(selectSandboxMode(env), "inplace");
+});
+
+test("--unsafe alone (no env) → resolveDockerConfig().enabled === false", () => {
+  const env: Record<string, string | undefined> = {};
+  applySandboxFlags(env, { unsafe: true });
+  const cfg = resolveDockerConfig(undefined, env);
+  assert.equal(cfg.enabled, false);
+});
+
+test("env-only JAIPH_INPLACE still selects inplace (regression)", () => {
+  // No flag — the runtime env already had it. selectSandboxMode picks it up.
+  assert.equal(selectSandboxMode({ JAIPH_INPLACE: "1" }), "inplace");
+});
+
+test("env-only JAIPH_UNSAFE still disables Docker (regression)", () => {
+  const cfg = resolveDockerConfig(undefined, { JAIPH_UNSAFE: "true" });
+  assert.equal(cfg.enabled, false);
+});
+
+test("--yes alone (no env) → confirmInplaceRun does not invoke the prompt", async () => {
+  const ws = mkdtempSync(join(tmpdir(), "jaiph-sandbox-flags-ws-"));
+  const spy = stubPrompt();
+  try {
+    const env: Record<string, string | undefined> = {};
+    applySandboxFlags(env, { yes: true });
+    const proceed = await confirmInplaceRun(ws, env, true);
+    assert.equal(proceed, true);
+    assert.equal(spy.callCount(), 0, "prompt must not be invoked when --yes normalized into JAIPH_INPLACE_YES");
+  } finally {
+    spy.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("flag and env agree on JAIPH_INPLACE — no conflict, single value persisted", () => {
+  const env: Record<string, string | undefined> = { JAIPH_INPLACE: "1" };
+  applySandboxFlags(env, { inplace: true });
+  assert.equal(env.JAIPH_INPLACE, "1");
+  assert.equal(selectSandboxMode(env), "inplace");
+});
diff --git a/src/cli/run/stderr-handler.ts b/src/cli/run/stderr-handler.ts
index 8a979ec6..5e85db50 100644
--- a/src/cli/run/stderr-handler.ts
+++ b/src/cli/run/stderr-handler.ts
@@ -46,7 +46,6 @@ function handleLine(
   line: string,
   state: StderrParserState,
   emitter: RunEmitter,
-  formatDiagnosticLine: (line: string) => string,
 ): void {
   const logEvent = parseLogEvent(line);
   if (logEvent) {
@@ -75,7 +74,7 @@ function handleLine(
   }
 
   if (line.length > 0) {
-    emitter.emit("stderr_line", { line: formatDiagnosticLine(line) });
+    emitter.emit("stderr_line", { line });
   }
 }
 
@@ -83,11 +82,10 @@ function handleLine(
  * Create a line handler that parses stderr lines and emits events through the emitter.
  */
 export function createStderrParser(emitter: RunEmitter): (line: string) => void {
-  const formatDiagnosticLine = (ln: string) => ln;
   const state: StderrParserState = {
     runtimeStack: [], legacyStack: [], legacyCounter: 0, rootStepId: null,
   };
-  return (line: string) => handleLine(line, state, emitter, formatDiagnosticLine);
+  return (line: string) => handleLine(line, state, emitter);
 }
 
 // ── Run state (shared output read by runWorkflow after exit) ──
diff --git a/src/cli/shared/errors.test.ts b/src/cli/shared/errors.test.ts
index 1273f7e2..804ce911 100644
--- a/src/cli/shared/errors.test.ts
+++ b/src/cli/shared/errors.test.ts
@@ -12,6 +12,7 @@ import {
   readFailedStepOutput,
   failedStepArtifactPaths,
   discoverDockerRunDir,
+  formatDockerTimeoutMessage,
 } from "./errors";
 
 // === summarizeError ===
@@ -40,6 +41,38 @@ test("summarizeError: handles \\r\\n line endings", () => {
   assert.equal(summarizeError("first\r\nsecond\r\nthird"), "third");
 });
 
+test("summarizeError: empty stderr with code + runDir mentions both", () => {
+  const msg = summarizeError("", undefined, { code: 1, runDir: "/tmp/runs/2026-06-11/00-00-00-x" });
+  assert.match(msg, /\(exit 1\)/);
+  assert.match(msg, /under \/tmp\/runs\/2026-06-11\/00-00-00-x/);
+  assert.match(msg, /run_summary\.jsonl/);
+});
+
+test("summarizeError: empty stderr with code only omits runDir clause", () => {
+  const msg = summarizeError("", undefined, { code: 137 });
+  assert.match(msg, /\(exit 137\) with no error output$/);
+});
+
+test("summarizeError: empty stderr with runDir only omits exit clause", () => {
+  const msg = summarizeError("", undefined, { runDir: "/runs/x" });
+  assert.match(msg, /^Workflow execution failed with no error output;/);
+  assert.match(msg, /under \/runs\/x$/);
+});
+
+test("summarizeError: non-empty stderr ignores code/runDir opts", () => {
+  const msg = summarizeError("real error line", undefined, { code: 1, runDir: "/r" });
+  assert.equal(msg, "real error line");
+});
+
+// === formatDockerTimeoutMessage ===
+
+test("formatDockerTimeoutMessage: includes configured seconds and remedy", () => {
+  const msg = formatDockerTimeoutMessage(42);
+  assert.match(msg, /^E_TIMEOUT container execution exceeded 42s/);
+  assert.match(msg, /runtime\.docker_timeout_seconds/);
+  assert.match(msg, /JAIPH_DOCKER_TIMEOUT/);
+});
+
 // === hasFatalRuntimeStderr ===
 
 test("hasFatalRuntimeStderr: returns false when debug is enabled", () => {
diff --git a/src/cli/shared/errors.ts b/src/cli/shared/errors.ts
index b278bf4c..91582395 100644
--- a/src/cli/shared/errors.ts
+++ b/src/cli/shared/errors.ts
@@ -15,7 +15,11 @@ export function colorPalette(): { green: string; red: string; dim: string; reset
   };
 }
 
-export function summarizeError(stderr: string, fallback?: string): string {
+export function summarizeError(
+  stderr: string,
+  fallback?: string,
+  opts?: { code?: number; runDir?: string },
+): string {
   const lines = stderr
     .split(/\r?\n/)
     .map((line) => line.trim())
@@ -23,9 +27,22 @@ export function summarizeError(stderr: string, fallback?: string): string {
   if (lines.length > 0) {
     return lines[lines.length - 1];
   }
+  const code = opts?.code;
+  const runDir = opts?.runDir;
+  if (code !== undefined || runDir) {
+    const codePart = code !== undefined ? ` (exit ${code})` : "";
+    const dirPart = runDir
+      ? `; inspect run_summary.jsonl and step artifacts under ${runDir}`
+      : "";
+    return `Workflow execution failed${codePart} with no error output${dirPart}`;
+  }
   return fallback ?? "Workflow execution failed.";
 }
 
+export function formatDockerTimeoutMessage(timeoutSeconds: number): string {
+  return `E_TIMEOUT container execution exceeded ${timeoutSeconds}s — increase runtime.docker_timeout_seconds or JAIPH_DOCKER_TIMEOUT`;
+}
+
 export type FailureDetails = {
   summary: string;
   failedStepOutput: string | null;
@@ -36,8 +53,12 @@ export type FailureDetails = {
  * Resolve canonical failure details for CLI rendering.
  * Prefer detailed failed step output when available; summary is fallback-only.
  */
-export function resolveFailureDetails(stderr: string, summaryPath?: string): FailureDetails {
-  const summary = summarizeError(stderr, "Workflow execution failed.");
+export function resolveFailureDetails(
+  stderr: string,
+  summaryPath?: string,
+  opts?: { code?: number; runDir?: string },
+): FailureDetails {
+  const summary = summarizeError(stderr, "Workflow execution failed.", opts);
   const failedStepOutput = summaryPath ? readFailedStepOutput(summaryPath) : null;
   return {
     summary,
diff --git a/src/cli/shared/paths.ts b/src/cli/shared/paths.ts
index 2eca41a7..2e404911 100644
--- a/src/cli/shared/paths.ts
+++ b/src/cli/shared/paths.ts
@@ -3,6 +3,7 @@ import { basename, dirname, join, resolve, sep } from "node:path";
 import { parsejaiph } from "../../parser";
 import { resolveImportPath } from "../../transpiler";
 import { jaiphModule } from "../../types";
+import { JAIPH_SKILL_MD_BASE64, decodeEmbeddedAsset } from "../../runtime/embedded-assets";
 
 /**
  * When TMPDIR (or other tooling) places temp projects under `<repo>/.jaiph/tmp/...`,
@@ -112,6 +113,19 @@ export function resolveInstalledSkillPath(): string | undefined {
   return candidates.find((path) => existsSync(path));
 }
 
+/**
+ * Resolve the SKILL.md body that `jaiph init` should write.
+ *
+ * Disk lookup wins (so a contributor overriding `JAIPH_SKILL_PATH` or running
+ * from a checkout still gets the live source), and the embedded copy is the
+ * fallback for the bun-compiled standalone binary, which has no sibling files.
+ */
+export function loadInstalledSkillContent(): string {
+  const path = resolveInstalledSkillPath();
+  if (path) return readFileSync(path, "utf8");
+  return decodeEmbeddedAsset(JAIPH_SKILL_MD_BASE64);
+}
+
 export function loadImportedModules(mainMod: jaiphModule, workspaceRoot?: string): Map<string, jaiphModule> {
   const map = new Map<string, jaiphModule>();
   for (const imp of mainMod.imports) {
diff --git a/src/cli/shared/usage.test.ts b/src/cli/shared/usage.test.ts
new file mode 100644
index 00000000..ca2971df
--- /dev/null
+++ b/src/cli/shared/usage.test.ts
@@ -0,0 +1,179 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { parseArgs, printUsage } from "./usage";
+
+function captureStdout(): { restore: () => void; text: () => string } {
+  let buf = "";
+  const orig = process.stdout.write;
+  process.stdout.write = ((chunk: string | Uint8Array) => {
+    buf += String(chunk);
+    return true;
+  }) as typeof process.stdout.write;
+  return {
+    restore: () => { process.stdout.write = orig; },
+    text: () => buf,
+  };
+}
+
+// ---------------------------------------------------------------------------
+// parseArgs: existing behavior (regression)
+// ---------------------------------------------------------------------------
+
+test("parseArgs: --target captures next arg and continues parsing", () => {
+  const r = parseArgs(["--target", "/tmp/out", "flow.jh", "hello"]);
+  assert.equal(r.target, "/tmp/out");
+  assert.deepEqual(r.positional, ["flow.jh", "hello"]);
+});
+
+test("parseArgs: --target without a value throws", () => {
+  assert.throws(() => parseArgs(["--target"]), /--target requires a directory path/);
+});
+
+test("parseArgs: --raw sets raw=true", () => {
+  const r = parseArgs(["--raw", "flow.jh"]);
+  assert.equal(r.raw, true);
+  assert.deepEqual(r.positional, ["flow.jh"]);
+});
+
+test("parseArgs: -- terminates flag parsing and pushes the rest into positional", () => {
+  const r = parseArgs(["--raw", "flow.jh", "--", "--raw", "--target", "foo"]);
+  assert.equal(r.raw, true);
+  assert.deepEqual(r.positional, ["flow.jh", "--raw", "--target", "foo"]);
+});
+
+// ---------------------------------------------------------------------------
+// parseArgs: new flags
+// ---------------------------------------------------------------------------
+
+test("parseArgs: --workspace captures next arg", () => {
+  const r = parseArgs(["--workspace", "/tmp/ws", "flow.jh"]);
+  assert.equal(r.workspace, "/tmp/ws");
+  assert.deepEqual(r.positional, ["flow.jh"]);
+});
+
+test("parseArgs: --workspace without a value throws", () => {
+  assert.throws(() => parseArgs(["--workspace"]), /--workspace requires a directory path/);
+});
+
+test("parseArgs: --inplace sets inplace=true", () => {
+  const r = parseArgs(["--inplace", "flow.jh"]);
+  assert.equal(r.inplace, true);
+  assert.deepEqual(r.positional, ["flow.jh"]);
+});
+
+test("parseArgs: --unsafe sets unsafe=true", () => {
+  const r = parseArgs(["--unsafe", "flow.jh"]);
+  assert.equal(r.unsafe, true);
+  assert.deepEqual(r.positional, ["flow.jh"]);
+});
+
+test("parseArgs: --yes sets yes=true", () => {
+  const r = parseArgs(["--yes", "flow.jh"]);
+  assert.equal(r.yes, true);
+});
+
+test("parseArgs: -y short form sets yes=true", () => {
+  const r = parseArgs(["-y", "flow.jh"]);
+  assert.equal(r.yes, true);
+});
+
+test("parseArgs: -- still terminates parsing after new flags; post-`--` tokens land in positional unchanged", () => {
+  const r = parseArgs(["--inplace", "flow.jh", "--", "--inplace", "--unsafe", "--yes"]);
+  assert.equal(r.inplace, true);
+  assert.equal(r.unsafe, undefined);
+  assert.equal(r.yes, undefined);
+  assert.deepEqual(r.positional, ["flow.jh", "--inplace", "--unsafe", "--yes"]);
+});
+
+test("parseArgs: all new flags combined with existing flags", () => {
+  const r = parseArgs([
+    "--raw",
+    "--target", "/tmp/out",
+    "--workspace", "/tmp/ws",
+    "--inplace",
+    "--yes",
+    "flow.jh",
+    "arg1",
+  ]);
+  assert.equal(r.raw, true);
+  assert.equal(r.target, "/tmp/out");
+  assert.equal(r.workspace, "/tmp/ws");
+  assert.equal(r.inplace, true);
+  assert.equal(r.yes, true);
+  assert.equal(r.unsafe, undefined);
+  assert.deepEqual(r.positional, ["flow.jh", "arg1"]);
+});
+
+// ---------------------------------------------------------------------------
+// parseArgs: --flag=value form
+// ---------------------------------------------------------------------------
+
+test("parseArgs: --workspace=value form captures the value", () => {
+  const r = parseArgs(["--workspace=/tmp/ws", "flow.jh"]);
+  assert.equal(r.workspace, "/tmp/ws");
+  assert.deepEqual(r.positional, ["flow.jh"]);
+});
+
+test("parseArgs: --target=value form captures the value", () => {
+  const r = parseArgs(["--target=/tmp/out", "flow.jh", "hello"]);
+  assert.equal(r.target, "/tmp/out");
+  assert.deepEqual(r.positional, ["flow.jh", "hello"]);
+});
+
+test("parseArgs: --flag=value and --flag value forms are equivalent", () => {
+  const eq = parseArgs(["--workspace=/tmp/ws", "--target=/tmp/out", "flow.jh"]);
+  const sp = parseArgs(["--workspace", "/tmp/ws", "--target", "/tmp/out", "flow.jh"]);
+  assert.deepEqual(eq, sp);
+});
+
+test("parseArgs: --workspace= splits on the first '=' so values may contain '='", () => {
+  const r = parseArgs(["--workspace=/tmp/a=b", "flow.jh"]);
+  assert.equal(r.workspace, "/tmp/a=b");
+  assert.deepEqual(r.positional, ["flow.jh"]);
+});
+
+test("parseArgs: --workspace= with empty value throws", () => {
+  assert.throws(() => parseArgs(["--workspace="]), /--workspace requires a directory path/);
+});
+
+test("parseArgs: boolean flag with =value form throws", () => {
+  assert.throws(() => parseArgs(["--inplace=true", "flow.jh"]), /--inplace does not take a value/);
+});
+
+test("parseArgs: --flag=value after -- is left untouched in positional", () => {
+  const r = parseArgs(["flow.jh", "--", "--workspace=/should/not/parse"]);
+  assert.equal(r.workspace, undefined);
+  assert.deepEqual(r.positional, ["flow.jh", "--workspace=/should/not/parse"]);
+});
+
+// ---------------------------------------------------------------------------
+// printUsage: lists the new flags under `jaiph run`
+// ---------------------------------------------------------------------------
+
+test("printUsage: lists --workspace, --inplace, --unsafe, --yes under jaiph run", () => {
+  const cap = captureStdout();
+  try {
+    printUsage();
+  } finally {
+    cap.restore();
+  }
+  const text = cap.text();
+  const runSection = text.slice(text.indexOf("jaiph run:"));
+  assert.ok(runSection.includes("--workspace"), "jaiph run section mentions --workspace");
+  assert.ok(runSection.includes("--inplace"), "jaiph run section mentions --inplace");
+  assert.ok(runSection.includes("--unsafe"), "jaiph run section mentions --unsafe");
+  assert.ok(runSection.includes("--yes"), "jaiph run section mentions --yes");
+});
+
+test("printUsage: example shows --inplace + --workspace combo", () => {
+  const cap = captureStdout();
+  try {
+    printUsage();
+  } finally {
+    cap.restore();
+  }
+  assert.ok(
+    cap.text().includes("jaiph run --inplace --workspace"),
+    "examples block has the documented --inplace + --workspace combo",
+  );
+});
diff --git a/src/cli/shared/usage.ts b/src/cli/shared/usage.ts
index 9166228d..a8fd3535 100644
--- a/src/cli/shared/usage.ts
+++ b/src/cli/shared/usage.ts
@@ -5,31 +5,39 @@ export function printUsage(): void {
       "  jaiph [--help | --version]",
       "  jaiph <file.jh> [args...]                # run workflow (same as jaiph run <file> [args...])",
       "  jaiph <file.test.jh> [args...]           # run tests (same as jaiph test <file>; extra args ignored)",
-      "  jaiph run [--target <dir>] [--raw] <file.jh> [--] [args...]",
+      "  jaiph run [--target <dir>] [--raw] [--workspace <dir>] [--inplace] [--unsafe] [--yes|-y] <file.jh> [--] [args...]",
       "  jaiph test [path]                        # workspace root, directory (recursive), or one *.test.jh file",
       "  jaiph init [workspace-path]",
-      "  jaiph install [--force] [<repo-url[@version]> ...]",
+      "  jaiph install [--force] [<name[@version]> | <repo-url[@version]> ...]",
       "  jaiph use <version|nightly>",
       "  jaiph format [--check] [--indent <n>] <file.jh ...>",
       "  jaiph compile [--json] [--workspace <dir>] <file.jh | directory> ...",
       "",
-      "Global options (only as the first argument, before a subcommand or file path):",
-      "  -h, --help     show this usage",
+      "Global options:",
+      "  -h, --help     show this usage (jaiph --help) — each subcommand also accepts -h / --help",
       "  -v, --version  show version",
       "",
       "jaiph run:",
-      "  --target <dir>  keep emitted script files and run metadata under <dir> (default: temp dir, cleaned up)",
-      "  --raw           skip banner, progress tree, hooks, and failure footer; inherited stdio for embedding / Docker inner run",
-      "  --              end of jaiph flags; remaining args are passed to workflow default",
+      "  --target <dir>     keep emitted script files and run metadata under <dir> (default: temp dir, cleaned up)",
+      "  --raw              skip banner, progress tree, hooks, and failure footer; inherited stdio for embedding / Docker inner run",
+      "  --workspace <dir>  workspace root for import resolution (default: auto-detect from the .jh file)",
+      "  --inplace          bind-mount the host workspace rw so edits land live (sets JAIPH_INPLACE=1 for this run)",
+      "  --unsafe           run on the host with no sandbox (sets JAIPH_UNSAFE=true for this run)",
+      "  -y, --yes          skip the in-place confirmation prompt (sets JAIPH_INPLACE_YES=1 for this run)",
+      "  --                 end of jaiph flags; remaining args are passed to workflow default",
+      "  Note: these flags only affect `jaiph run`; the corresponding env vars (JAIPH_INPLACE,",
+      "  JAIPH_UNSAFE, JAIPH_INPLACE_YES) also apply to other entry points (e.g. `jaiph test`).",
       "",
       "jaiph test:",
       "  With no path, discovers *.test.jh under the workspace root. Extra arguments after an optional",
       "  path are accepted but ignored (reserved).",
       "",
       "jaiph install:",
-      "  With one or more URLs: shallow-clone each repo into .jaiph/libs/<name>/ and update .jaiph/libs.lock.",
-      "  With no args: restore all libraries listed in .jaiph/libs.lock.",
+      "  Args: bare names resolve via the registry; anything containing '/' or ':' is a git URL.",
+      "  With one or more args: shallow-clone each repo into .jaiph/libs/<name>/ and update .jaiph/libs.lock.",
+      "  With no args: restore all libraries listed in .jaiph/libs.lock (registry not contacted).",
       "  --force         delete existing clone and re-clone",
+      "  JAIPH_REGISTRY  registry index path/URL (default: https://jaiph.org/registry).",
       "",
       "jaiph format:",
       "  --check         exit non-zero when file(s) need formatting (no writes)",
@@ -50,10 +58,14 @@ export function printUsage(): void {
       "  jaiph run ./flows/review.jh 'review this diff'",
       "  jaiph run --raw ./flows/review.jh",
       "  jaiph run --target /tmp/jaiph-out ./flows/review.jh",
+      "  jaiph run --inplace --workspace ./app ./flows/fix.jh",
+      "  jaiph run --unsafe ./flows/quick.jh",
       "  jaiph test",
       "  jaiph test ./e2e",
       "  jaiph test e2e/say_hello.test.jh",
       "  jaiph init",
+      "  jaiph install jaiphlang",
+      "  jaiph install mylib@v1.2",
       "  jaiph install https://github.com/you/queue-lib.git@v1.0",
       "  jaiph install",
       "  jaiph use nightly",
@@ -67,29 +79,84 @@ export function printUsage(): void {
   );
 }
 
-export function parseArgs(args: string[]): { target?: string; raw?: boolean; positional: string[] } {
+/**
+ * Returns true if any token before `--` is `-h` or `--help`.
+ * Subcommands call this at the top of their entry function so help requests
+ * never fall into positional / file-path resolution.
+ */
+export function hasHelpFlag(args: string[]): boolean {
+  for (const a of args) {
+    if (a === "--") return false;
+    if (a === "-h" || a === "--help") return true;
+  }
+  return false;
+}
+
+export interface ParsedArgs {
+  target?: string;
+  raw?: boolean;
+  workspace?: string;
+  inplace?: boolean;
+  unsafe?: boolean;
+  yes?: boolean;
+  positional: string[];
+}
+
+export function parseArgs(args: string[]): ParsedArgs {
   let target: string | undefined;
   let raw: boolean | undefined;
+  let workspace: string | undefined;
+  let inplace: boolean | undefined;
+  let unsafe: boolean | undefined;
+  let yes: boolean | undefined;
   const positional: string[] = [];
   for (let i = 0; i < args.length; i += 1) {
-    if (args[i] === "--target") {
-      const val = args[i + 1];
+    const arg = args[i];
+    if (arg === "--") {
+      positional.push(...args.slice(i + 1));
+      break;
+    }
+
+    // Accept both `--flag value` and `--flag=value` for long options. Split on
+    // the first `=` only, so values may themselves contain `=`.
+    let name = arg;
+    let inlineValue: string | undefined;
+    if (arg.startsWith("--") && arg.includes("=")) {
+      const eq = arg.indexOf("=");
+      name = arg.slice(0, eq);
+      inlineValue = arg.slice(eq + 1);
+    }
+
+    // Value-taking flags: value comes from `=` or the next token.
+    if (name === "--target" || name === "--workspace") {
+      let val: string | undefined;
+      if (inlineValue !== undefined) {
+        val = inlineValue;
+      } else {
+        val = args[i + 1];
+        i += 1;
+      }
       if (!val) {
-        throw new Error("--target requires a directory path");
+        throw new Error(`${name} requires a directory path`);
       }
-      target = val;
-      i += 1;
+      if (name === "--target") target = val;
+      else workspace = val;
       continue;
     }
-    if (args[i] === "--raw") {
-      raw = true;
+
+    // Boolean flags: do not accept an `=value` form.
+    if (name === "--raw" || name === "--inplace" || name === "--unsafe" || name === "--yes" || arg === "-y") {
+      if (inlineValue !== undefined) {
+        throw new Error(`${name} does not take a value`);
+      }
+      if (name === "--raw") raw = true;
+      else if (name === "--inplace") inplace = true;
+      else if (name === "--unsafe") unsafe = true;
+      else yes = true;
       continue;
     }
-    if (args[i] === "--") {
-      positional.push(...args.slice(i + 1));
-      break;
-    }
-    positional.push(args[i]);
+
+    positional.push(arg);
   }
-  return { target, raw, positional };
+  return { target, raw, workspace, inplace, unsafe, yes, positional };
 }
diff --git a/src/diagnostics.ts b/src/diagnostics.ts
new file mode 100644
index 00000000..2aed034a
--- /dev/null
+++ b/src/diagnostics.ts
@@ -0,0 +1,130 @@
+/**
+ * Diagnostics collector — replaces fail-fast error reporting for the validator
+ * (and any future call-site that wants to keep going after the first error).
+ *
+ * Two-tier model:
+ * - **Recoverable** errors append to `Diagnostics.errors` and short-circuit the
+ *   current validation unit via {@link BailoutError}. The unit's outer
+ *   `diag.capture(...)` wrapper absorbs the bailout so the next unit (next
+ *   step / next rule / next channel) still runs.
+ * - **Fatal** errors continue to throw via `jaiphError` (parser-level cases
+ *   where continuing would produce garbage AST — unterminated triple-quote,
+ *   unterminated brace block, etc.). A fatal bit on the diagnostic record
+ *   lets the CLI render them distinctly if needed.
+ *
+ * The collector also accepts errors that helpers still throw via the legacy
+ * `jaiphError(file, line, col, code, msg)` shape: `capture()` parses such a
+ * thrown error back into a `JaiphDiagnostic` and appends it. That keeps
+ * helper signatures stable while still surfacing the full error set.
+ */
+
+import { jaiphError } from "./errors";
+
+export interface JaiphDiagnostic {
+  file: string;
+  line: number;
+  col: number;
+  code: string;
+  message: string;
+  fatal: boolean;
+}
+
+/** Sentinel thrown by `diag.error(...)` to unwind to the nearest capture boundary. */
+export class BailoutError extends Error {
+  readonly __jaiphBailout = true as const;
+  constructor() {
+    super("jaiph bailout");
+  }
+}
+
+export function isBailout(err: unknown): err is BailoutError {
+  return err instanceof Error && (err as { __jaiphBailout?: unknown }).__jaiphBailout === true;
+}
+
+/** Parse `path:line:col CODE message` (the shape `jaiphError` produces). */
+export function diagnosticFromThrown(err: unknown, fatal = false): JaiphDiagnostic | null {
+  if (!(err instanceof Error)) return null;
+  if (isBailout(err)) return null;
+  const m = err.message.match(/^(.+):(\d+):(\d+) (\S+) ([\s\S]+)$/);
+  if (!m) return null;
+  return {
+    file: m[1],
+    line: Number(m[2]),
+    col: Number(m[3]),
+    code: m[4],
+    message: m[5].trimEnd(),
+    fatal,
+  };
+}
+
+export class Diagnostics {
+  readonly errors: JaiphDiagnostic[] = [];
+
+  add(d: JaiphDiagnostic): void {
+    this.errors.push(d);
+  }
+
+  /**
+   * Append a recoverable diagnostic and short-circuit the current validation
+   * unit via `BailoutError`. The nearest `capture()` boundary absorbs the
+   * bailout so the next sibling unit still runs.
+   */
+  error(file: string, line: number, col: number, code: string, message: string): never {
+    this.errors.push({ file, line, col, code, message, fatal: false });
+    throw new BailoutError();
+  }
+
+  /**
+   * Run `fn`. Absorb `BailoutError`. Parse any thrown `jaiphError`-shape error
+   * into a recoverable diagnostic. Re-throw anything else (likely an internal
+   * bug we want to surface).
+   */
+  capture(fn: () => void): void {
+    try {
+      fn();
+    } catch (e) {
+      if (isBailout(e)) return;
+      const d = diagnosticFromThrown(e);
+      if (d) {
+        this.errors.push(d);
+        return;
+      }
+      throw e;
+    }
+  }
+
+  hasErrors(): boolean {
+    return this.errors.length > 0;
+  }
+
+  hasFatal(): boolean {
+    return this.errors.some((d) => d.fatal);
+  }
+
+  /** Stable order: file, then line, then column. */
+  sorted(): JaiphDiagnostic[] {
+    return [...this.errors].sort((a, b) => {
+      if (a.file !== b.file) return a.file < b.file ? -1 : 1;
+      if (a.line !== b.line) return a.line - b.line;
+      return a.col - b.col;
+    });
+  }
+
+  /** One `file:line:col CODE message` line per diagnostic, in sorted order. */
+  formatLines(): string[] {
+    return this.sorted().map(
+      (d) => `${d.file}:${d.line}:${d.col} ${d.code} ${d.message}`,
+    );
+  }
+
+  /**
+   * Legacy bridge: throw the first sorted diagnostic as a regular `jaiphError`
+   * so existing callers that depend on `validateReferences` throwing continue
+   * to work. Does nothing when empty.
+   */
+  throwFirstIfAny(): void {
+    if (this.errors.length === 0) return;
+    const f = this.sorted()[0];
+    throw jaiphError(f.file, f.line, f.col, f.code, f.message);
+  }
+}
diff --git a/src/format/emit.test.ts b/src/format/emit.test.ts
index 450b827f..050bca56 100644
--- a/src/format/emit.test.ts
+++ b/src/format/emit.test.ts
@@ -1,11 +1,11 @@
 import { describe, it } from "node:test";
 import assert from "node:assert/strict";
-import { parsejaiph } from "../parser";
+import { parsejaiphWithTrivia } from "../parser";
 import { emitModule } from "./emit";
 
 function roundTrip(source: string, filePath = "test.jh"): string {
-  const mod = parsejaiph(source, filePath);
-  return emitModule(mod);
+  const { ast, trivia } = parsejaiphWithTrivia(source, filePath);
+  return emitModule(ast, trivia);
 }
 
 describe("emitModule", () => {
@@ -166,8 +166,8 @@ describe("emitModule", () => {
       "}",
       "",
     ].join("\n");
-    const mod = parsejaiph(input, "test.jh");
-    assert.equal(emitModule(mod, { indent: 4 }), expected);
+    const { ast, trivia } = parsejaiphWithTrivia(input, "test.jh");
+    assert.equal(emitModule(ast, trivia, { indent: 4 }), expected);
   });
 
   it("reorders out-of-order definitions to canonical order", () => {
@@ -569,4 +569,93 @@ describe("emitModule", () => {
     ].join("\n");
     assert.equal(roundTrip(source), source);
   });
+
+  it("formats if/else with canonical `} else {` on one line", () => {
+    const source = [
+      "workflow default(status) {",
+      '  if status == "ok" {',
+      '    log "healthy"',
+      "  } else {",
+      '    logerr "unhealthy: ${status}"',
+      "  }",
+      "}",
+      "",
+    ].join("\n");
+    assert.equal(roundTrip(source), source);
+  });
+
+  it("if/else is idempotent across two format passes", () => {
+    const source = [
+      "workflow default(status) {",
+      '  if status == "ok" {',
+      '    log "healthy"',
+      "  } else {",
+      '    logerr "unhealthy: ${status}"',
+      "  }",
+      "}",
+      "",
+    ].join("\n");
+    const once = roundTrip(source);
+    const twice = roundTrip(once);
+    assert.equal(twice, once);
+  });
+
+  it("preserves quotes on top-level const string values regardless of spaces", () => {
+    const source = [
+      'const p = "some/path with space.md"',
+      "",
+      'const q = ".jaiph/tmp/x.md"',
+      "",
+      "const MAX = 3",
+      "",
+      "workflow default() {",
+      "  log p",
+      "}",
+      "",
+    ].join("\n");
+    assert.equal(roundTrip(source), source);
+  });
+
+  it("top-level const quoting is idempotent across two format passes", () => {
+    const source = [
+      'const p = "some/path with space.md"',
+      "",
+      'const q = ".jaiph/tmp/x.md"',
+      "",
+      "const MAX = 3",
+      "",
+      "workflow default() {",
+      "  log p",
+      "}",
+      "",
+    ].join("\n");
+    const once = roundTrip(source);
+    const twice = roundTrip(once);
+    assert.equal(twice, once);
+    assert.equal(once, source);
+  });
+
+  it("preserves top-level const value bit-for-bit across format (so ${q} interpolation is identical)", () => {
+    const source = [
+      'const q = ".jaiph/tmp/x.md"',
+      "",
+      'const p = "some/path with space.md"',
+      "",
+      "const MAX = 3",
+      "",
+      "workflow default() {",
+      '  log "${q}"',
+      "}",
+      "",
+    ].join("\n");
+    const before = parsejaiphWithTrivia(source, "test.jh").ast;
+    const formatted = roundTrip(source);
+    const after = parsejaiphWithTrivia(formatted, "test.jh").ast;
+    assert.equal(after.envDecls!.length, before.envDecls!.length);
+    for (let i = 0; i < before.envDecls!.length; i++) {
+      assert.equal(after.envDecls![i].name, before.envDecls![i].name);
+      assert.equal(after.envDecls![i].value, before.envDecls![i].value);
+    }
+    assert.equal(before.envDecls![0].value, ".jaiph/tmp/x.md");
+  });
 });
diff --git a/src/format/emit.ts b/src/format/emit.ts
index f1315f22..c8467117 100644
--- a/src/format/emit.ts
+++ b/src/format/emit.ts
@@ -1,8 +1,8 @@
 import type {
+  Arg,
+  Expr,
   jaiphModule,
   WorkflowStepDef,
-  ConstRhs,
-  SendRhsDef,
   WorkflowDef,
   RuleDef,
   ScriptDef,
@@ -13,7 +13,7 @@ import type {
   WorkflowMetadata,
   TopLevelEmitOrder,
 } from "../types";
-import { parseCallRef } from "../parse/core";
+import { createTrivia, type NodeTrivia, type Trivia } from "../parse/trivia";
 
 export interface EmitOptions {
   indent: number;
@@ -21,7 +21,10 @@ export interface EmitOptions {
 
 const DEFAULT_OPTIONS: EmitOptions = { indent: 2 };
 
-/** When `topLevelOrder` is missing (hand-built AST), match pre–source-order emit behavior. */
+function tn(trivia: Trivia, node: object): NodeTrivia {
+  return trivia.getNode(node) ?? {};
+}
+
 function legacyTopLevelOrder(mod: jaiphModule): TopLevelEmitOrder[] {
   const o: TopLevelEmitOrder[] = [];
   if (mod.envDecls) {
@@ -36,31 +39,41 @@ function legacyTopLevelOrder(mod: jaiphModule): TopLevelEmitOrder[] {
   return o;
 }
 
-function topLevelOrderForEmit(mod: jaiphModule): TopLevelEmitOrder[] {
-  if (mod.topLevelOrder && mod.topLevelOrder.length > 0) return mod.topLevelOrder;
+function topLevelOrderForEmit(mod: jaiphModule, trivia: Trivia): TopLevelEmitOrder[] {
+  const order = trivia.getModule().topLevelOrder;
+  if (order && order.length > 0) return order;
   return legacyTopLevelOrder(mod);
 }
 
-export function emitModule(mod: jaiphModule, opts: EmitOptions = DEFAULT_OPTIONS): string {
+export function emitModule(
+  mod: jaiphModule,
+  triviaOrOpts: Trivia | EmitOptions = createTrivia(),
+  optsArg?: EmitOptions,
+): string {
+  let trivia: Trivia;
+  let opts: EmitOptions;
+  if (triviaOrOpts instanceof Object && "indent" in triviaOrOpts && !("getModule" in triviaOrOpts)) {
+    trivia = createTrivia();
+    opts = triviaOrOpts as EmitOptions;
+  } else {
+    trivia = triviaOrOpts as Trivia;
+    opts = optsArg ?? DEFAULT_OPTIONS;
+  }
   const sections: string[] = [];
   const pad = " ".repeat(opts.indent);
-
-  // Shebang — we don't store it in the AST, so the caller must prepend it if needed.
-  // (handled by the format command reading the first line of the original source)
+  const modTrivia = trivia.getModule();
 
   const importLines: string[] = [];
   if (mod.scriptImports) {
     for (const si of mod.scriptImports) {
-      if (si.leadingComments?.length) {
-        importLines.push(emitCommentBlock(si.leadingComments));
-      }
+      const lc = tn(trivia, si).leadingComments;
+      if (lc?.length) importLines.push(emitCommentBlock(lc));
       importLines.push(`import script "${si.path}" as ${si.alias}`);
     }
   }
   for (const imp of mod.imports) {
-    if (imp.leadingComments?.length) {
-      importLines.push(emitCommentBlock(imp.leadingComments));
-    }
+    const lc = tn(trivia, imp).leadingComments;
+    if (lc?.length) importLines.push(emitCommentBlock(lc));
     importLines.push(`import "${imp.path}" as ${imp.alias}`);
   }
   if (importLines.length > 0) {
@@ -68,17 +81,16 @@ export function emitModule(mod: jaiphModule, opts: EmitOptions = DEFAULT_OPTIONS
   }
 
   if (mod.metadata) {
-    if (mod.configLeadingComments?.length) {
-      sections.push(emitCommentBlock(mod.configLeadingComments));
+    if (modTrivia.configLeadingComments?.length) {
+      sections.push(emitCommentBlock(modTrivia.configLeadingComments));
     }
-    sections.push(emitConfig(mod.metadata, pad));
+    sections.push(emitConfig(mod.metadata, pad, trivia));
   }
 
   const channelLines: string[] = [];
   for (const ch of mod.channels) {
-    if (ch.leadingComments?.length) {
-      channelLines.push(emitCommentBlock(ch.leadingComments));
-    }
+    const lc = tn(trivia, ch).leadingComments;
+    if (lc?.length) channelLines.push(emitCommentBlock(lc));
     channelLines.push(emitChannel(ch));
   }
   if (channelLines.length > 0) {
@@ -87,7 +99,7 @@ export function emitModule(mod: jaiphModule, opts: EmitOptions = DEFAULT_OPTIONS
 
   const exportedNames = new Set(mod.exports);
 
-  for (const item of topLevelOrderForEmit(mod)) {
+  for (const item of topLevelOrderForEmit(mod, trivia)) {
     if (item.kind === "env") {
       const env = mod.envDecls![item.index];
       const envLines: string[] = [];
@@ -99,12 +111,12 @@ export function emitModule(mod: jaiphModule, opts: EmitOptions = DEFAULT_OPTIONS
       continue;
     }
     if (item.kind === "rule") {
-      sections.push(emitRule(mod.rules[item.index], pad, exportedNames.has(mod.rules[item.index].name)));
+      sections.push(emitRule(mod.rules[item.index], pad, exportedNames.has(mod.rules[item.index].name), trivia));
       continue;
     }
     if (item.kind === "script") {
       sections.push(
-        emitScript(mod.scripts[item.index], pad, exportedNames.has(mod.scripts[item.index].name)),
+        emitScript(mod.scripts[item.index], pad, exportedNames.has(mod.scripts[item.index].name), trivia),
       );
       continue;
     }
@@ -114,21 +126,21 @@ export function emitModule(mod: jaiphModule, opts: EmitOptions = DEFAULT_OPTIONS
           mod.workflows[item.index],
           pad,
           exportedNames.has(mod.workflows[item.index].name),
+          trivia,
         ),
       );
       continue;
     }
-    sections.push(emitTestBlock(mod.tests![item.index], pad));
+    sections.push(emitTestBlock(mod.tests![item.index], pad, trivia));
   }
 
-  if (mod.trailingTopLevelComments?.length) {
-    sections.push(emitCommentBlock(mod.trailingTopLevelComments));
+  if (modTrivia.trailingTopLevelComments?.length) {
+    sections.push(emitCommentBlock(modTrivia.trailingTopLevelComments));
   }
 
   return sections.join("\n\n") + "\n";
 }
 
-/** Emit lines for one `key = value` inside `config { }` (matches canonical value formatting). */
 function emitConfigKeyLines(meta: WorkflowMetadata, key: string, pad: string): string[] {
   switch (key) {
     case "agent.default_model":
@@ -159,8 +171,6 @@ function emitConfigKeyLines(meta: WorkflowMetadata, key: string, pad: string): s
       if (meta.run?.recoverLimit === undefined) return [];
       return [`${pad}run.recover_limit = ${meta.run.recoverLimit}`];
     case "runtime.docker_enabled":
-      // runtime.docker_enabled was removed; skip silently for back-compat with
-      // any cached AST that still carries the key in configBodySequence.
       return [];
     case "runtime.docker_image":
       if (meta.runtime?.dockerImage === undefined) return [];
@@ -185,10 +195,11 @@ function emitConfigKeyLines(meta: WorkflowMetadata, key: string, pad: string): s
   }
 }
 
-function emitConfig(meta: WorkflowMetadata, pad: string): string {
+function emitConfig(meta: WorkflowMetadata, pad: string, trivia: Trivia): string {
   const lines: string[] = ["config {"];
-  if (meta.configBodySequence?.length) {
-    for (const part of meta.configBodySequence) {
+  const seq = trivia.getNode(meta)?.configBodySequence;
+  if (seq?.length) {
+    for (const part of seq) {
       if (part.kind === "comment") {
         lines.push(`${pad}${part.text}`);
       } else {
@@ -227,7 +238,6 @@ function emitConfig(meta: WorkflowMetadata, pad: string): string {
   return lines.join("\n");
 }
 
-/** Top-level `const` RHS: bare slugs, JSON string, or triple-quoted when `"` / `\\` would break double-quote round-trip. */
 function emitEnvDecl(env: EnvDeclDef): string[] {
   if (env.value.includes("\n")) {
     const lines = [`const ${env.name} = """`];
@@ -237,6 +247,15 @@ function emitEnvDecl(env: EnvDeclDef): string[] {
     lines.push('"""');
     return lines;
   }
+  if (env.wasQuoted) {
+    // Author wrote a double-quoted string. Preserve the quoted form regardless
+    // of value content (the formatter must not toggle delimiters based on
+    // whether the value happens to contain a space).
+    if (/["\\]/.test(env.value)) {
+      return [`const ${env.name} = """`, env.value, '"""'];
+    }
+    return [`const ${env.name} = ${JSON.stringify(env.value)}`];
+  }
   if (/^[A-Za-z0-9_./@+#%^&=*:~?-]+$/.test(env.value)) {
     return [`const ${env.name} = ${env.value}`];
   }
@@ -250,27 +269,27 @@ function emitComments(comments: string[]): string[] {
   return comments.map((c) => (c.startsWith("#") ? c : `# ${c}`));
 }
 
-/** One section string: consecutive `#` lines stay single-spaced (module sections join with blank lines). */
 function emitCommentBlock(comments: string[]): string {
   return emitComments(comments).join("\n");
 }
 
-function emitRule(rule: RuleDef, pad: string, exported: boolean): string {
+function emitRule(rule: RuleDef, pad: string, exported: boolean, trivia: Trivia): string {
   const lines: string[] = [];
   lines.push(...emitComments(rule.comments));
   const paramStr = `(${rule.params.join(", ")})`;
   const prefix = exported ? "export " : "";
   lines.push(`${prefix}rule ${rule.name}${paramStr} {`);
-  lines.push(...emitSteps(rule.steps, pad, pad));
+  lines.push(...emitSteps(rule.steps, pad, pad, trivia));
   lines.push("}");
   return lines.join("\n");
 }
 
-function emitScript(script: ScriptDef, _pad: string, exported: boolean): string {
+function emitScript(script: ScriptDef, _pad: string, exported: boolean, trivia: Trivia): string {
   const lines: string[] = [];
   lines.push(...emitComments(script.comments));
   const prefix = exported ? "export " : "";
-  if (script.bodyKind === "fenced" || script.lang || script.body.includes("\n")) {
+  const bodyKind = tn(trivia, script).scriptBodyKind;
+  if (bodyKind === "fenced" || script.lang || script.body.includes("\n")) {
     const langTag = script.lang ?? "";
     lines.push(`${prefix}script ${script.name} = \`\`\`${langTag}`);
     for (const bl of script.body.split("\n")) {
@@ -283,7 +302,7 @@ function emitScript(script: ScriptDef, _pad: string, exported: boolean): string
   return lines.join("\n");
 }
 
-function emitWorkflow(wf: WorkflowDef, pad: string, exported: boolean): string {
+function emitWorkflow(wf: WorkflowDef, pad: string, exported: boolean, trivia: Trivia): string {
   const lines: string[] = [];
   lines.push(...emitComments(wf.comments));
 
@@ -292,13 +311,13 @@ function emitWorkflow(wf: WorkflowDef, pad: string, exported: boolean): string {
   lines.push(`${prefix}workflow ${wf.name}${paramStr} {`);
 
   if (wf.metadata) {
-    const configLines = emitConfig(wf.metadata, pad);
+    const configLines = emitConfig(wf.metadata, pad, trivia);
     for (const cl of configLines.split("\n")) {
       lines.push(`${pad}${cl}`);
     }
   }
 
-  lines.push(...emitSteps(wf.steps, pad, pad));
+  lines.push(...emitSteps(wf.steps, pad, pad, trivia));
 
   lines.push("}");
   return lines.join("\n");
@@ -312,9 +331,8 @@ function emitChannel(ch: ChannelDef): string {
   return `channel ${ch.name}`;
 }
 
-/** `log` / `logerr` message: bare identifier form vs JSON-string form (matches parse storage). */
-function emitLogMessageRhs(message: string): string {
-  // Parser stores bare `log name` as the literal string `${name}` (interpolation sentinel).
+/** Bare-identifier form for `log <ident>` / `logerr <ident>`. */
+function emitLogLiteralRhs(message: string): string {
   if (
     message.length >= 3 &&
     message[0] === "$" &&
@@ -329,107 +347,27 @@ function emitLogMessageRhs(message: string): string {
   return JSON.stringify(message);
 }
 
-function emitSteps(steps: WorkflowStepDef[], pad: string, currentIndent: string): string[] {
+function emitSteps(steps: WorkflowStepDef[], pad: string, currentIndent: string, trivia: Trivia): string[] {
   const lines: string[] = [];
   for (const step of steps) {
-    lines.push(...emitStep(step, pad, currentIndent));
+    lines.push(...emitStep(step, pad, currentIndent, trivia));
   }
   return lines;
 }
 
-/** Try to parse `` `body`(args) `` from the start of a string. Returns consumed length or null. */
-function parseInlineScriptArg(s: string): { body: string; innerArgs: string; consumed: number } | null {
-  if (!s.startsWith("`")) return null;
-  const closeIdx = s.indexOf("`", 1);
-  if (closeIdx === -1) return null;
-  const body = s.slice(1, closeIdx);
-  const afterClose = s.slice(closeIdx + 1);
-  if (!afterClose.startsWith("(")) return null;
-  let depth = 1;
-  let j = 1;
-  let inQuote: string | null = null;
-  while (j < afterClose.length && depth > 0) {
-    const ch = afterClose[j];
-    if (inQuote) {
-      if (ch === inQuote && afterClose[j - 1] !== "\\") inQuote = null;
-    } else {
-      if (ch === '"' || ch === "'") inQuote = ch;
-      else if (ch === "(") depth++;
-      else if (ch === ")") depth--;
-    }
-    j++;
-  }
-  if (depth !== 0) return null;
-  const innerArgs = afterClose.slice(1, j - 1).trim();
-  return { body, innerArgs, consumed: closeIdx + 1 + j };
-}
-
-/** Convert space-separated args back to comma-separated format with bare identifiers. */
-function formatArgs(args: string, bareIdentifierArgs?: string[]): string {
-  const bare = new Set(bareIdentifierArgs ?? []);
-  const tokens: string[] = [];
-  let i = 0;
-  while (i < args.length) {
-    while (i < args.length && (args[i] === " " || args[i] === "\t")) i++;
-    if (i >= args.length) break;
-    const tail = args.slice(i);
-    const keyword = tail.startsWith("run ")
-      ? "run"
-      : tail.startsWith("ensure ")
-        ? "ensure"
-        : null;
-    if (keyword) {
-      const afterKeyword = args.slice(i + keyword.length).trimStart();
-      const skipped = args.slice(i + keyword.length).length - afterKeyword.length;
-      const call = parseCallRef(afterKeyword);
-      if (call && (call.rest.length === 0 || /^\s/.test(call.rest))) {
-        const consumed = afterKeyword.length - call.rest.length;
-        tokens.push(`${keyword} ${call.ref}(${formatArgs(call.args ?? "", call.bareIdentifierArgs)})`);
-        i += keyword.length + skipped + consumed;
-        continue;
-      }
-      // Try inline script form: run `body`(args)
-      if (keyword === "run") {
-        const inlineResult = parseInlineScriptArg(afterKeyword);
-        if (inlineResult) {
-          const formattedInner = inlineResult.innerArgs ? formatArgs(inlineResult.innerArgs) : "";
-          tokens.push(`run \`${inlineResult.body}\`(${formattedInner})`);
-          i += keyword.length + skipped + inlineResult.consumed;
-          continue;
-        }
-      }
-    }
-    if (args[i] === '"') {
-      let j = i + 1;
-      while (j < args.length && !(args[j] === '"' && args[j - 1] !== "\\")) j++;
-      tokens.push(args.slice(i, j + 1));
-      i = j + 1;
-    } else {
-      let j = i;
-      while (j < args.length && args[j] !== " " && args[j] !== "\t") j++;
-      const token = args.slice(i, j);
-      const m = token.match(/^\$\{([a-zA-Z_][a-zA-Z0-9_]*)\}$/);
-      if (m && bare.has(m[1])) {
-        tokens.push(m[1]);
-      } else {
-        tokens.push(token);
-      }
-      i = j;
-    }
-  }
-  return tokens.join(", ");
+function formatArgs(args: Arg[] | undefined): string {
+  if (!args || args.length === 0) return "";
+  return args.map((a) => (a.kind === "var" ? a.name : a.raw)).join(", ");
 }
 
-/** Emit inline script form: `prefix \`body\`(args)` or fenced block. */
 function emitInlineScriptLines(
   prefix: string,
   body: string,
-  lang?: string,
-  args?: string,
-  bareIdentifierArgs?: string[],
+  lang: string | undefined,
+  args: Arg[] | undefined,
   ci?: string,
 ): string[] {
-  const argsStr = formatArgs(args ?? "", bareIdentifierArgs);
+  const argsStr = formatArgs(args);
   if (lang || body.includes("\n")) {
     const langTag = lang ?? "";
     const result = [`${prefix} \`\`\`${langTag}`];
@@ -442,11 +380,8 @@ function emitInlineScriptLines(
   return [`${prefix} \`${body}\`(${argsStr})`];
 }
 
-function emitRef(ref: { value: string }, args?: string, bareIdentifierArgs?: string[]): string {
-  if (args !== undefined) {
-    return `${ref.value}(${formatArgs(args, bareIdentifierArgs)})`;
-  }
-  return `${ref.value}()`;
+function emitRef(ref: { value: string }, args: Arg[] | undefined): string {
+  return `${ref.value}(${formatArgs(args)})`;
 }
 
 function emitMatchPattern(p: import("../types").MatchPatternDef): string {
@@ -457,7 +392,6 @@ function emitMatchPattern(p: import("../types").MatchPatternDef): string {
 
 function emitMatchArm(arm: import("../types").MatchArmDef, armIndent: string, bodyIndent: string): string[] {
   const patStr = emitMatchPattern(arm.pattern);
-  // Multiline body (triple-quoted): body stored as "line1\nline2" with outer quotes and actual newlines.
   if (arm.body.startsWith('"') && arm.body.endsWith('"') && arm.body.includes("\n")) {
     const inner = arm.body.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
     const lines: string[] = [`${armIndent}${patStr} => """`];
@@ -470,348 +404,307 @@ function emitMatchArm(arm: import("../types").MatchArmDef, armIndent: string, bo
   return [`${armIndent}${patStr} => ${arm.body}`];
 }
 
-function emitStep(step: WorkflowStepDef, pad: string, currentIndent: string): string[] {
+/**
+ * Emit an `Expr` as it would appear after a `=` / `<-` / `return` / `log` etc.
+ * Multi-line value forms (inline-script fenced bodies, triple-quoted literals,
+ * match arm blocks, triple-quoted prompts) return additional lines via the
+ * `tail` array so the caller can append them at the right indent level.
+ */
+function emitExprFirstLine(
+  expr: Expr,
+  trivia: Trivia,
+  ci: string,
+  pad: string,
+): { head: string; tail: string[] } {
+  const valueTrivia = tn(trivia, expr);
+  if (expr.kind === "literal") {
+    if (valueTrivia.tripleQuoted) {
+      const inner = valueTrivia.rawBody ?? expr.raw.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
+      const tail: string[] = [];
+      for (const bl of inner.split("\n")) tail.push(bl);
+      tail.push(`${ci}"""`);
+      return { head: '"""', tail };
+    }
+    if (valueTrivia.bareSource) {
+      return { head: valueTrivia.bareSource, tail: [] };
+    }
+    return { head: expr.raw, tail: [] };
+  }
+  if (expr.kind === "call") {
+    const asyncMod = expr.async ? "async " : "";
+    return { head: `run ${asyncMod}${emitRef(expr.callee, expr.args)}`, tail: [] };
+  }
+  if (expr.kind === "ensure_call") {
+    return { head: `ensure ${emitRef(expr.callee, expr.args)}`, tail: [] };
+  }
+  if (expr.kind === "inline_script") {
+    if (expr.lang || expr.body.includes("\n")) {
+      const langTag = expr.lang ?? "";
+      const tail: string[] = [];
+      for (const bl of expr.body.split("\n")) tail.push(bl);
+      tail.push(`${ci}\`\`\`(${formatArgs(expr.args)})`);
+      return { head: `run \`\`\`${langTag}`, tail };
+    }
+    return { head: `run \`${expr.body}\`(${formatArgs(expr.args)})`, tail: [] };
+  }
+  if (expr.kind === "prompt") {
+    const returns = expr.returns ? ` returns "${expr.returns}"` : "";
+    if (valueTrivia.bodyKind === "identifier" && valueTrivia.bodyIdentifier) {
+      return { head: `prompt ${valueTrivia.bodyIdentifier}${returns}`, tail: [] };
+    }
+    if (valueTrivia.bodyKind === "triple_quoted") {
+      const inner = valueTrivia.rawBody ?? expr.raw.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
+      const tail: string[] = [];
+      for (const bl of inner.split("\n")) tail.push(bl);
+      tail.push(`${ci}"""`);
+      if (expr.returns) {
+        tail.push(`${ci}returns "${expr.returns}"`);
+      }
+      return { head: 'prompt """', tail };
+    }
+    return { head: `prompt ${expr.raw}${returns}`, tail: [] };
+  }
+  if (expr.kind === "match") {
+    const tail: string[] = [];
+    for (const arm of expr.match.arms) {
+      tail.push(...emitMatchArm(arm, `${ci}${pad}`, ci));
+    }
+    tail.push(`${ci}}`);
+    return { head: `match ${expr.match.subject} {`, tail };
+  }
+  if (expr.kind === "shell") {
+    return { head: expr.command, tail: [] };
+  }
+  // bare_ref
+  return { head: expr.ref.value, tail: [] };
+}
+
+function emitStep(step: WorkflowStepDef, pad: string, currentIndent: string, trivia: Trivia): string[] {
   const lines: string[] = [];
   const ci = currentIndent;
 
-  switch (step.type) {
-    case "blank_line":
+  if (step.type === "trivia") {
+    if (step.kind === "blank_line") {
       lines.push("");
-      break;
-
-    case "comment":
-      lines.push(`${ci}${step.text}`);
-      break;
+    } else {
+      lines.push(`${ci}${step.text ?? ""}`);
+    }
+    return lines;
+  }
 
-    case "shell": {
-      if (step.captureName) {
-        lines.push(`${ci}${step.captureName} = ${step.command}`);
+  if (step.type === "say") {
+    const message = step.message;
+    if (step.level === "fail") {
+      // fail always takes a literal message; preserve triple-quoted form when present.
+      const msgTrivia = tn(trivia, message);
+      if (message.kind === "literal" && msgTrivia.tripleQuoted) {
+        const inner = msgTrivia.rawBody ?? message.raw.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
+        lines.push(`${ci}fail """`);
+        for (const bl of inner.split("\n")) lines.push(bl);
+        lines.push(`${ci}"""`);
+      } else if (message.kind === "literal") {
+        lines.push(`${ci}fail ${message.raw}`);
       } else {
-        lines.push(`${ci}${step.command}`);
+        const { head, tail } = emitExprFirstLine(message, trivia, ci, pad);
+        lines.push(`${ci}fail ${head}`);
+        lines.push(...tail);
       }
-      break;
+      return lines;
     }
-
-    case "ensure": {
-      const ref = emitRef(step.ref, step.args, step.bareIdentifierArgs);
-      const capture = step.captureName ? `${step.captureName} = ` : "";
-      if (step.catch) {
-        const b = step.catch.bindings;
-        const bindStr = `(${b.failure})`;
-        if ("single" in step.catch) {
-          const recoverLines = emitStep(step.catch.single, pad, "");
-          const recoverText = recoverLines.map((l) => l.trim()).join("\n");
-          lines.push(`${ci}${capture}ensure ${ref} catch ${bindStr} ${recoverText}`);
-        } else {
-          lines.push(`${ci}${capture}ensure ${ref} catch ${bindStr} {`);
-          lines.push(...emitSteps(step.catch.block, pad, ci + pad));
-          lines.push(`${ci}}`);
-        }
+    const verb = step.level;
+    if (message.kind === "inline_script") {
+      lines.push(...emitInlineScriptLines(`${ci}${verb} run`, message.body, message.lang, message.args, ci));
+      return lines;
+    }
+    if (message.kind === "literal") {
+      const msgTrivia = tn(trivia, message);
+      if (msgTrivia.tripleQuoted) {
+        const inner = msgTrivia.rawBody ?? message.raw;
+        lines.push(`${ci}${verb} """`);
+        for (const bl of inner.split("\n")) lines.push(bl);
+        lines.push(`${ci}"""`);
       } else {
-        lines.push(`${ci}${capture}ensure ${ref}`);
+        lines.push(`${ci}${verb} ${emitLogLiteralRhs(message.raw)}`);
       }
-      break;
+      return lines;
     }
+    // Fallback for any other Expr kind (shouldn't occur per validator).
+    const { head, tail } = emitExprFirstLine(message, trivia, ci, pad);
+    lines.push(`${ci}${verb} ${head}`);
+    lines.push(...tail);
+    return lines;
+  }
+
+  if (step.type === "shell" as never) {
+    // Defensive: should never appear in the new AST (shell is an exec body kind).
+    return lines;
+  }
 
-    case "run": {
-      const ref = emitRef(step.workflow, step.args, step.bareIdentifierArgs);
-      const capture = step.captureName ? `${step.captureName} = ` : "";
-      const asyncPrefix = step.async ? "async " : "";
+  if (step.type === "exec") {
+    const body = step.body;
+    if (body.kind === "shell") {
+      if (step.captureName) {
+        lines.push(`${ci}${step.captureName} = ${body.command}`);
+      } else {
+        lines.push(`${ci}${body.command}`);
+      }
+      return lines;
+    }
+    const capture = step.captureName ? `${step.captureName} = ` : "";
+    if (body.kind === "call") {
+      const ref = emitRef(body.callee, body.args);
+      const asyncPrefix = body.async ? "async " : "";
       if (step.recover) {
         const b = step.recover.bindings;
         const bindStr = `(${b.failure})`;
         if ("single" in step.recover) {
-          const recoverLines = emitStep(step.recover.single, pad, "");
+          const recoverLines = emitStep(step.recover.single, pad, "", trivia);
           const recoverText = recoverLines.map((l) => l.trim()).join("\n");
           lines.push(`${ci}${capture}run ${asyncPrefix}${ref} recover ${bindStr} ${recoverText}`);
         } else {
           lines.push(`${ci}${capture}run ${asyncPrefix}${ref} recover ${bindStr} {`);
-          lines.push(...emitSteps(step.recover.block, pad, ci + pad));
+          lines.push(...emitSteps(step.recover.block, pad, ci + pad, trivia));
           lines.push(`${ci}}`);
         }
       } else if (step.catch) {
         const b = step.catch.bindings;
         const bindStr = `(${b.failure})`;
         if ("single" in step.catch) {
-          const recoverLines = emitStep(step.catch.single, pad, "");
+          const recoverLines = emitStep(step.catch.single, pad, "", trivia);
           const recoverText = recoverLines.map((l) => l.trim()).join("\n");
           lines.push(`${ci}${capture}run ${asyncPrefix}${ref} catch ${bindStr} ${recoverText}`);
         } else {
           lines.push(`${ci}${capture}run ${asyncPrefix}${ref} catch ${bindStr} {`);
-          lines.push(...emitSteps(step.catch.block, pad, ci + pad));
+          lines.push(...emitSteps(step.catch.block, pad, ci + pad, trivia));
           lines.push(`${ci}}`);
         }
       } else {
         lines.push(`${ci}${capture}run ${asyncPrefix}${ref}`);
       }
-      break;
-    }
-
-    case "run_inline_script": {
-      const capture = step.captureName ? `${step.captureName} = ` : "";
-      const argsStr = formatArgs(step.args ?? "", step.bareIdentifierArgs);
-      if (step.lang || step.body.includes("\n")) {
-        const langTag = step.lang ?? "";
-        lines.push(`${ci}${capture}run \`\`\`${langTag}`);
-        for (const bl of step.body.split("\n")) {
-          lines.push(bl);
-        }
-        lines.push(`${ci}\`\`\`(${argsStr})`);
-      } else {
-        lines.push(`${ci}${capture}run \`${step.body}\`(${argsStr})`);
-      }
-      break;
+      return lines;
     }
-
-    case "prompt": {
-      const capture = step.captureName ? `${step.captureName} = ` : "";
-      const returns = step.returns ? ` returns "${step.returns}"` : "";
-      if (step.bodyKind === "identifier" && step.bodyIdentifier) {
-        lines.push(`${ci}${capture}prompt ${step.bodyIdentifier}${returns}`);
-      } else if (step.bodyKind === "triple_quoted") {
-        const inner = step.raw.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
-        lines.push(`${ci}${capture}prompt """`);
-        for (const bl of inner.split("\n")) {
-          lines.push(bl);
-        }
-        lines.push(`${ci}"""`);
-        if (step.returns) {
-          lines.push(`${ci}returns "${step.returns}"`);
+    if (body.kind === "ensure_call") {
+      const ref = emitRef(body.callee, body.args);
+      if (step.catch) {
+        const b = step.catch.bindings;
+        const bindStr = `(${b.failure})`;
+        if ("single" in step.catch) {
+          const recoverLines = emitStep(step.catch.single, pad, "", trivia);
+          const recoverText = recoverLines.map((l) => l.trim()).join("\n");
+          lines.push(`${ci}${capture}ensure ${ref} catch ${bindStr} ${recoverText}`);
+        } else {
+          lines.push(`${ci}${capture}ensure ${ref} catch ${bindStr} {`);
+          lines.push(...emitSteps(step.catch.block, pad, ci + pad, trivia));
+          lines.push(`${ci}}`);
         }
       } else {
-        lines.push(`${ci}${capture}prompt ${step.raw}${returns}`);
+        lines.push(`${ci}${capture}ensure ${ref}`);
       }
-      break;
+      return lines;
     }
-
-    case "const": {
-      lines.push(`${ci}${emitConstStep(step.name, step.value)}`);
-      // Handle multi-line inline script capture body
-      if (step.value.kind === "run_inline_script_capture" &&
-          (step.value.lang || step.value.body.includes("\n"))) {
-        for (const bl of step.value.body.split("\n")) {
-          lines.push(bl);
-        }
-        const argsStr = formatArgs(step.value.args ?? "", step.value.bareIdentifierArgs);
+    if (body.kind === "inline_script") {
+      const argsStr = formatArgs(body.args);
+      if (body.lang || body.body.includes("\n")) {
+        const langTag = body.lang ?? "";
+        lines.push(`${ci}${capture}run \`\`\`${langTag}`);
+        for (const bl of body.body.split("\n")) lines.push(bl);
         lines.push(`${ci}\`\`\`(${argsStr})`);
-      }
-      // Handle multi-line triple-quoted prompt capture body
-      if (step.value.kind === "prompt_capture" && step.value.bodyKind === "triple_quoted") {
-        const inner = step.value.raw.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
-        for (const bl of inner.split("\n")) {
-          lines.push(bl);
-        }
-        lines.push(`${ci}"""`);
-        if (step.value.returns) {
-          lines.push(`${ci}returns "${step.value.returns}"`);
-        }
-      }
-      // Handle match expression arms and closing brace
-      if (step.value.kind === "match_expr") {
-        for (const arm of step.value.match.arms) {
-          lines.push(...emitMatchArm(arm, `${ci}${pad}`, ci));
-        }
-        lines.push(`${ci}}`);
-      }
-      // Handle multi-line triple-quoted expr (const name = """...""")
-      if (step.value.kind === "expr" && step.value.bashRhs.startsWith('"') &&
-          step.value.bashRhs.endsWith('"') && step.value.bashRhs.includes("\n")) {
-        const inner = step.value.bashRhs.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
-        for (const bl of inner.split("\n")) {
-          lines.push(bl);
-        }
-        lines.push(`${ci}"""`);
-      }
-      break;
-    }
-
-    case "fail": {
-      if (step.message.includes("\n")) {
-        const inner = step.message.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
-        lines.push(`${ci}fail """`);
-        for (const bl of inner.split("\n")) {
-          lines.push(bl);
-        }
-        lines.push(`${ci}"""`);
-      } else {
-        lines.push(`${ci}fail ${step.message}`);
-      }
-      break;
-    }
-
-    case "log":
-      if (step.managed?.kind === "run_inline_script") {
-        lines.push(...emitInlineScriptLines(`${ci}log run`, step.managed.body, step.managed.lang, step.managed.args, step.managed.bareIdentifierArgs, ci));
-      } else if (step.message.includes("\n")) {
-        lines.push(`${ci}log """`);
-        for (const bl of step.message.split("\n")) {
-          lines.push(bl);
-        }
-        lines.push(`${ci}"""`);
-      } else {
-        lines.push(`${ci}log ${emitLogMessageRhs(step.message)}`);
-      }
-      break;
-
-    case "logerr":
-      if (step.managed?.kind === "run_inline_script") {
-        lines.push(...emitInlineScriptLines(`${ci}logerr run`, step.managed.body, step.managed.lang, step.managed.args, step.managed.bareIdentifierArgs, ci));
-      } else if (step.message.includes("\n")) {
-        lines.push(`${ci}logerr """`);
-        for (const bl of step.message.split("\n")) {
-          lines.push(bl);
-        }
-        lines.push(`${ci}"""`);
-      } else {
-        lines.push(`${ci}logerr ${emitLogMessageRhs(step.message)}`);
-      }
-      break;
-
-    case "return": {
-      if (step.managed) {
-        if (step.managed.kind === "run") {
-          lines.push(`${ci}return run ${emitRef(step.managed.ref, step.managed.args, step.managed.bareIdentifierArgs)}`);
-        } else if (step.managed.kind === "ensure") {
-          lines.push(`${ci}return ensure ${emitRef(step.managed.ref, step.managed.args, step.managed.bareIdentifierArgs)}`);
-        } else if (step.managed.kind === "match") {
-          lines.push(`${ci}return match ${step.managed.match.subject} {`);
-          for (const arm of step.managed.match.arms) {
-            lines.push(...emitMatchArm(arm, `${ci}${pad}`, ci));
-          }
-          lines.push(`${ci}}`);
-        } else if (step.managed.kind === "run_inline_script") {
-          lines.push(...emitInlineScriptLines(`${ci}return run`, step.managed.body, step.managed.lang, step.managed.args, step.managed.bareIdentifierArgs, ci));
-        }
-      } else if (step.bareSource) {
-        lines.push(`${ci}return ${step.bareSource}`);
-      } else if (step.value.includes("\n")) {
-        const inner = step.value.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
-        lines.push(`${ci}return """`);
-        for (const bl of inner.split("\n")) {
-          lines.push(bl);
-        }
-        lines.push(`${ci}"""`);
       } else {
-        lines.push(`${ci}return ${step.value}`);
+        lines.push(`${ci}${capture}run \`${body.body}\`(${argsStr})`);
       }
-      break;
+      return lines;
     }
-
-    case "send": {
-      if (step.rhs.kind === "literal" && step.rhs.token.includes("\n")) {
-        const inner = step.rhs.token.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
-        lines.push(`${ci}${step.channel} <- """`);
-        for (const bl of inner.split("\n")) {
-          lines.push(bl);
-        }
+    if (body.kind === "prompt") {
+      const bodyTrivia = tn(trivia, body);
+      const returns = body.returns ? ` returns "${body.returns}"` : "";
+      if (bodyTrivia.bodyKind === "identifier" && bodyTrivia.bodyIdentifier) {
+        lines.push(`${ci}${capture}prompt ${bodyTrivia.bodyIdentifier}${returns}`);
+      } else if (bodyTrivia.bodyKind === "triple_quoted") {
+        const inner = bodyTrivia.rawBody ?? body.raw.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
+        lines.push(`${ci}${capture}prompt """`);
+        for (const bl of inner.split("\n")) lines.push(bl);
         lines.push(`${ci}"""`);
+        if (body.returns) lines.push(`${ci}returns "${body.returns}"`);
       } else {
-        const rhs = emitSendRhs(step.rhs);
-        lines.push(`${ci}${step.channel} <- ${rhs}`);
+        lines.push(`${ci}${capture}prompt ${body.raw}${returns}`);
       }
-      break;
+      return lines;
     }
-
-
-    case "match": {
-      lines.push(`${ci}match ${step.expr.subject} {`);
-      for (const arm of step.expr.arms) {
+    if (body.kind === "match") {
+      lines.push(`${ci}${capture}match ${body.match.subject} {`);
+      for (const arm of body.match.arms) {
         lines.push(...emitMatchArm(arm, `${ci}${pad}`, ci));
       }
       lines.push(`${ci}}`);
-      break;
+      return lines;
     }
+    // bare_ref / literal — not valid as exec body, but handle defensively.
+    const { head, tail } = emitExprFirstLine(body, trivia, ci, pad);
+    lines.push(`${ci}${capture}${head}`);
+    lines.push(...tail);
+    return lines;
+  }
 
-    case "if": {
-      const operandStr = step.operand.kind === "string_literal"
-        ? `"${step.operand.value}"`
-        : `/${step.operand.source}/`;
-      lines.push(`${ci}if ${step.subject} ${step.operator} ${operandStr} {`);
-      lines.push(...emitSteps(step.body, pad, ci + pad));
-      lines.push(`${ci}}`);
-      break;
-    }
+  if (step.type === "const") {
+    const { head, tail } = emitExprFirstLine(step.value, trivia, ci, pad);
+    lines.push(`${ci}const ${step.name} = ${head}`);
+    lines.push(...tail);
+    return lines;
+  }
 
-    case "for_lines": {
-      lines.push(`${ci}for ${step.iterVar} in ${step.sourceVar} {`);
-      lines.push(...emitSteps(step.body, pad, ci + pad));
-      lines.push(`${ci}}`);
-      break;
-    }
+  if (step.type === "return") {
+    const { head, tail } = emitExprFirstLine(step.value, trivia, ci, pad);
+    lines.push(`${ci}return ${head}`);
+    lines.push(...tail);
+    return lines;
   }
 
-  return lines;
-}
+  if (step.type === "send") {
+    const { head, tail } = emitExprFirstLine(step.value, trivia, ci, pad);
+    lines.push(`${ci}${step.channel} <- ${head}`);
+    lines.push(...tail);
+    return lines;
+  }
 
-function emitConstStep(name: string, value: ConstRhs): string {
-  switch (value.kind) {
-    case "expr":
-      if (value.bashRhs.startsWith('"') && value.bashRhs.endsWith('"') && value.bashRhs.includes("\n")) {
-        // Multi-line: caller handles remaining lines
-        return `const ${name} = """`;
-      }
-      return `const ${name} = ${value.bashRhs}`;
-    case "run_capture": {
-      const asyncMod = value.async ? "async " : "";
-      return `const ${name} = run ${asyncMod}${emitRef(value.ref, value.args, value.bareIdentifierArgs)}`;
-    }
-    case "ensure_capture":
-      return `const ${name} = ensure ${emitRef(value.ref, value.args, value.bareIdentifierArgs)}`;
-    case "prompt_capture": {
-      const returns = value.returns ? ` returns "${value.returns}"` : "";
-      if (value.bodyKind === "identifier" && value.bodyIdentifier) {
-        return `const ${name} = prompt ${value.bodyIdentifier}${returns}`;
-      }
-      if (value.bodyKind === "triple_quoted") {
-        // Multi-line: caller handles remaining lines
-        return `const ${name} = prompt """`;
-      }
-      return `const ${name} = prompt ${value.raw}${returns}`;
-    }
-    case "match_expr": {
-      // Multi-line format; return first line (const assignment opens the block)
-      return `const ${name} = match ${value.match.subject} {`;
-    }
-    case "run_inline_script_capture": {
-      const argsStr = formatArgs(value.args ?? "", value.bareIdentifierArgs);
-      if (value.lang || value.body.includes("\n")) {
-        const langTag = value.lang ?? "";
-        return `const ${name} = run \`\`\`${langTag}`;
-      }
-      return `const ${name} = run \`${value.body}\`(${argsStr})`;
+  if (step.type === "if") {
+    const operandStr = step.operand.kind === "string_literal"
+      ? `"${step.operand.value}"`
+      : `/${step.operand.source}/`;
+    lines.push(`${ci}if ${step.subject} ${step.operator} ${operandStr} {`);
+    lines.push(...emitSteps(step.body, pad, ci + pad, trivia));
+    if (step.elseBody) {
+      lines.push(`${ci}} else {`);
+      lines.push(...emitSteps(step.elseBody, pad, ci + pad, trivia));
     }
+    lines.push(`${ci}}`);
+    return lines;
   }
-}
 
-function emitSendRhs(rhs: SendRhsDef): string {
-  switch (rhs.kind) {
-    case "literal":
-      return rhs.token;
-    case "var":
-      return rhs.bash;
-    case "run":
-      return `run ${emitRef(rhs.ref, rhs.args, rhs.bareIdentifierArgs)}`;
-    case "bare_ref":
-      return rhs.ref.value;
-    case "shell":
-      return rhs.command;
+  if (step.type === "for_lines") {
+    lines.push(`${ci}for ${step.iterVar} in ${step.sourceVar} {`);
+    lines.push(...emitSteps(step.body, pad, ci + pad, trivia));
+    lines.push(`${ci}}`);
+    return lines;
   }
+
+  return lines;
 }
 
-function emitTestBlock(test: TestBlockDef, pad: string): string {
+function emitTestBlock(test: TestBlockDef, pad: string, trivia: Trivia): string {
   const lines: string[] = [];
-  if (test.leadingComments?.length) {
-    lines.push(...emitComments(test.leadingComments));
+  const lc = tn(trivia, test).leadingComments;
+  if (lc?.length) {
+    lines.push(...emitComments(lc));
   }
   lines.push(`test "${test.description}" {`);
   for (const step of test.steps) {
-    lines.push(...emitTestStep(step, pad));
+    lines.push(...emitTestStep(step, pad, trivia));
   }
   lines.push("}");
   return lines.join("\n");
 }
 
-function emitTestStep(step: TestStepDef, pad: string): string[] {
+function emitTestStep(step: TestStepDef, pad: string, trivia: Trivia): string[] {
   switch (step.type) {
     case "comment":
       return [`${pad}${step.text}`];
@@ -852,14 +745,14 @@ function emitTestStep(step: TestStepDef, pad: string): string[] {
     case "test_mock_workflow": {
       const paramStr = `(${step.params.join(", ")})`;
       const lines = [`${pad}mock workflow ${step.ref}${paramStr} {`];
-      lines.push(...emitSteps(step.steps, pad, pad + pad));
+      lines.push(...emitSteps(step.steps, pad, pad + pad, trivia));
       lines.push(`${pad}}`);
       return lines;
     }
     case "test_mock_rule": {
       const paramStr = `(${step.params.join(", ")})`;
       const lines = [`${pad}mock rule ${step.ref}${paramStr} {`];
-      lines.push(...emitSteps(step.steps, pad, pad + pad));
+      lines.push(...emitSteps(step.steps, pad, pad + pad, trivia));
       lines.push(`${pad}}`);
       return lines;
     }
diff --git a/src/format/roundtrip.test.ts b/src/format/roundtrip.test.ts
new file mode 100644
index 00000000..0acc3ed3
--- /dev/null
+++ b/src/format/roundtrip.test.ts
@@ -0,0 +1,73 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readFileSync, readdirSync, statSync } from "node:fs";
+import { join, resolve } from "node:path";
+import { parsejaiphWithTrivia } from "../parser";
+import { emitModule } from "./emit";
+
+// Tests run from dist/src/format/roundtrip.test.js, so repo root is four levels up.
+const repoRoot = resolve(__dirname, "../../..");
+
+function findjhFiles(root: string): string[] {
+  const out: string[] = [];
+  const stack = [root];
+  while (stack.length > 0) {
+    const dir = stack.pop()!;
+    let entries: string[];
+    try {
+      entries = readdirSync(dir);
+    } catch {
+      continue;
+    }
+    for (const e of entries) {
+      const p = join(dir, e);
+      let s;
+      try {
+        s = statSync(p);
+      } catch {
+        continue;
+      }
+      if (s.isDirectory()) {
+        stack.push(p);
+      } else if (p.endsWith(".jh") && !p.endsWith(".broken.jh")) {
+        // Skip *.test.jh? We include them — they're also DSL.
+        out.push(p);
+      }
+    }
+  }
+  return out.sort();
+}
+
+const fixtureRoots = [
+  join(repoRoot, "examples"),
+  join(repoRoot, "test-fixtures/golden-ast/fixtures"),
+];
+
+const allFixtures: string[] = [];
+for (const root of fixtureRoots) {
+  allFixtures.push(...findjhFiles(root));
+}
+
+if (allFixtures.length === 0) {
+  test("AC3: round-trip fixtures present", () => {
+    assert.fail("expected at least one .jh fixture under examples/ and test-fixtures/");
+  });
+}
+
+for (const file of allFixtures) {
+  const rel = file.replace(repoRoot + "/", "");
+  test(`AC3: parse → format → parse → format is bit-for-bit on ${rel}`, () => {
+    const source = readFileSync(file, "utf8");
+    // First pass: parse and format.
+    const first = parsejaiphWithTrivia(source, file);
+    const formatted1 = emitModule(first.ast, first.trivia);
+    // Second pass: parse the formatted output and format again.
+    const second = parsejaiphWithTrivia(formatted1, file);
+    const formatted2 = emitModule(second.ast, second.trivia);
+    assert.equal(
+      formatted2,
+      formatted1,
+      `second formatting diverged from first for ${rel}`,
+    );
+  });
+}
diff --git a/src/parse/arg-ast-shape.test.ts b/src/parse/arg-ast-shape.test.ts
new file mode 100644
index 00000000..3ce31de2
--- /dev/null
+++ b/src/parse/arg-ast-shape.test.ts
@@ -0,0 +1,62 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import type { Expr, WorkflowStepDef } from "../types";
+
+/**
+ * AC1 (Refactor 3): `bareIdentifierArgs` must not appear on any call-bearing
+ * AST node, and the three "managed call that yields a value" encodings
+ * — `managed:` sidecar / `run_capture` const RHS / placeholder strings
+ * — have been replaced by a single `Expr` shape that carries `args: Arg[]`.
+ *
+ * Each helper below probes a specific Expr variant where the field used to
+ * live; if it is re-added, `HasField` widens to `true`, the type-level
+ * assertion fails, and TypeScript breaks compilation.
+ */
+type HasField<T, K extends string> = T extends Record<K, unknown> ? true : false;
+
+type ExecStep = Extract<WorkflowStepDef, { type: "exec" }>;
+type ReturnStep = Extract<WorkflowStepDef, { type: "return" }>;
+type SayStep = Extract<WorkflowStepDef, { type: "say" }>;
+type SendStep = Extract<WorkflowStepDef, { type: "send" }>;
+type ConstStep = Extract<WorkflowStepDef, { type: "const" }>;
+
+type CallExpr = Extract<Expr, { kind: "call" }>;
+type EnsureCallExpr = Extract<Expr, { kind: "ensure_call" }>;
+type InlineScriptExpr = Extract<Expr, { kind: "inline_script" }>;
+type PromptExpr = Extract<Expr, { kind: "prompt" }>;
+type SendRunExpr = SendStep["value"];
+type ConstValueExpr = ConstStep["value"];
+
+const _callNoBare: HasField<CallExpr, "bareIdentifierArgs"> = false;
+const _ensureCallNoBare: HasField<EnsureCallExpr, "bareIdentifierArgs"> = false;
+const _inlineNoBare: HasField<InlineScriptExpr, "bareIdentifierArgs"> = false;
+const _promptNoBare: HasField<PromptExpr, "bareIdentifierArgs"> = false;
+const _sendValueNoBare: HasField<SendRunExpr, "bareIdentifierArgs"> = false;
+const _constValueNoBare: HasField<ConstValueExpr, "bareIdentifierArgs"> = false;
+
+// Managed sidecar / placeholder strings on return/log/logerr/etc. are gone:
+const _returnNoManaged: HasField<ReturnStep, "managed"> = false;
+const _sayNoManaged: HasField<SayStep, "managed"> = false;
+const _execNoManaged: HasField<ExecStep, "managed"> = false;
+
+// return.value is now an Expr (not a placeholder string).
+const _returnValueIsExpr: ReturnStep["value"] extends Expr ? true : false = true;
+const _sayMessageIsExpr: SayStep["message"] extends Expr ? true : false = true;
+const _sendValueIsExpr: SendStep["value"] extends Expr ? true : false = true;
+const _constValueIsExpr: ConstStep["value"] extends Expr ? true : false = true;
+
+test("AC1: managed-call encodings collapsed into Expr; no `bareIdentifierArgs` on Expr", () => {
+  assert.equal(_callNoBare, false);
+  assert.equal(_ensureCallNoBare, false);
+  assert.equal(_inlineNoBare, false);
+  assert.equal(_promptNoBare, false);
+  assert.equal(_sendValueNoBare, false);
+  assert.equal(_constValueNoBare, false);
+  assert.equal(_returnNoManaged, false);
+  assert.equal(_sayNoManaged, false);
+  assert.equal(_execNoManaged, false);
+  assert.equal(_returnValueIsExpr, true);
+  assert.equal(_sayMessageIsExpr, true);
+  assert.equal(_sendValueIsExpr, true);
+  assert.equal(_constValueIsExpr, true);
+});
diff --git a/src/parse/arg-grep.test.ts b/src/parse/arg-grep.test.ts
new file mode 100644
index 00000000..ceb8a372
--- /dev/null
+++ b/src/parse/arg-grep.test.ts
@@ -0,0 +1,67 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readdirSync, readFileSync, statSync } from "node:fs";
+import { resolve, join } from "node:path";
+
+// Tests run from dist/src/parse/, so repo root is three levels up.
+const repoRoot = resolve(__dirname, "../../..");
+
+function listTsFiles(dir: string): string[] {
+  const out: string[] = [];
+  const walk = (d: string): void => {
+    for (const name of readdirSync(d)) {
+      const abs = join(d, name);
+      const st = statSync(abs);
+      if (st.isDirectory()) {
+        walk(abs);
+      } else if (name.endsWith(".ts") && !name.endsWith(".test.ts") && !name.endsWith(".d.ts")) {
+        out.push(abs);
+      }
+    }
+  };
+  walk(dir);
+  return out;
+}
+
+const parseSources = listTsFiles(join(repoRoot, "src/parse"));
+const transpileSources = listTsFiles(join(repoRoot, "src/transpile"));
+
+/**
+ * AC2: no production code under src/parse/ or src/transpile/ may re-parse a
+ * call's `args` payload into bare-identifier components. The tokenizer / parser
+ * builds `Arg[]` once via `commaArgsToArgList` in `src/parse/core.ts`;
+ * downstream consumers walk that typed list directly — no `args.split(",")`,
+ * no `bareIdentifierArgs` shadow field, no ad-hoc rescans.
+ */
+test("AC2: no args re-parse into bare-identifier components outside the tokenizer", () => {
+  const forbidden: RegExp[] = [
+    /\bargs\.split\s*\(\s*[`'"],/,
+    /\bbareIdentifierArgs\b/,
+  ];
+  for (const file of [...parseSources, ...transpileSources]) {
+    const content = readFileSync(file, "utf8");
+    for (const re of forbidden) {
+      assert.equal(
+        re.test(content),
+        false,
+        `${file} matches forbidden args re-parse pattern ${re}`,
+      );
+    }
+  }
+});
+
+/**
+ * AC3: `validateBareIdentifierArgs` is deleted. The bare-arg check folds into
+ * the per-step validator that already walks the call: each `Arg` of kind
+ * `"var"` is resolved against in-scope bindings inline.
+ */
+test("AC3: validateBareIdentifierArgs does not reappear in src/transpile/", () => {
+  for (const file of transpileSources) {
+    const content = readFileSync(file, "utf8");
+    assert.equal(
+      /\bvalidateBareIdentifierArgs\b/.test(content),
+      false,
+      `${file} references validateBareIdentifierArgs — it must stay deleted`,
+    );
+  }
+});
diff --git a/src/parse/canonicalize-triple-quoted.test.ts b/src/parse/canonicalize-triple-quoted.test.ts
new file mode 100644
index 00000000..55f9020a
--- /dev/null
+++ b/src/parse/canonicalize-triple-quoted.test.ts
@@ -0,0 +1,105 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readFileSync, readdirSync, statSync } from "node:fs";
+import { resolve, join } from "node:path";
+import { parsejaiph } from "../parser";
+import {
+  canonicalizeTripleQuotedString,
+  tripleQuoteBodyToRaw,
+} from "./triple-quote";
+import { dedentCommonLeadingWhitespace } from "./dedent";
+import type { Expr, WorkflowStepDef } from "../types";
+
+// Tests run from dist/src/parse/, so repo root is three levels up.
+const repoRoot = resolve(__dirname, "../../..");
+
+/**
+ * Verbatim copy of the pre-move `tripleQuotedRawForRuntime` (the helper that
+ * lived in `src/runtime/orchestration-text.ts`). Used as the parity baseline:
+ * the new parser-side `canonicalizeTripleQuotedString` must produce bit-for-bit
+ * identical output for every triple-quoted match-arm body in the corpus.
+ */
+function legacyTripleQuotedRawForRuntime(raw: string): string {
+  if (raw.length < 2 || raw[0] !== '"' || raw[raw.length - 1] !== '"') return raw;
+  const inner = raw.slice(1, -1).replace(/\\"/g, '"').replace(/\\\\/g, "\\");
+  return tripleQuoteBodyToRaw(dedentCommonLeadingWhitespace(inner));
+}
+
+function listJhFiles(dir: string): string[] {
+  const out: string[] = [];
+  for (const entry of readdirSync(dir)) {
+    const abs = join(dir, entry);
+    if (statSync(abs).isDirectory()) {
+      out.push(...listJhFiles(abs));
+      continue;
+    }
+    if (entry.endsWith(".jh") || entry.endsWith(".test.jh")) out.push(abs);
+  }
+  return out;
+}
+
+function collectTripleQuotedArmBodies(expr: Expr, bodies: string[]): void {
+  if (expr.kind === "match") {
+    for (const arm of expr.match.arms) {
+      if (arm.tripleQuotedBody) bodies.push(arm.body);
+    }
+  }
+}
+
+function walkSteps(steps: WorkflowStepDef[], bodies: string[]): void {
+  for (const s of steps) {
+    if (s.type === "const" || s.type === "return") {
+      collectTripleQuotedArmBodies(s.value, bodies);
+    } else if (s.type === "send") {
+      collectTripleQuotedArmBodies(s.value, bodies);
+    } else if (s.type === "exec") {
+      collectTripleQuotedArmBodies(s.body, bodies);
+      if (s.catch) walkSteps("single" in s.catch ? [s.catch.single] : s.catch.block, bodies);
+      if (s.recover) walkSteps("single" in s.recover ? [s.recover.single] : s.recover.block, bodies);
+    } else if (s.type === "if") {
+      walkSteps(s.body, bodies);
+    } else if (s.type === "for_lines") {
+      walkSteps(s.body, bodies);
+    }
+  }
+}
+
+test("AC2: canonicalizeTripleQuotedString matches pre-move tripleQuotedRawForRuntime bit-for-bit on every fixture", () => {
+  const roots = [join(repoRoot, "test-fixtures"), join(repoRoot, "examples")];
+  const files: string[] = [];
+  for (const r of roots) {
+    try {
+      files.push(...listJhFiles(r));
+    } catch {
+      // root missing in this checkout — skip.
+    }
+  }
+  assert.ok(files.length > 0, "expected to discover .jh fixtures under test-fixtures/ and examples/");
+
+  let armCount = 0;
+  for (const file of files) {
+    const source = readFileSync(file, "utf8");
+    let ast;
+    try {
+      ast = parsejaiph(source, file);
+    } catch {
+      // Fixtures that intentionally fail to parse (e.g. parse-error corpus) are out of scope.
+      continue;
+    }
+    const bodies: string[] = [];
+    for (const w of ast.workflows) walkSteps(w.steps, bodies);
+    for (const r of ast.rules) walkSteps(r.steps, bodies);
+    for (const body of bodies) {
+      armCount += 1;
+      assert.equal(
+        canonicalizeTripleQuotedString(body),
+        legacyTripleQuotedRawForRuntime(body),
+        `${file}: canonical form drifted from pre-move tripleQuotedRawForRuntime`,
+      );
+    }
+  }
+  assert.ok(
+    armCount > 0,
+    "expected at least one triple-quoted match-arm body across the fixture corpus",
+  );
+});
diff --git a/src/parse/const-rhs.ts b/src/parse/const-rhs.ts
index 4d528718..19e7300e 100644
--- a/src/parse/const-rhs.ts
+++ b/src/parse/const-rhs.ts
@@ -1,6 +1,7 @@
-import type { ConstRhs, RuleRefDef, WorkflowRefDef } from "../types";
+import type { Expr, RuleRefDef, WorkflowRefDef } from "../types";
+import { createTrivia, type Trivia } from "./trivia";
 import { fail, parseCallRef, rejectTrailingContent } from "./core";
-import { parseTripleQuoteBlock, tripleQuoteBodyToRaw } from "./triple-quote";
+import { dedentTripleQuotedBody, parseTripleQuoteBlock, tripleQuoteBodyToRaw } from "./triple-quote";
 import { parseAnonymousInlineScript } from "./inline-script";
 import { parsePromptStep } from "./prompt";
 import { parseMatchExpr } from "./match";
@@ -48,6 +49,7 @@ export function validateConstBashExpr(filePath: string, expr: string, lineNo: nu
 
 /**
  * Parse RHS after `const name = ` (trimmed). `forRule` disallows prompt capture.
+ * Returns an `Expr` node — the typed value-form that replaces the legacy `ConstRhs` union.
  */
 export function parseConstRhs(
   filePath: string,
@@ -58,7 +60,8 @@ export function parseConstRhs(
   col: number,
   forRule: boolean,
   constName: string,
-): { value: ConstRhs; nextLineIdx: number } {
+  trivia: Trivia = createTrivia(),
+): { value: Expr; nextLineIdx: number } {
   const head = rhs.trimStart();
   if (head.startsWith("prompt ")) {
     if (forRule) {
@@ -67,22 +70,24 @@ export function parseConstRhs(
     const innerRaw = lines[lineIdx];
     const promptCol = innerRaw.indexOf("prompt") + 1;
     const promptArg = rhs.slice(rhs.indexOf("prompt") + "prompt".length).trimStart();
-    const result = parsePromptStep(filePath, lines, lineIdx, promptArg, promptCol, constName);
+    const result = parsePromptStep(filePath, lines, lineIdx, promptArg, promptCol, constName, trivia);
     const st = result.step;
-    if (st.type !== "prompt" || st.captureName !== constName) {
+    if (st.type !== "exec" || st.body.kind !== "prompt" || st.captureName !== constName) {
       fail(filePath, "const ... = prompt internal parse error", lineNo, col);
     }
-    return {
-      value: {
-        kind: "prompt_capture",
-        raw: st.raw,
-        loc: st.loc,
-        returns: st.returns,
-        ...(st.bodyKind ? { bodyKind: st.bodyKind } : {}),
-        ...(st.bodyIdentifier ? { bodyIdentifier: st.bodyIdentifier } : {}),
-      },
-      nextLineIdx: result.nextLineIdx,
-    };
+    const promptBody = st.body;
+    if (promptBody.kind !== "prompt") {
+      fail(filePath, "const ... = prompt internal parse error", lineNo, col);
+    }
+    const promptTrivia = trivia.getNode(st);
+    if (promptTrivia) {
+      trivia.setNode(promptBody, {
+        ...(promptTrivia.bodyKind ? { bodyKind: promptTrivia.bodyKind } : {}),
+        ...(promptTrivia.bodyIdentifier ? { bodyIdentifier: promptTrivia.bodyIdentifier } : {}),
+        ...(promptTrivia.rawBody !== undefined ? { rawBody: promptTrivia.rawBody } : {}),
+      });
+    }
+    return { value: promptBody, nextLineIdx: result.nextLineIdx };
   }
   if (head.startsWith("run ")) {
     const rest = head.slice("run ".length).trim();
@@ -97,13 +102,9 @@ export function parseConstRhs(
         fail(filePath, "const ... = run async must target a valid reference", lineNo, col);
       }
       rejectTrailingContent(filePath, lineNo, "run async", call.rest);
-      const ref: WorkflowRefDef = { value: call.ref, loc: { line: lineNo, col } };
+      const callee: WorkflowRefDef = { value: call.ref, loc: { line: lineNo, col } };
       return {
-        value: {
-          kind: "run_capture", ref, args: call.args,
-          ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-          async: true,
-        },
+        value: { kind: "call", callee, args: call.args, async: true },
         nextLineIdx: lineIdx,
       };
     }
@@ -111,11 +112,10 @@ export function parseConstRhs(
       const result = parseAnonymousInlineScript(filePath, lines, lineIdx, rest, lineNo, col);
       return {
         value: {
-          kind: "run_inline_script_capture",
+          kind: "inline_script",
           body: result.body,
           ...(result.lang ? { lang: result.lang } : {}),
           args: result.args,
-          ...(result.bareIdentifierArgs ? { bareIdentifierArgs: result.bareIdentifierArgs } : {}),
         },
         nextLineIdx: result.nextLineIdx - 1,
       };
@@ -128,12 +128,9 @@ export function parseConstRhs(
       fail(filePath, "const ... = run must target a valid reference", lineNo, col);
     }
     rejectTrailingContent(filePath, lineNo, "run", call.rest);
-    const ref: WorkflowRefDef = { value: call.ref, loc: { line: lineNo, col } };
+    const callee: WorkflowRefDef = { value: call.ref, loc: { line: lineNo, col } };
     return {
-      value: {
-        kind: "run_capture", ref, args: call.args,
-        ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-      },
+      value: { kind: "call", callee, args: call.args },
       nextLineIdx: lineIdx,
     };
   }
@@ -146,12 +143,9 @@ export function parseConstRhs(
     if (call.rest.trim()) {
       fail(filePath, "const ... = ensure cannot use catch", lineNo, col);
     }
-    const ref: RuleRefDef = { value: call.ref, loc: { line: lineNo, col } };
+    const callee: RuleRefDef = { value: call.ref, loc: { line: lineNo, col } };
     return {
-      value: {
-        kind: "ensure_capture", ref, args: call.args,
-        ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-      },
+      value: { kind: "ensure_call", callee, args: call.args },
       nextLineIdx: lineIdx,
     };
   }
@@ -160,7 +154,7 @@ export function parseConstRhs(
   if (constMatchHead) {
     const subject = constMatchHead[1].trim();
     const { expr, nextIndex } = parseMatchExpr(filePath, lines, lineIdx, subject, { line: lineNo, col });
-    return { value: { kind: "match_expr", match: expr }, nextLineIdx: nextIndex - 1 };
+    return { value: { kind: "match", match: expr }, nextLineIdx: nextIndex - 1 };
   }
   // const name = """..."""
   if (head.startsWith('"""')) {
@@ -168,7 +162,9 @@ export function parseConstRhs(
     tqLines[lineIdx] = head;
     const { body, nextIdx, afterClose } = parseTripleQuoteBlock(filePath, tqLines, lineIdx);
     if (afterClose) fail(filePath, 'unexpected content after closing """', nextIdx);
-    return { value: { kind: "expr", bashRhs: tripleQuoteBodyToRaw(body), tripleQuoted: true }, nextLineIdx: nextIdx - 1 };
+    const value: Expr = { kind: "literal", raw: tripleQuoteBodyToRaw(dedentTripleQuotedBody(body)) };
+    trivia.setNode(value, { tripleQuoted: true, rawBody: body });
+    return { value, nextLineIdx: nextIdx - 1 };
   }
   const callLike = head.includes("(") ? parseCallRef(head.trimEnd()) : null;
   if (callLike) {
@@ -182,10 +178,10 @@ export function parseConstRhs(
   validateConstBashExpr(filePath, head, lineNo, col);
   const isBareDotted = isBareDottedIdentifierReturn(head);
   const isBare = !isBareDotted && isBareIdentifierReturn(head);
-  const bashRhs = isBareDotted
+  const raw = isBareDotted
     ? dottedReturnToQuotedString(head)
     : isBare
       ? bareIdentifierToQuotedString(head)
       : head;
-  return { value: { kind: "expr", bashRhs }, nextLineIdx: lineIdx };
+  return { value: { kind: "literal", raw }, nextLineIdx: lineIdx };
 }
diff --git a/src/parse/core.ts b/src/parse/core.ts
index 0cac7c10..54c6ba71 100644
--- a/src/parse/core.ts
+++ b/src/parse/core.ts
@@ -1,4 +1,5 @@
 import { jaiphError } from "../errors";
+import type { Arg } from "../types";
 
 export function fail(filePath: string, message: string, lineNo: number, col = 1): never {
   throw jaiphError(filePath, lineNo, col, "E_PARSE", message);
@@ -162,13 +163,17 @@ export function parseParamList(filePath: string, content: string, lineNo: number
 }
 
 /**
- * Convert comma-separated call arguments to space-separated form for runtime.
- * Respects quoted strings so commas inside quotes are preserved.
- * Bare identifiers (valid names, not keywords) are converted to ${name} form.
+ * Split a comma-separated call argument list into typed `Arg[]`.
+ *
+ * Each top-level comma-separated segment is classified:
+ * - bare identifier (and not a Jaiph keyword): `{ kind: "var", name }`
+ * - anything else (quoted string, ${…}, nested `run …` / `ensure …` call, inline-script
+ *   form, etc.): `{ kind: "literal", raw }`, stored as authored.
+ *
+ * Commas inside quoted strings are preserved (the scanner tracks quote state).
  */
-function commaArgsToSpaced(content: string): { spaced: string; bareIdentifiers: string[] } {
-  const parts: string[] = [];
-  const bareIdentifiers: string[] = [];
+export function commaArgsToArgList(content: string): Arg[] {
+  const out: Arg[] = [];
   let current = "";
   let inQuote: string | null = null;
   for (let j = 0; j < content.length; j++) {
@@ -177,39 +182,41 @@ function commaArgsToSpaced(content: string): { spaced: string; bareIdentifiers:
       current += ch;
       if (ch === inQuote && content[j - 1] !== "\\") inQuote = null;
     } else if (ch === ",") {
-      const trimmed = current.trim();
-      if (trimmed) {
-        if (isBareIdentifier(trimmed)) {
-          bareIdentifiers.push(trimmed);
-          parts.push(`\${${trimmed}}`);
-        } else {
-          parts.push(trimmed);
-        }
-      }
+      pushArg(out, current);
       current = "";
     } else {
       if (ch === '"' || ch === "'") inQuote = ch;
       current += ch;
     }
   }
-  const trimmed = current.trim();
-  if (trimmed) {
-    if (isBareIdentifier(trimmed)) {
-      bareIdentifiers.push(trimmed);
-      parts.push(`\${${trimmed}}`);
-    } else {
-      parts.push(trimmed);
-    }
-  }
-  return { spaced: parts.filter((p) => p).join(" "), bareIdentifiers };
+  pushArg(out, current);
+  return out;
+}
+
+function pushArg(out: Arg[], segment: string): void {
+  const trimmed = segment.trim();
+  if (!trimmed) return;
+  out.push(isBareIdentifier(trimmed) ? { kind: "var", name: trimmed } : { kind: "literal", raw: trimmed });
+}
+
+/**
+ * Convert `Arg[]` back to the space-separated string the runtime consumes:
+ * - `var` → `${name}` (so runtime interpolation expands it against in-scope vars)
+ * - `literal` → raw as authored
+ *
+ * Empty / undefined → empty string.
+ */
+export function argsToRuntimeString(args: Arg[] | undefined): string {
+  if (!args || args.length === 0) return "";
+  return args.map((a) => (a.kind === "var" ? `\${${a.name}}` : a.raw)).join(" ");
 }
 
 /**
  * Parse a call expression `ref(args)` or `ref()` from a string.
- * Returns the ref, optional args (space-separated), bare identifier names, and the rest of the string after `)`.
+ * Returns the ref, optional typed `Arg[]`, and the rest of the string after `)`.
  * Returns null if the string doesn't start with a valid call expression.
  */
-export function parseCallRef(s: string): { ref: string; args?: string; bareIdentifierArgs?: string[]; rest: string } | null {
+export function parseCallRef(s: string): { ref: string; args?: Arg[]; rest: string } | null {
   const t = s.trimStart();
   // Parenthesized form: ref(args) or ref()
   const refMatch = t.match(/^([A-Za-z_][A-Za-z0-9_]*(?:\.[A-Za-z_][A-Za-z0-9_]*)?)\(/);
@@ -234,13 +241,8 @@ export function parseCallRef(s: string): { ref: string; args?: string; bareIdent
     const argsContent = t.slice(parenStart, i - 1).trim();
     const rest = t.slice(i);
     if (!argsContent) return { ref, rest };
-    const { spaced, bareIdentifiers } = commaArgsToSpaced(argsContent);
-    return {
-      ref,
-      args: spaced || undefined,
-      ...(bareIdentifiers.length > 0 ? { bareIdentifierArgs: bareIdentifiers } : {}),
-      rest,
-    };
+    const args = commaArgsToArgList(argsContent);
+    return { ref, ...(args.length > 0 ? { args } : {}), rest };
   }
   // Bare identifier form (no parens) is no longer allowed — require parentheses.
   return null;
@@ -248,14 +250,14 @@ export function parseCallRef(s: string): { ref: string; args?: string; bareIdent
 
 /**
  * Parse a parenthesized argument list `(args)` or `()` at the start of a string.
- * Returns args (space-separated), bare identifier names, and remaining text after `)`.
- * Returns null if the string doesn't start with `(`.
+ * Returns typed `Arg[]` and remaining text after `)`. Returns null if the string
+ * doesn't start with `(`.
  */
-export function parseParenArgs(s: string): { args?: string; bareIdentifierArgs?: string[]; rest: string } | null {
+export function parseParenArgs(s: string): { args?: Arg[]; rest: string } | null {
   if (!s.trimStart().startsWith("(")) return null;
   const result = parseCallRef(`__anon${s.trimStart()}`);
   if (!result) return null;
-  return { args: result.args, bareIdentifierArgs: result.bareIdentifierArgs, rest: result.rest };
+  return { args: result.args, rest: result.rest };
 }
 
 /**
diff --git a/src/parse/env.ts b/src/parse/env.ts
index f31bebea..da6d0c23 100644
--- a/src/parse/env.ts
+++ b/src/parse/env.ts
@@ -28,7 +28,7 @@ export function parseEnvDecl(
       fail(filePath, 'unexpected content after closing """ in const declaration', nextIdx);
     }
     return {
-      envDecl: { name, value: body, loc: { line: lineNo, col: 1 } },
+      envDecl: { name, value: body, loc: { line: lineNo, col: 1 }, wasQuoted: true },
       nextIndex: nextIdx,
     };
   }
@@ -48,7 +48,7 @@ export function parseEnvDecl(
     }
     const value = valuePart.slice(1, closeIdx);
     return {
-      envDecl: { name, value, loc: { line: lineNo, col: 1 } },
+      envDecl: { name, value, loc: { line: lineNo, col: 1 }, wasQuoted: true },
       nextIndex: startIndex + 1,
     };
   }
diff --git a/src/parse/inline-script.ts b/src/parse/inline-script.ts
index c7aeebd0..5e9ed0c4 100644
--- a/src/parse/inline-script.ts
+++ b/src/parse/inline-script.ts
@@ -1,13 +1,18 @@
 import { fail, parseParenArgs, parseSingleBacktickBody } from "./core";
 import { parseFencedBlock } from "./fence";
 import { validateScriptBodyNoInterpolation } from "./scripts";
+import type { Arg } from "../types";
 
 export interface InlineScriptParsed {
   body: string;
   lang?: string;
-  args?: string;
-  bareIdentifierArgs?: string[];
+  args?: Arg[];
+  /** Next line to resume parsing at — the line just after the inline script. */
   nextLineIdx: number;
+  /** Source line index containing the closing `)`. */
+  closingLineIdx: number;
+  /** Trailing text after the closing `)` on the closing line (verbatim). */
+  trailing: string;
 }
 
 /**
@@ -17,6 +22,10 @@ export interface InlineScriptParsed {
  * Two forms:
  *   1. Single backtick: run `body`(args)
  *   2. Fenced block:    run ```lang\n...\n```(args)
+ *
+ * When `allowTrailing` is true the caller is responsible for handling any
+ * non-empty `trailing` text (e.g. `catch (...) { ... }`). When false (default)
+ * non-empty trailing content is rejected with the existing parse error.
  */
 export function parseAnonymousInlineScript(
   filePath: string,
@@ -25,6 +34,7 @@ export function parseAnonymousInlineScript(
   afterRun: string,
   lineNo: number,
   col: number,
+  allowTrailing = false,
 ): InlineScriptParsed {
   const t = afterRun.trimStart();
 
@@ -42,7 +52,7 @@ export function parseAnonymousInlineScript(
         col,
       );
     }
-    if (argsResult.rest.trim()) {
+    if (!allowTrailing && argsResult.rest.trim()) {
       fail(
         filePath,
         `unexpected content after anonymous inline script: '${argsResult.rest.trim()}'`,
@@ -62,8 +72,9 @@ export function parseAnonymousInlineScript(
       body,
       ...(lang ? { lang } : {}),
       args: argsResult.args,
-      ...(argsResult.bareIdentifierArgs ? { bareIdentifierArgs: argsResult.bareIdentifierArgs } : {}),
       nextLineIdx: nextIdx,
+      closingLineIdx: nextIdx - 1,
+      trailing: argsResult.rest,
     };
   }
 
@@ -79,7 +90,7 @@ export function parseAnonymousInlineScript(
         col,
       );
     }
-    if (argsResult.rest.trim()) {
+    if (!allowTrailing && argsResult.rest.trim()) {
       fail(
         filePath,
         `unexpected content after anonymous inline script: '${argsResult.rest.trim()}'`,
@@ -93,8 +104,9 @@ export function parseAnonymousInlineScript(
     return {
       body,
       args: argsResult.args,
-      ...(argsResult.bareIdentifierArgs ? { bareIdentifierArgs: argsResult.bareIdentifierArgs } : {}),
       nextLineIdx: lineIdx + 1,
+      closingLineIdx: lineIdx,
+      trailing: argsResult.rest,
     };
   }
 
diff --git a/src/parse/match.ts b/src/parse/match.ts
index 95f38bd3..ee6a0ea4 100644
--- a/src/parse/match.ts
+++ b/src/parse/match.ts
@@ -4,15 +4,18 @@ import { splitStatementsOnSemicolons } from "./statement-split";
 import { tripleQuoteBodyToRaw, trimAdjacentBlankLines } from "./triple-quote";
 
 const IDENT_RE = /^[A-Za-z_][A-Za-z0-9_]*$/;
+const DOT_IDENT_RE = /^[A-Za-z_][A-Za-z0-9_]*\.[A-Za-z_][A-Za-z0-9_]*$/;
 
 /**
- * Validate that a match subject is a bare identifier (no `$` or `${}`).
+ * Validate that a match subject is a bare identifier or `IDENT.IDENT`
+ * (typed prompt capture field). Dot-field resolution and schema enforcement
+ * happen in the validator, mirroring `${var.field}` interpolation.
  */
 export function validateMatchSubject(filePath: string, subject: string, lineNo: number): void {
   if (subject.startsWith("${") || subject.startsWith("$")) {
     fail(filePath, `match subject should be a bare identifier: match varName { ... }`, lineNo);
   }
-  if (!IDENT_RE.test(subject)) {
+  if (!IDENT_RE.test(subject) && !DOT_IDENT_RE.test(subject)) {
     fail(filePath, `match subject must be a valid identifier, got: ${subject}`, lineNo);
   }
 }
diff --git a/src/parse/metadata.ts b/src/parse/metadata.ts
index 240a230e..0c913ba6 100644
--- a/src/parse/metadata.ts
+++ b/src/parse/metadata.ts
@@ -1,4 +1,5 @@
-import type { ConfigBodyPart, WorkflowMetadata } from "../types";
+import type { WorkflowMetadata } from "../types";
+import type { Trivia, ConfigBodyPart } from "./trivia";
 import { colFromRaw, fail } from "./core";
 
 const ALLOWED_KEYS = new Set([
@@ -176,6 +177,7 @@ export function parseConfigBlock(
   filePath: string,
   lines: string[],
   startIndex: number,
+  trivia?: Trivia,
 ): { metadata: WorkflowMetadata; nextIndex: number } {
   const openLineNo = startIndex + 1;
   const rawOpen = lines[startIndex];
@@ -202,8 +204,8 @@ export function parseConfigBlock(
       continue;
     }
     if (line === "}") {
-      if (bodySequence.length > 0) {
-        out.configBodySequence = bodySequence;
+      if (bodySequence.length > 0 && trivia) {
+        trivia.setNode(out, { configBodySequence: bodySequence });
       }
       idx += 1;
       return { metadata: out, nextIndex: idx };
diff --git a/src/parse/parse-attached-block.test.ts b/src/parse/parse-attached-block.test.ts
new file mode 100644
index 00000000..8ec18569
--- /dev/null
+++ b/src/parse/parse-attached-block.test.ts
@@ -0,0 +1,193 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readFileSync } from "node:fs";
+import { join } from "node:path";
+import { parsejaiph } from "../parser";
+import type { WorkflowStepDef } from "../types";
+
+const stepsTsPath = join(process.cwd(), "src/parse/steps.ts");
+const stepsTsSource = readFileSync(stepsTsPath, "utf8");
+
+// === AC1: src/parse/steps.ts size + grep budget ===
+
+test("AC1: src/parse/steps.ts is at most 200 lines", () => {
+  const lineCount = stepsTsSource.split("\n").length;
+  assert.ok(
+    lineCount <= 200,
+    `expected src/parse/steps.ts to be <=200 lines (was 757 before Refactor 2); got ${lineCount}`,
+  );
+});
+
+test("AC1: src/parse/steps.ts has no parse(Run)?(Catch|Recover|EnsureStep) function", () => {
+  const re = /\bfunction\s+(parse(?:Run)?(?:Catch|Recover|EnsureStep))\b/;
+  const m = stepsTsSource.match(re);
+  assert.equal(
+    m,
+    null,
+    `legacy catch/recover host-parser function reappeared in src/parse/steps.ts: ${m && m[1]}`,
+  );
+});
+
+// === AC2: parseBlockStatement is THE entry point for any catch/recover body ===
+//
+// Before Refactor 2, `parseCatchStatement` was a stripped-down copy of
+// `parseBlockStatement` that recognised only a fixed subset of statement
+// forms. A `for … in …` head, for example, was treated as a shell command.
+// After Refactor 2 the same `parseBlockStatement` parses bodies everywhere,
+// so introducing a new statement form (here: using `for` as the probe — it
+// has always been a parseBlockStatement-only form historically) is accepted
+// identically at top level, inside `catch (e) { … }`, and inside
+// `recover(e) { … }` without any change to the catch/recover code path.
+
+function pickFor(steps: WorkflowStepDef[]): WorkflowStepDef | undefined {
+  return steps.find((s) => s.type === "for_lines");
+}
+
+const FOR_BODY = [
+  '    for line in items {',
+  '      log "$line"',
+  '    }',
+];
+
+test("AC2: top-level for-loop is parsed as `for_lines`", () => {
+  const src = [
+    "workflow w(items) {",
+    ...FOR_BODY,
+    "}",
+    "",
+  ].join("\n");
+  const mod = parsejaiph(src, "ac2-top.jh");
+  const w = mod.workflows.find((x) => x.name === "w")!;
+  const forStep = pickFor(w.steps);
+  assert.ok(forStep, "expected for_lines step at top level");
+});
+
+test("AC2: same for-loop inside catch body parses identically", () => {
+  const src = [
+    "rule check() {",
+    '  return "ok"',
+    "}",
+    "workflow w(items) {",
+    "  ensure check() catch (e) {",
+    ...FOR_BODY,
+    "  }",
+    "}",
+    "",
+  ].join("\n");
+  const mod = parsejaiph(src, "ac2-catch.jh");
+  const w = mod.workflows.find((x) => x.name === "w")!;
+  const ensureStep = w.steps[0];
+  assert.equal(ensureStep.type, "exec");
+  if (ensureStep.type !== "exec") return;
+  assert.ok(ensureStep.catch && "block" in ensureStep.catch);
+  if (!(ensureStep.catch && "block" in ensureStep.catch)) return;
+  const forStep = pickFor(ensureStep.catch.block);
+  assert.ok(forStep, "expected for_lines step inside catch body");
+});
+
+test("AC2: same for-loop inside recover body parses identically", () => {
+  const src = [
+    "workflow target() {",
+    '  log "target"',
+    "}",
+    "workflow w(items) {",
+    "  run target() recover(e) {",
+    ...FOR_BODY,
+    "  }",
+    "}",
+    "",
+  ].join("\n");
+  const mod = parsejaiph(src, "ac2-recover.jh");
+  const w = mod.workflows.find((x) => x.name === "w")!;
+  const runStep = w.steps[0];
+  assert.equal(runStep.type, "exec");
+  if (runStep.type !== "exec") return;
+  assert.ok(runStep.recover && "block" in runStep.recover);
+  if (!(runStep.recover && "block" in runStep.recover)) return;
+  const forStep = pickFor(runStep.recover.block);
+  assert.ok(forStep, "expected for_lines step inside recover body");
+});
+
+// === AC3: parse error messages and locations preserved bit-for-bit ===
+//
+// These cover every error message and location the legacy three-function
+// catch/recover path produced. They are exhaustively asserted as snapshots.
+
+type ErrSnap = { name: string; src: string; expected: string };
+
+const ERR_SNAPSHOTS: ErrSnap[] = [
+  // Bindings paren missing
+  {
+    name: "ensure catch: missing bindings paren (EOL)",
+    src: "workflow w() {\n  ensure r() catch\n}\n",
+    expected: 'fixture.jh:2:14 E_PARSE catch requires explicit bindings and a body: catch (<name>) { ... }',
+  },
+  {
+    name: "ensure catch: bindings open after `{`",
+    src: "workflow w() {\n  ensure r() catch {\n}\n",
+    expected: 'fixture.jh:2:14 E_PARSE catch requires explicit bindings: catch (<name>) { ... }',
+  },
+  {
+    name: "run catch: missing bindings paren (EOL)",
+    src: "workflow w() {\n  run r() catch\n}\n",
+    expected: 'fixture.jh:2:11 E_PARSE catch requires explicit bindings and a body: catch (<name>) { ... }',
+  },
+  {
+    name: "run recover: missing bindings paren (EOL)",
+    src: "workflow w() {\n  run r() recover\n}\n",
+    expected: 'fixture.jh:2:11 E_PARSE recover requires explicit bindings and a body: recover(<name>) { ... }',
+  },
+  {
+    name: "run recover: bindings open after `{`",
+    src: "workflow w() {\n  run r() recover {\n}\n",
+    expected: 'fixture.jh:2:11 E_PARSE recover requires explicit bindings: recover(<name>) { ... }',
+  },
+
+  // Too many bindings
+  {
+    name: "ensure catch: two bindings rejected",
+    src: 'workflow w() {\n  ensure r() catch (a, b) { log "x" }\n}\n',
+    expected: 'fixture.jh:2:14 E_PARSE catch accepts exactly one binding: catch (<name>) — the second binding (attempt) has been removed',
+  },
+  {
+    name: "run recover: two bindings rejected",
+    src: 'workflow w() {\n  run r() recover(a, b) { log "x" }\n}\n',
+    expected: 'fixture.jh:2:11 E_PARSE recover accepts exactly one binding: recover(<name>)',
+  },
+
+  // Empty body
+  {
+    name: "ensure catch: empty inline block rejected",
+    src: "workflow w() {\n  ensure r() catch (e) { }\n}\n",
+    expected: 'fixture.jh:2:14 E_PARSE catch block must contain at least one statement',
+  },
+  {
+    name: "ensure catch: empty multiline block rejected",
+    src: "workflow w() {\n  ensure r() catch (e) {\n  }\n}\n",
+    expected: 'fixture.jh:2:14 E_PARSE catch block must contain at least one statement',
+  },
+  {
+    name: "run recover: empty inline block rejected",
+    src: "workflow w() {\n  run r() recover(e) { }\n}\n",
+    expected: 'fixture.jh:2:11 E_PARSE recover block must contain at least one statement',
+  },
+
+  // Unterminated multiline block
+  {
+    name: "ensure catch: unterminated multiline block",
+    src: 'workflow w() {\n  ensure r() catch (e) {\n    log "x"\n',
+    expected: 'fixture.jh:2:14 E_PARSE unterminated catch block, expected "}"',
+  },
+];
+
+for (const s of ERR_SNAPSHOTS) {
+  test(`AC3 snapshot: ${s.name}`, () => {
+    let actual = "<no error thrown>";
+    try {
+      parsejaiph(s.src, "fixture.jh");
+    } catch (e) {
+      actual = (e as Error).message;
+    }
+    assert.equal(actual, s.expected);
+  });
+}
diff --git a/src/parse/parse-bare-call.test.ts b/src/parse/parse-bare-call.test.ts
index ffe4ca6c..3209e485 100644
--- a/src/parse/parse-bare-call.test.ts
+++ b/src/parse/parse-bare-call.test.ts
@@ -24,10 +24,13 @@ test("run with args and parens still works", () => {
     "test.jh",
   );
   const step = mod.workflows[0].steps[0];
-  assert.equal(step.type, "run");
-  if (step.type === "run") {
-    assert.equal(step.workflow.value, "deploy");
-    assert.equal(step.args, '"prod" "v1"');
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "call") {
+    assert.equal(step.body.callee.value, "deploy");
+    assert.deepEqual(step.body.args, [
+      { kind: "literal", raw: '"prod"' },
+      { kind: "literal", raw: '"v1"' },
+    ]);
   }
 });
 
@@ -83,32 +86,38 @@ test("const x = ensure bare identifier is rejected — parentheses required", ()
 
 // === return run/ensure bare identifier (no parens) now falls through ===
 
-test("return run bare identifier does not parse as managed return", () => {
+test("return run bare identifier falls through to exec/shell", () => {
   // Without parens, "return run helper" is not recognized as a managed return
-  // and falls through to a shell step
+  // and falls through to a shell exec step
   const mod = parsejaiph(
     `workflow default() {\n  return run helper\n}`,
     "test.jh",
   );
   const step = mod.workflows[0].steps[0];
-  assert.equal(step.type, "shell");
+  assert.equal(step.type, "exec");
+  if (step.type === "exec") {
+    assert.equal(step.body.kind, "shell");
+  }
 });
 
-test("return ensure bare identifier does not parse as managed return", () => {
+test("return ensure bare identifier falls through to exec/shell", () => {
   // Without parens, "return ensure check" is not recognized as a managed return
-  // and falls through to a shell step
+  // and falls through to a shell exec step
   const mod = parsejaiph(
     `rule check() {\n  return "ok"\n}\nworkflow default() {\n  return ensure check\n}`,
     "test.jh",
   );
   const step = mod.workflows[0].steps[0];
-  assert.equal(step.type, "shell");
+  assert.equal(step.type, "exec");
+  if (step.type === "exec") {
+    assert.equal(step.body.kind, "shell");
+  }
 });
 
 // === send RHS with bare identifier (no parens) ===
 
-test("channel <- run bare identifier does not parse as send with run RHS", () => {
-  // Without parens, the send RHS falls through to shell kind
+test("channel <- run bare identifier does not parse as send with call value", () => {
+  // Without parens, the send RHS falls through to Expr.shell
   const mod = parsejaiph(
     [
       "channel alerts",
@@ -122,8 +131,7 @@ test("channel <- run bare identifier does not parse as send with run RHS", () =>
   assert.equal(step.type, "send");
   if (step.type === "send") {
     assert.equal(step.channel, "alerts");
-    // Without parens, parseCallRef returns null, so it falls through to shell kind
-    assert.equal(step.rhs.kind, "shell");
+    assert.equal(step.value.kind, "shell");
   }
 });
 
diff --git a/src/parse/parse-const-rhs.test.ts b/src/parse/parse-const-rhs.test.ts
index 333f42ab..2e66723b 100644
--- a/src/parse/parse-const-rhs.test.ts
+++ b/src/parse/parse-const-rhs.test.ts
@@ -91,45 +91,45 @@ test("validateConstBashExpr: rejects ${var:?message} fallback", () => {
 
 // === parseConstRhs ===
 
-test("parseConstRhs: parses bash expression", () => {
+test("parseConstRhs: parses literal expression", () => {
   const result = parseConstRhs("test.jh", ['const x = "hello"'], 0, '"hello"', 1, 1, false, "x");
-  assert.equal(result.value.kind, "expr");
-  if (result.value.kind === "expr") {
-    assert.equal(result.value.bashRhs, '"hello"');
+  assert.equal(result.value.kind, "literal");
+  if (result.value.kind === "literal") {
+    assert.equal(result.value.raw, '"hello"');
   }
   assert.equal(result.nextLineIdx, 0);
 });
 
-test("parseConstRhs: bare identifier is sugar for interpolated string", () => {
+test("parseConstRhs: bare identifier is sugar for interpolated literal", () => {
   const result = parseConstRhs("test.jh", ["const x = response"], 0, "response", 1, 1, false, "x");
-  assert.equal(result.value.kind, "expr");
-  if (result.value.kind === "expr") {
-    assert.equal(result.value.bashRhs, '"${response}"');
+  assert.equal(result.value.kind, "literal");
+  if (result.value.kind === "literal") {
+    assert.equal(result.value.raw, '"${response}"');
   }
 });
 
-test("parseConstRhs: bare dotted identifier is sugar for interpolated string", () => {
+test("parseConstRhs: bare dotted identifier is sugar for interpolated literal", () => {
   const result = parseConstRhs("test.jh", ["const x = response.message"], 0, "response.message", 1, 1, false, "x");
-  assert.equal(result.value.kind, "expr");
-  if (result.value.kind === "expr") {
-    assert.equal(result.value.bashRhs, '"${response.message}"');
+  assert.equal(result.value.kind, "literal");
+  if (result.value.kind === "literal") {
+    assert.equal(result.value.raw, '"${response.message}"');
   }
 });
 
-test("parseConstRhs: parses run capture", () => {
+test("parseConstRhs: parses run capture as Expr.call", () => {
   const result = parseConstRhs("test.jh", ["const x = run my_script()"], 0, "run my_script()", 1, 1, false, "x");
-  assert.equal(result.value.kind, "run_capture");
-  if (result.value.kind === "run_capture") {
-    assert.equal(result.value.ref.value, "my_script");
+  assert.equal(result.value.kind, "call");
+  if (result.value.kind === "call") {
+    assert.equal(result.value.callee.value, "my_script");
   }
 });
 
-test("parseConstRhs: parses run capture with args", () => {
+test("parseConstRhs: parses run capture with args as Expr.call", () => {
   const result = parseConstRhs("test.jh", ['const x = run my_script("arg")'], 0, 'run my_script("arg")', 1, 1, false, "x");
-  assert.equal(result.value.kind, "run_capture");
-  if (result.value.kind === "run_capture") {
-    assert.equal(result.value.ref.value, "my_script");
-    assert.equal(result.value.args, '"arg"');
+  assert.equal(result.value.kind, "call");
+  if (result.value.kind === "call") {
+    assert.equal(result.value.callee.value, "my_script");
+    assert.deepEqual(result.value.args, [{ kind: "literal", raw: '"arg"' }]);
   }
 });
 
@@ -140,11 +140,11 @@ test("parseConstRhs: run without parens rejects (parens required)", () => {
   );
 });
 
-test("parseConstRhs: parses ensure capture", () => {
+test("parseConstRhs: parses ensure capture as Expr.ensure_call", () => {
   const result = parseConstRhs("test.jh", ["const x = ensure my_rule()"], 0, "ensure my_rule()", 1, 1, false, "x");
-  assert.equal(result.value.kind, "ensure_capture");
-  if (result.value.kind === "ensure_capture") {
-    assert.equal(result.value.ref.value, "my_rule");
+  assert.equal(result.value.kind, "ensure_call");
+  if (result.value.kind === "ensure_call") {
+    assert.equal(result.value.callee.value, "my_rule");
   }
 });
 
@@ -176,11 +176,11 @@ test("parseConstRhs: bare call without run suggests fix", () => {
   );
 });
 
-test("parseConstRhs: parses prompt capture in workflow", () => {
+test("parseConstRhs: parses prompt capture as Expr.prompt", () => {
   const lines = ['  const x = prompt "What is your name?"'];
   const result = parseConstRhs("test.jh", lines, 0, 'prompt "What is your name?"', 1, 1, false, "x");
-  assert.equal(result.value.kind, "prompt_capture");
-  if (result.value.kind === "prompt_capture") {
+  assert.equal(result.value.kind, "prompt");
+  if (result.value.kind === "prompt") {
     assert.equal(result.value.raw, '"What is your name?"');
   }
 });
diff --git a/src/parse/parse-core.test.ts b/src/parse/parse-core.test.ts
index 6a3318ee..020353c2 100644
--- a/src/parse/parse-core.test.ts
+++ b/src/parse/parse-core.test.ts
@@ -198,62 +198,61 @@ test("isBareIdentifier: rejects string with spaces", () => {
   assert.equal(isBareIdentifier("has space"), false);
 });
 
-// === parseCallRef: bare identifiers ===
+// === parseCallRef: typed Arg[] classification ===
 
-test("parseCallRef: bare identifier arg is converted to interpolation form", () => {
+test("parseCallRef: bare identifier becomes var arg", () => {
   const result = parseCallRef("foo(task)");
   assert.ok(result);
   assert.equal(result.ref, "foo");
-  assert.equal(result.args, "${task}");
-  assert.deepEqual(result.bareIdentifierArgs, ["task"]);
+  assert.deepEqual(result.args, [{ kind: "var", name: "task" }]);
 });
 
 test("parseCallRef: bare identifier mixed with quoted arg", () => {
   const result = parseCallRef('foo(task, "hello")');
   assert.ok(result);
   assert.equal(result.ref, "foo");
-  assert.equal(result.args, '${task} "hello"');
-  assert.deepEqual(result.bareIdentifierArgs, ["task"]);
+  assert.deepEqual(result.args, [
+    { kind: "var", name: "task" },
+    { kind: "literal", raw: '"hello"' },
+  ]);
 });
 
 test("parseCallRef: multiple bare identifiers", () => {
   const result = parseCallRef("foo(task, branch_name)");
   assert.ok(result);
   assert.equal(result.ref, "foo");
-  assert.equal(result.args, "${task} ${branch_name}");
-  assert.deepEqual(result.bareIdentifierArgs, ["task", "branch_name"]);
+  assert.deepEqual(result.args, [
+    { kind: "var", name: "task" },
+    { kind: "var", name: "branch_name" },
+  ]);
 });
 
-test("parseCallRef: keyword arg is not treated as bare identifier", () => {
+test("parseCallRef: keyword arg is stored as literal (not var)", () => {
   const result = parseCallRef("foo(run)");
   assert.ok(result);
   assert.equal(result.ref, "foo");
-  assert.equal(result.args, "run");
-  assert.equal(result.bareIdentifierArgs, undefined);
+  assert.deepEqual(result.args, [{ kind: "literal", raw: "run" }]);
 });
 
-test("parseCallRef: quoted string arg is not treated as bare identifier", () => {
+test("parseCallRef: quoted string arg is stored as literal", () => {
   const result = parseCallRef('foo("task")');
   assert.ok(result);
   assert.equal(result.ref, "foo");
-  assert.equal(result.args, '"task"');
-  assert.equal(result.bareIdentifierArgs, undefined);
+  assert.deepEqual(result.args, [{ kind: "literal", raw: '"task"' }]);
 });
 
-test("parseCallRef: ${var} arg is not treated as bare identifier", () => {
+test("parseCallRef: ${var} interpolation arg is stored as literal", () => {
   const result = parseCallRef("foo(${task})");
   assert.ok(result);
   assert.equal(result.ref, "foo");
-  assert.equal(result.args, "${task}");
-  assert.equal(result.bareIdentifierArgs, undefined);
+  assert.deepEqual(result.args, [{ kind: "literal", raw: "${task}" }]);
 });
 
-test("parseCallRef: no args returns no bareIdentifierArgs", () => {
+test("parseCallRef: no args returns undefined args", () => {
   const result = parseCallRef("foo()");
   assert.ok(result);
   assert.equal(result.ref, "foo");
   assert.equal(result.args, undefined);
-  assert.equal(result.bareIdentifierArgs, undefined);
 });
 
 // === parseCallRef: bare identifier (no parens) — now returns null ===
diff --git a/src/parse/parse-definitions.test.ts b/src/parse/parse-definitions.test.ts
index bc436efa..ecf0e4dc 100644
--- a/src/parse/parse-definitions.test.ts
+++ b/src/parse/parse-definitions.test.ts
@@ -205,13 +205,20 @@ test("reserved keyword as parameter name is rejected", () => {
   );
 });
 
-test("log accepts a bare identifier (stored as interpolation)", () => {
+test("log accepts a bare identifier (stored as interpolation Expr.literal)", () => {
   const mod = parsejaiph(
     ["workflow w() {", "  log msg", "}", ""].join("\n"),
     "test.jh",
   );
-  assert.equal(mod.workflows[0].steps[0].type, "log");
-  assert.equal((mod.workflows[0].steps[0] as { message: string }).message, "${msg}");
+  const step = mod.workflows[0].steps[0];
+  assert.equal(step.type, "say");
+  if (step.type === "say") {
+    assert.equal(step.level, "log");
+    assert.equal(step.message.kind, "literal");
+    if (step.message.kind === "literal") {
+      assert.equal(step.message.raw, "${msg}");
+    }
+  }
 });
 
 // === import script ===
diff --git a/src/parse/parse-error-snapshot.test.ts b/src/parse/parse-error-snapshot.test.ts
new file mode 100644
index 00000000..ffe50ae3
--- /dev/null
+++ b/src/parse/parse-error-snapshot.test.ts
@@ -0,0 +1,158 @@
+/**
+ * Snapshot test for parser errors. Walks every `=== name` block in
+ * `test-fixtures/compiler-txtar/parse-errors.txt`, parses the virtual files,
+ * and re-emits the captured error as `{ file, line, col, code, message }`.
+ *
+ * The snapshot is stored at
+ * `test-fixtures/compiler-txtar/parse-errors-snapshot.json`. Re-run with
+ * `UPDATE_SNAPSHOTS=1` only after confirming a diff is intentional — this
+ * test exists so any drift in parser error code/line/col/message surfaces
+ * immediately.
+ */
+import test from "node:test";
+import assert from "node:assert/strict";
+import {
+  existsSync,
+  mkdtempSync,
+  readFileSync,
+  rmSync,
+  writeFileSync,
+} from "node:fs";
+import { join, resolve } from "node:path";
+import { tmpdir } from "node:os";
+import { loadModuleGraph } from "../transpile/module-graph";
+
+// Tests run from `dist/src/parse/...`; walk up to repo root.
+const repoRoot = resolve(__dirname, "../../..");
+const fixturesDir = resolve(repoRoot, "test-fixtures/compiler-txtar");
+const fixtureFile = join(fixturesDir, "parse-errors.txt");
+const snapshotPath = join(fixturesDir, "parse-errors-snapshot.json");
+
+interface TxtarCase {
+  name: string;
+  files: Map<string, string>;
+}
+
+interface SnapshotEntry {
+  file: string;
+  line: number;
+  col: number;
+  code: string;
+  message: string;
+}
+
+type Snapshot = Record<string, SnapshotEntry>;
+
+function parseTxtar(content: string): TxtarCase[] {
+  const cases: TxtarCase[] = [];
+  for (const block of content.split(/^=== /m)) {
+    const trimmed = block.trim();
+    if (!trimmed) continue;
+    const lines = trimmed.split("\n");
+    const name = lines[0].trim();
+    let fileStartIdx = -1;
+    for (let i = 1; i < lines.length; i += 1) {
+      if (lines[i].startsWith("--- ")) {
+        fileStartIdx = i;
+        break;
+      }
+    }
+    if (fileStartIdx < 0) continue;
+    cases.push({ name, files: parseVirtualFiles(lines.slice(fileStartIdx)) });
+  }
+  return cases;
+}
+
+function parseVirtualFiles(lines: string[]): Map<string, string> {
+  const files = new Map<string, string>();
+  let cur: string | undefined;
+  let buf: string[] = [];
+  for (const line of lines) {
+    if (line.startsWith("--- ")) {
+      if (cur !== undefined) files.set(cur, buf.join("\n") + "\n");
+      cur = line.slice(4).trim();
+      buf = [];
+    } else {
+      buf.push(line);
+    }
+  }
+  if (cur !== undefined) files.set(cur, buf.join("\n") + "\n");
+  return files;
+}
+
+function entryFile(files: Map<string, string>): string {
+  if (files.has("main.jh")) return "main.jh";
+  if (files.has("input.jh")) return "input.jh";
+  if (files.has("input.test.jh")) return "input.test.jh";
+  const first = files.keys().next().value;
+  if (!first) throw new Error("no virtual files");
+  return first;
+}
+
+function relativizeTmp(p: string, tmpDir: string): string {
+  return p.startsWith(tmpDir) ? p.slice(tmpDir.length).replace(/^[\/]+/, "") : p;
+}
+
+function scrubTmp(msg: string, tmpDir: string): string {
+  const escaped = tmpDir.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");
+  return msg.replace(new RegExp(escaped, "g"), "<TMP>");
+}
+
+function captureSnapshot(): Snapshot {
+  const content = readFileSync(fixtureFile, "utf8");
+  const out: Snapshot = {};
+  for (const tc of parseTxtar(content)) {
+    const tmpDir = mkdtempSync(join(tmpdir(), "jaiph-parse-snap-"));
+    try {
+      for (const [name, body] of tc.files) {
+        writeFileSync(join(tmpDir, name), body, "utf8");
+      }
+      const entry = join(tmpDir, entryFile(tc.files));
+      try {
+        loadModuleGraph(entry);
+        out[tc.name] = {
+          file: "<no-error>",
+          line: 0,
+          col: 0,
+          code: "OK",
+          message: "compilation succeeded but fixture expected a parse error",
+        };
+      } catch (e) {
+        const msg = (e as Error).message ?? String(e);
+        const m = msg.match(/^(.+):(\d+):(\d+) (\S+) ([\s\S]+)$/);
+        out[tc.name] = m
+          ? {
+              file: relativizeTmp(m[1], tmpDir),
+              line: Number(m[2]),
+              col: Number(m[3]),
+              code: m[4],
+              message: scrubTmp(m[5], tmpDir),
+            }
+          : {
+              file: "<unknown>",
+              line: 0,
+              col: 0,
+              code: "E_FATAL",
+              message: scrubTmp(msg, tmpDir),
+            };
+      }
+    } finally {
+      rmSync(tmpDir, { recursive: true, force: true });
+    }
+  }
+  return out;
+}
+
+test("parse-errors.txt snapshot pins {file, line, col, code, message}", () => {
+  const current = captureSnapshot();
+  if (process.env.UPDATE_SNAPSHOTS === "1" || !existsSync(snapshotPath)) {
+    writeFileSync(snapshotPath, JSON.stringify(current, null, 2) + "\n", "utf8");
+    return;
+  }
+  const stored = JSON.parse(readFileSync(snapshotPath, "utf8")) as Snapshot;
+  assert.deepEqual(
+    current,
+    stored,
+    "parser error output drifted from snapshot. Re-run with UPDATE_SNAPSHOTS=1 only after confirming the change is intentional.",
+  );
+});
diff --git a/src/parse/parse-inline-script.test.ts b/src/parse/parse-inline-script.test.ts
index 8fae049f..474eba75 100644
--- a/src/parse/parse-inline-script.test.ts
+++ b/src/parse/parse-inline-script.test.ts
@@ -11,11 +11,11 @@ workflow default() {
   const ast = parsejaiph(src, "test.jh");
   assert.equal(ast.workflows.length, 1);
   const step = ast.workflows[0].steps[0];
-  assert.equal(step.type, "run_inline_script");
-  if (step.type === "run_inline_script") {
-    assert.equal(step.body, "echo hello");
-    assert.equal(step.lang, undefined);
-    assert.equal(step.args, undefined);
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "inline_script") {
+    assert.equal(step.body.body, "echo hello");
+    assert.equal(step.body.lang, undefined);
+    assert.equal(step.body.args, undefined);
     assert.equal(step.captureName, undefined);
   }
 });
@@ -28,10 +28,13 @@ workflow default() {
 `;
   const ast = parsejaiph(src, "test.jh");
   const step = ast.workflows[0].steps[0];
-  assert.equal(step.type, "run_inline_script");
-  if (step.type === "run_inline_script") {
-    assert.equal(step.body, "echo $1");
-    assert.equal(step.args, '"arg1" "arg2"');
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "inline_script") {
+    assert.equal(step.body.body, "echo $1");
+    assert.deepEqual(step.body.args, [
+      { kind: "literal", raw: '"arg1"' },
+      { kind: "literal", raw: '"arg2"' },
+    ]);
   }
 });
 
@@ -53,11 +56,8 @@ workflow default() {
   const ast = parsejaiph(src, "test.jh");
   const step = ast.workflows[0].steps[0];
   assert.equal(step.type, "const");
-  if (step.type === "const") {
-    assert.equal(step.value.kind, "run_inline_script_capture");
-    if (step.value.kind === "run_inline_script_capture") {
-      assert.equal(step.value.body, "echo hello");
-    }
+  if (step.type === "const" && step.value.kind === "inline_script") {
+    assert.equal(step.value.body, "echo hello");
   }
 });
 
@@ -71,10 +71,10 @@ test("parser: run script() with fenced block and lang tag", () => {
   ].join("\n");
   const ast = parsejaiph(src, "test.jh");
   const step = ast.workflows[0].steps[0];
-  assert.equal(step.type, "run_inline_script");
-  if (step.type === "run_inline_script") {
-    assert.equal(step.lang, "python3");
-    assert.equal(step.body, "print('hello')");
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "inline_script") {
+    assert.equal(step.body.lang, "python3");
+    assert.equal(step.body.body, "print('hello')");
   }
 });
 
@@ -104,11 +104,10 @@ test("parser: rule body supports multiline fenced run ```", () => {
   const ast = parsejaiph(src, "test.jh");
   assert.equal(ast.rules.length, 1);
   const step = ast.rules[0].steps[0];
-  assert.equal(step.type, "run_inline_script");
-  if (step.type === "run_inline_script") {
-    assert.ok(step.body.includes('if [ -z "$1" ]'));
-    assert.equal(step.args, "${name}");
-    assert.deepEqual(step.bareIdentifierArgs, ["name"]);
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "inline_script") {
+    assert.ok(step.body.body.includes('if [ -z "$1" ]'));
+    assert.deepEqual(step.body.args, [{ kind: "var", name: "name" }]);
   }
 });
 
diff --git a/src/parse/parse-interpreter-tags.test.ts b/src/parse/parse-interpreter-tags.test.ts
index 78327093..e09829fc 100644
--- a/src/parse/parse-interpreter-tags.test.ts
+++ b/src/parse/parse-interpreter-tags.test.ts
@@ -1,50 +1,50 @@
 import test from "node:test";
 import assert from "node:assert/strict";
-import { parsejaiph } from "../parser";
+import { parsejaiph, parsejaiphWithTrivia } from "../parser";
 
 // === Accepted: fenced block with lang tag ===
 
 test("fenced block with python3 lang tag parses correctly", () => {
-  const mod = parsejaiph('script transform = ```python3\nprint("hi")\n```', "test.jh");
+  const { ast: mod, trivia } = parsejaiphWithTrivia('script transform = ```python3\nprint("hi")\n```', "test.jh");
   assert.equal(mod.scripts.length, 1);
   assert.equal(mod.scripts[0].name, "transform");
   assert.equal(mod.scripts[0].lang, "python3");
   assert.equal(mod.scripts[0].body, 'print("hi")');
-  assert.equal(mod.scripts[0].bodyKind, "fenced");
+  assert.equal(trivia.getNode(mod.scripts[0])?.scriptBodyKind, "fenced");
 });
 
 test("fenced block with node lang tag parses correctly", () => {
-  const mod = parsejaiph("script transform = ```node\nconsole.log('hi');\n```", "test.jh");
+  const { ast: mod, trivia } = parsejaiphWithTrivia("script transform = ```node\nconsole.log('hi');\n```", "test.jh");
   assert.equal(mod.scripts.length, 1);
   assert.equal(mod.scripts[0].name, "transform");
   assert.equal(mod.scripts[0].lang, "node");
   assert.equal(mod.scripts[0].body, "console.log('hi');");
-  assert.equal(mod.scripts[0].bodyKind, "fenced");
+  assert.equal(trivia.getNode(mod.scripts[0])?.scriptBodyKind, "fenced");
 });
 
 test("any arbitrary lang tag is valid (no allowlist)", () => {
-  const mod = parsejaiph("script run_deno = ```deno\nconsole.log('hi');\n```", "test.jh");
+  const { ast: mod, trivia } = parsejaiphWithTrivia("script run_deno = ```deno\nconsole.log('hi');\n```", "test.jh");
   assert.equal(mod.scripts.length, 1);
   assert.equal(mod.scripts[0].lang, "deno");
-  assert.equal(mod.scripts[0].bodyKind, "fenced");
+  assert.equal(trivia.getNode(mod.scripts[0])?.scriptBodyKind, "fenced");
 });
 
 // === Accepted: plain script without lang tag ===
 
 test("plain script without lang tag has no lang", () => {
-  const mod = parsejaiph('script setup = `echo hello`', "test.jh");
+  const { ast: mod, trivia } = parsejaiphWithTrivia('script setup = `echo hello`', "test.jh");
   assert.equal(mod.scripts[0].lang, undefined);
   assert.equal(mod.scripts[0].body, "echo hello");
-  assert.equal(mod.scripts[0].bodyKind, "backtick");
+  assert.equal(trivia.getNode(mod.scripts[0])?.scriptBodyKind, "backtick");
 });
 
 // === Accepted: manual shebang in fenced body (no lang tag) ===
 
 test("manual shebang in fenced body without lang tag works", () => {
-  const mod = parsejaiph('script analyze = ```\n#!/usr/bin/env ruby\nputs "hi"\n```', "test.jh");
+  const { ast: mod, trivia } = parsejaiphWithTrivia('script analyze = ```\n#!/usr/bin/env ruby\nputs "hi"\n```', "test.jh");
   assert.equal(mod.scripts[0].lang, undefined);
   assert.equal(mod.scripts[0].body, '#!/usr/bin/env ruby\nputs "hi"');
-  assert.equal(mod.scripts[0].bodyKind, "fenced");
+  assert.equal(trivia.getNode(mod.scripts[0])?.scriptBodyKind, "fenced");
 });
 
 // === Rejected: both fence tag and manual shebang ===
diff --git a/src/parse/parse-metadata.test.ts b/src/parse/parse-metadata.test.ts
index a83332c9..107114bb 100644
--- a/src/parse/parse-metadata.test.ts
+++ b/src/parse/parse-metadata.test.ts
@@ -2,6 +2,7 @@ import test from "node:test";
 import assert from "node:assert/strict";
 import { parseConfigBlock } from "./metadata";
 import { parsejaiph } from "../parser";
+import { createTrivia } from "./trivia";
 
 test("parseConfigBlock: parses minimal config with one key", () => {
   const lines = [
@@ -132,9 +133,10 @@ test("parseConfigBlock: skips empty lines and comments", () => {
     "",
     "}",
   ];
-  const { metadata } = parseConfigBlock("test.jh", lines, 0);
+  const trivia = createTrivia();
+  const { metadata } = parseConfigBlock("test.jh", lines, 0, trivia);
   assert.equal(metadata.agent?.command, "claude");
-  assert.deepEqual(metadata.configBodySequence, [
+  assert.deepEqual(trivia.getNode(metadata)?.configBodySequence, [
     { kind: "comment", text: "# this is a comment" },
     { kind: "assign", key: "agent.command" },
   ]);
@@ -270,7 +272,7 @@ test("workflow config: parses config inside workflow", () => {
   const mod = parsejaiph(src, "test.jh");
   assert.equal(mod.workflows[0].metadata?.agent?.backend, "claude");
   assert.equal(mod.workflows[0].steps.length, 1);
-  assert.equal(mod.workflows[0].steps[0].type, "log");
+  assert.equal(mod.workflows[0].steps[0].type, "say");
 });
 
 test("workflow config: allows comments before config", () => {
diff --git a/src/parse/parse-prompt.test.ts b/src/parse/parse-prompt.test.ts
index a546b297..6b2ce9fd 100644
--- a/src/parse/parse-prompt.test.ts
+++ b/src/parse/parse-prompt.test.ts
@@ -1,46 +1,60 @@
 import test from "node:test";
 import assert from "node:assert/strict";
 import { parsePromptStep } from "./prompt";
+import { createTrivia } from "./trivia";
+
+const trivia = createTrivia();
+
+/**
+ * `parsePromptStep` now returns an `exec` step whose `body` is an `Expr.prompt`.
+ * The bodyKind / bodyIdentifier / rawBody trivia hangs off that inner Expr.
+ */
+function unwrapPrompt(step: import("../types").WorkflowStepDef): import("../types").Expr & { kind: "prompt" } {
+  if (step.type !== "exec" || step.body.kind !== "prompt") {
+    throw new Error(`expected exec step with prompt body, got ${step.type}`);
+  }
+  return step.body;
+}
 
 // === parsePromptStep: single-line string literal ===
 
 test("parsePromptStep: parses simple single-line prompt", () => {
   const lines = ['  prompt "Hello world"'];
-  const result = parsePromptStep("test.jh", lines, 0, '"Hello world"', 3);
-  assert.equal(result.step.type, "prompt");
-  assert.equal(result.step.raw, '"Hello world"');
-  assert.equal(result.step.loc.line, 1);
-  assert.equal(result.step.loc.col, 3);
-  assert.equal(result.step.captureName, undefined);
-  assert.equal(result.step.returns, undefined);
-  if (result.step.type === "prompt") {
-    assert.equal(result.step.bodyKind, "string");
+  const result = parsePromptStep("test.jh", lines, 0, '"Hello world"', 3, undefined, trivia);
+  const body = unwrapPrompt(result.step);
+  assert.equal(body.raw, '"Hello world"');
+  assert.equal(body.loc.line, 1);
+  assert.equal(body.loc.col, 3);
+  if (result.step.type === "exec") {
+    assert.equal(result.step.captureName, undefined);
   }
+  assert.equal(body.returns, undefined);
+  assert.equal(trivia.getNode(body)?.bodyKind, "string");
 });
 
 test("parsePromptStep: parses captured prompt", () => {
   const lines = ['  answer = prompt "What?"'];
-  const result = parsePromptStep("test.jh", lines, 0, '"What?"', 3, "answer");
-  assert.equal(result.step.type, "prompt");
-  assert.equal(result.step.raw, '"What?"');
-  assert.equal(result.step.captureName, "answer");
-  if (result.step.type === "prompt") {
-    assert.equal(result.step.bodyKind, "string");
+  const result = parsePromptStep("test.jh", lines, 0, '"What?"', 3, "answer", trivia);
+  const body = unwrapPrompt(result.step);
+  assert.equal(body.raw, '"What?"');
+  if (result.step.type === "exec") {
+    assert.equal(result.step.captureName, "answer");
   }
+  assert.equal(trivia.getNode(body)?.bodyKind, "string");
 });
 
 test("parsePromptStep: parses prompt with returns schema (double-quoted)", () => {
   const lines = ['  prompt "Classify" returns "{ type: string }"'];
-  const result = parsePromptStep("test.jh", lines, 0, '"Classify" returns "{ type: string }"', 3);
-  assert.equal(result.step.type, "prompt");
-  assert.equal(result.step.raw, '"Classify"');
-  assert.equal(result.step.returns, "{ type: string }");
+  const result = parsePromptStep("test.jh", lines, 0, '"Classify" returns "{ type: string }"', 3, undefined, trivia);
+  const body = unwrapPrompt(result.step);
+  assert.equal(body.raw, '"Classify"');
+  assert.equal(body.returns, "{ type: string }");
 });
 
 test("parsePromptStep: rejects single-quoted returns schema", () => {
   const lines = ["  prompt \"Classify\" returns '{ type: string }'"];
   assert.throws(
-    () => parsePromptStep("test.jh", lines, 0, "\"Classify\" returns '{ type: string }'", 3),
+    () => parsePromptStep("test.jh", lines, 0, "\"Classify\" returns '{ type: string }'", 3, undefined, trivia),
     /single-quoted strings are not supported/,
   );
 });
@@ -53,7 +67,7 @@ test("parsePromptStep: multiline quoted prompt throws with clear error", () => {
     '  world"',
   ];
   assert.throws(
-    () => parsePromptStep("test.jh", lines, 0, '"Hello', 3),
+    () => parsePromptStep("test.jh", lines, 0, '"Hello', 3, undefined, trivia),
     /multiline prompt strings are no longer supported/,
   );
 });
@@ -62,36 +76,32 @@ test("parsePromptStep: multiline quoted prompt throws with clear error", () => {
 
 test("parsePromptStep: parses bare identifier prompt", () => {
   const lines = ['  prompt myVar'];
-  const result = parsePromptStep("test.jh", lines, 0, "myVar", 3);
-  assert.equal(result.step.type, "prompt");
-  if (result.step.type === "prompt") {
-    assert.equal(result.step.bodyKind, "identifier");
-    assert.equal(result.step.bodyIdentifier, "myVar");
-    assert.equal(result.step.raw, '"${myVar}"');
-    assert.equal(result.step.returns, undefined);
-  }
+  const result = parsePromptStep("test.jh", lines, 0, "myVar", 3, undefined, trivia);
+  const body = unwrapPrompt(result.step);
+  assert.equal(trivia.getNode(body)?.bodyKind, "identifier");
+  assert.equal(trivia.getNode(body)?.bodyIdentifier, "myVar");
+  assert.equal(body.raw, '"${myVar}"');
+  assert.equal(body.returns, undefined);
 });
 
 test("parsePromptStep: parses identifier prompt with returns", () => {
   const lines = ['  prompt myVar returns "{ type: string }"'];
-  const result = parsePromptStep("test.jh", lines, 0, 'myVar returns "{ type: string }"', 3);
-  assert.equal(result.step.type, "prompt");
-  if (result.step.type === "prompt") {
-    assert.equal(result.step.bodyKind, "identifier");
-    assert.equal(result.step.bodyIdentifier, "myVar");
-    assert.equal(result.step.returns, "{ type: string }");
-  }
+  const result = parsePromptStep("test.jh", lines, 0, 'myVar returns "{ type: string }"', 3, undefined, trivia);
+  const body = unwrapPrompt(result.step);
+  assert.equal(trivia.getNode(body)?.bodyKind, "identifier");
+  assert.equal(trivia.getNode(body)?.bodyIdentifier, "myVar");
+  assert.equal(body.returns, "{ type: string }");
 });
 
 test("parsePromptStep: parses captured identifier prompt", () => {
   const lines = ['  answer = prompt text'];
-  const result = parsePromptStep("test.jh", lines, 0, "text", 3, "answer");
-  assert.equal(result.step.type, "prompt");
-  assert.equal(result.step.captureName, "answer");
-  if (result.step.type === "prompt") {
-    assert.equal(result.step.bodyKind, "identifier");
-    assert.equal(result.step.bodyIdentifier, "text");
+  const result = parsePromptStep("test.jh", lines, 0, "text", 3, "answer", trivia);
+  const body = unwrapPrompt(result.step);
+  if (result.step.type === "exec") {
+    assert.equal(result.step.captureName, "answer");
   }
+  assert.equal(trivia.getNode(body)?.bodyKind, "identifier");
+  assert.equal(trivia.getNode(body)?.bodyIdentifier, "text");
 });
 
 // === parsePromptStep: triple-quoted block ===
@@ -103,14 +113,11 @@ test("parsePromptStep: parses triple-quoted block prompt", () => {
     'Analyze the following: ${input}',
     '"""',
   ];
-  const result = parsePromptStep("test.jh", lines, 0, '"""', 3);
-  assert.equal(result.step.type, "prompt");
-  if (result.step.type === "prompt") {
-    assert.equal(result.step.bodyKind, "triple_quoted");
-    // raw contains the body wrapped in quotes for runtime interpolation
-    assert.ok(result.step.raw.includes("You are a helpful assistant."));
-    assert.ok(result.step.raw.includes("${input}"));
-  }
+  const result = parsePromptStep("test.jh", lines, 0, '"""', 3, undefined, trivia);
+  const body = unwrapPrompt(result.step);
+  assert.equal(trivia.getNode(body)?.bodyKind, "triple_quoted");
+  assert.ok(body.raw.includes("You are a helpful assistant."));
+  assert.ok(body.raw.includes("${input}"));
 });
 
 test("parsePromptStep: parses captured triple-quoted block prompt", () => {
@@ -119,12 +126,12 @@ test("parsePromptStep: parses captured triple-quoted block prompt", () => {
     'Hello multiline',
     '"""',
   ];
-  const result = parsePromptStep("test.jh", lines, 0, '"""', 3, "answer");
-  assert.equal(result.step.type, "prompt");
-  assert.equal(result.step.captureName, "answer");
-  if (result.step.type === "prompt") {
-    assert.equal(result.step.bodyKind, "triple_quoted");
+  const result = parsePromptStep("test.jh", lines, 0, '"""', 3, "answer", trivia);
+  const body = unwrapPrompt(result.step);
+  if (result.step.type === "exec") {
+    assert.equal(result.step.captureName, "answer");
   }
+  assert.equal(trivia.getNode(body)?.bodyKind, "triple_quoted");
 });
 
 test("parsePromptStep: triple-quoted block may be followed by returns on the next line", () => {
@@ -134,12 +141,10 @@ test("parsePromptStep: triple-quoted block may be followed by returns on the nex
     '"""',
     'returns "{ role: string }"',
   ];
-  const result = parsePromptStep("test.jh", lines, 0, '"""', 3, "answer");
-  assert.equal(result.step.type, "prompt");
-  if (result.step.type === "prompt") {
-    assert.equal(result.step.bodyKind, "triple_quoted");
-    assert.equal(result.step.returns, "{ role: string }");
-  }
+  const result = parsePromptStep("test.jh", lines, 0, '"""', 3, "answer", trivia);
+  const body = unwrapPrompt(result.step);
+  assert.equal(trivia.getNode(body)?.bodyKind, "triple_quoted");
+  assert.equal(body.returns, "{ role: string }");
   assert.equal(result.nextLineIdx, 3);
 });
 
@@ -149,12 +154,10 @@ test("parsePromptStep: triple-quoted block may close with returns on same line",
     "Hello",
     '""" returns "{ role: string }"',
   ];
-  const result = parsePromptStep("test.jh", lines, 0, '"""', 3, "answer");
-  assert.equal(result.step.type, "prompt");
-  if (result.step.type === "prompt") {
-    assert.equal(result.step.bodyKind, "triple_quoted");
-    assert.equal(result.step.returns, "{ role: string }");
-  }
+  const result = parsePromptStep("test.jh", lines, 0, '"""', 3, "answer", trivia);
+  const body = unwrapPrompt(result.step);
+  assert.equal(trivia.getNode(body)?.bodyKind, "triple_quoted");
+  assert.equal(body.returns, "{ role: string }");
   assert.equal(result.nextLineIdx, 2);
 });
 
@@ -165,13 +168,11 @@ test("parsePromptStep: unterminated triple-quoted block throws", () => {
     'no closing triple-quote',
   ];
   assert.throws(
-    () => parsePromptStep("test.jh", lines, 0, '"""', 3),
+    () => parsePromptStep("test.jh", lines, 0, '"""', 3, undefined, trivia),
     /unterminated triple-quoted block/,
   );
 });
 
-// === parsePromptStep: triple-backtick fences are rejected for prompts ===
-
 test("parsePromptStep: triple-backtick fence is rejected with guidance", () => {
   const lines = [
     '  prompt ```',
@@ -179,17 +180,15 @@ test("parsePromptStep: triple-backtick fence is rejected with guidance", () => {
     '```',
   ];
   assert.throws(
-    () => parsePromptStep("test.jh", lines, 0, "```", 3),
+    () => parsePromptStep("test.jh", lines, 0, "```", 3, undefined, trivia),
     /prompt blocks use triple quotes.*triple backticks are for scripts/,
   );
 });
 
-// === parsePromptStep: errors ===
-
 test("parsePromptStep: unterminated single-line string throws", () => {
   const lines = ['  prompt "Hello'];
   assert.throws(
-    () => parsePromptStep("test.jh", lines, 0, '"Hello', 3),
+    () => parsePromptStep("test.jh", lines, 0, '"Hello', 3, undefined, trivia),
     /multiline prompt strings are no longer supported/,
   );
 });
@@ -197,7 +196,7 @@ test("parsePromptStep: unterminated single-line string throws", () => {
 test("parsePromptStep: invalid text after prompt string throws", () => {
   const lines = ['  prompt "Hello" garbage'];
   assert.throws(
-    () => parsePromptStep("test.jh", lines, 0, '"Hello" garbage', 3),
+    () => parsePromptStep("test.jh", lines, 0, '"Hello" garbage', 3, undefined, trivia),
     /expected keyword "returns"/,
   );
 });
@@ -205,16 +204,14 @@ test("parsePromptStep: invalid text after prompt string throws", () => {
 test("parsePromptStep: unterminated returns schema throws", () => {
   const lines = ['  prompt "Hello" returns "{ type: string'];
   assert.throws(
-    () => parsePromptStep("test.jh", lines, 0, '"Hello" returns "{ type: string', 3),
+    () => parsePromptStep("test.jh", lines, 0, '"Hello" returns "{ type: string', 3, undefined, trivia),
     /unterminated returns schema/,
   );
 });
 
 test("parsePromptStep: returns with double-quoted schema", () => {
   const lines = ['  prompt "Classify" returns "{ type: string }"'];
-  const result = parsePromptStep("test.jh", lines, 0, '"Classify" returns "{ type: string }"', 3);
-  assert.equal(result.step.type, "prompt");
-  if (result.step.type === "prompt") {
-    assert.equal(result.step.returns, "{ type: string }");
-  }
+  const result = parsePromptStep("test.jh", lines, 0, '"Classify" returns "{ type: string }"', 3, undefined, trivia);
+  const body = unwrapPrompt(result.step);
+  assert.equal(body.returns, "{ type: string }");
 });
diff --git a/src/parse/parse-return.test.ts b/src/parse/parse-return.test.ts
index 3478a418..ea40480f 100644
--- a/src/parse/parse-return.test.ts
+++ b/src/parse/parse-return.test.ts
@@ -2,7 +2,7 @@ import test from "node:test";
 import assert from "node:assert/strict";
 import { parsejaiph } from "../parser";
 
-test("return run parses managed run call", () => {
+test("return run parses Expr.call", () => {
   const mod = parsejaiph(
     `workflow default() {\n  return run helper()\n}`,
     "test.jh",
@@ -10,26 +10,27 @@ test("return run parses managed run call", () => {
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "return");
   if (step.type === "return") {
-    assert.ok(step.managed);
-    assert.equal(step.managed!.kind, "run");
-    assert.equal(step.managed!.ref.value, "helper");
-    assert.equal(step.managed!.args, undefined);
-    assert.equal(step.value, "run helper()");
+    assert.equal(step.value.kind, "call");
+    if (step.value.kind === "call") {
+      assert.equal(step.value.callee.value, "helper");
+      assert.equal(step.value.args, undefined);
+    }
   }
 });
 
-test("return run parses managed run call with args", () => {
+test("return run parses Expr.call with args", () => {
   const mod = parsejaiph(
     `workflow default() {\n  return run helper("a", "b")\n}`,
     "test.jh",
   );
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "return");
-  if (step.type === "return") {
-    assert.ok(step.managed);
-    assert.equal(step.managed!.kind, "run");
-    assert.equal(step.managed!.ref.value, "helper");
-    assert.equal(step.managed!.args, '"a" "b"');
+  if (step.type === "return" && step.value.kind === "call") {
+    assert.equal(step.value.callee.value, "helper");
+    assert.deepEqual(step.value.args, [
+      { kind: "literal", raw: '"a"' },
+      { kind: "literal", raw: '"b"' },
+    ]);
   }
 });
 
@@ -40,14 +41,12 @@ test("return run parses dotted ref", () => {
   );
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "return");
-  if (step.type === "return") {
-    assert.ok(step.managed);
-    assert.equal(step.managed!.kind, "run");
-    assert.equal(step.managed!.ref.value, "lib.helper");
+  if (step.type === "return" && step.value.kind === "call") {
+    assert.equal(step.value.callee.value, "lib.helper");
   }
 });
 
-test("return ensure parses managed ensure call", () => {
+test("return ensure parses Expr.ensure_call", () => {
   const mod = parsejaiph(
     `workflow default() {\n  return ensure check()\n}`,
     "test.jh",
@@ -55,60 +54,52 @@ test("return ensure parses managed ensure call", () => {
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "return");
   if (step.type === "return") {
-    assert.ok(step.managed);
-    assert.equal(step.managed!.kind, "ensure");
-    assert.equal(step.managed!.ref.value, "check");
-    assert.equal(step.managed!.args, undefined);
-    assert.equal(step.value, "ensure check()");
+    assert.equal(step.value.kind, "ensure_call");
+    if (step.value.kind === "ensure_call") {
+      assert.equal(step.value.callee.value, "check");
+      assert.equal(step.value.args, undefined);
+    }
   }
 });
 
-test("return ensure parses managed ensure call with args", () => {
+test("return ensure parses Expr.ensure_call with args", () => {
   const mod = parsejaiph(
     `workflow default() {\n  return ensure check("x")\n}`,
     "test.jh",
   );
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "return");
-  if (step.type === "return") {
-    assert.ok(step.managed);
-    assert.equal(step.managed!.kind, "ensure");
-    assert.equal(step.managed!.args, '"x"');
+  if (step.type === "return" && step.value.kind === "ensure_call") {
+    assert.deepEqual(step.value.args, [{ kind: "literal", raw: '"x"' }]);
   }
 });
 
-test("return run in rule parses managed run call", () => {
+test("return run in rule parses Expr.call", () => {
   const mod = parsejaiph(
     `script helper = \`echo "ok"\`\nrule my_rule() {\n  return run helper()\n}`,
     "test.jh",
   );
   const step = mod.rules[0].steps[0];
   assert.equal(step.type, "return");
-  if (step.type === "return") {
-    assert.ok(step.managed);
-    assert.equal(step.managed!.kind, "run");
-    assert.equal(step.managed!.ref.value, "helper");
+  if (step.type === "return" && step.value.kind === "call") {
+    assert.equal(step.value.callee.value, "helper");
   }
 });
 
-test("return ensure in rule parses managed ensure call", () => {
+test("return ensure in rule parses Expr.ensure_call", () => {
   const mod = parsejaiph(
     `rule sub_rule() {\n  return "ok"\n}\nrule my_rule() {\n  return ensure sub_rule()\n}`,
     "test.jh",
   );
-  const step = mod.rules[0].steps[1];
-  // The rule that contains `return ensure sub_rule()` is my_rule (index 1)
   const myRule = mod.rules.find(r => r.name === "my_rule")!;
   const retStep = myRule.steps[0];
   assert.equal(retStep.type, "return");
-  if (retStep.type === "return") {
-    assert.ok(retStep.managed);
-    assert.equal(retStep.managed!.kind, "ensure");
-    assert.equal(retStep.managed!.ref.value, "sub_rule");
+  if (retStep.type === "return" && retStep.value.kind === "ensure_call") {
+    assert.equal(retStep.value.callee.value, "sub_rule");
   }
 });
 
-test("return with string value has no managed field", () => {
+test("return with string value is Expr.literal", () => {
   const mod = parsejaiph(
     `workflow default() {\n  return "hello"\n}`,
     "test.jh",
@@ -116,12 +107,14 @@ test("return with string value has no managed field", () => {
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "return");
   if (step.type === "return") {
-    assert.equal(step.managed, undefined);
-    assert.equal(step.value, '"hello"');
+    assert.equal(step.value.kind, "literal");
+    if (step.value.kind === "literal") {
+      assert.equal(step.value.raw, '"hello"');
+    }
   }
 });
 
-test("bare return has no managed field", () => {
+test("bare return is Expr.literal with empty string", () => {
   const mod = parsejaiph(
     `workflow default() {\n  return\n}`,
     "test.jh",
@@ -129,25 +122,25 @@ test("bare return has no managed field", () => {
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "return");
   if (step.type === "return") {
-    assert.equal(step.managed, undefined);
-    assert.equal(step.value, '""');
+    assert.equal(step.value.kind, "literal");
+    if (step.value.kind === "literal") {
+      assert.equal(step.value.raw, '""');
+    }
   }
 });
 
-test("return run inline script parses managed inline script", () => {
+test("return run inline script parses Expr.inline_script", () => {
   const mod = parsejaiph(
     "workflow default() {\n  return run `cat report.txt`()\n}",
     "test.jh",
   );
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "return");
-  if (step.type === "return") {
-    assert.ok(step.managed);
-    assert.equal(step.managed!.kind, "run_inline_script");
-    if (step.managed!.kind === "run_inline_script") {
-      assert.equal(step.managed!.body, "cat report.txt");
-      assert.equal(step.managed!.args, undefined);
-    }
+  if (step.type === "return" && step.value.kind === "inline_script") {
+    assert.equal(step.value.body, "cat report.txt");
+    assert.equal(step.value.args, undefined);
+  } else {
+    assert.fail(`expected return/inline_script, got ${step.type}`);
   }
 });
 
@@ -158,13 +151,9 @@ test("return run inline script with args", () => {
   );
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "return");
-  if (step.type === "return") {
-    assert.ok(step.managed);
-    assert.equal(step.managed!.kind, "run_inline_script");
-    if (step.managed!.kind === "run_inline_script") {
-      assert.equal(step.managed!.body, "echo $1");
-      assert.equal(step.managed!.args, '"x"');
-    }
+  if (step.type === "return" && step.value.kind === "inline_script") {
+    assert.equal(step.value.body, "echo $1");
+    assert.deepEqual(step.value.args, [{ kind: "literal", raw: '"x"' }]);
   }
 });
 
@@ -175,18 +164,20 @@ test("return bare inline script is rejected", () => {
   );
 });
 
-test("log run inline script parses managed inline script", () => {
+test("log run inline script parses say with inline_script message", () => {
   const mod = parsejaiph(
     "workflow default() {\n  log run `cat report.txt`()\n}",
     "test.jh",
   );
   const step = mod.workflows[0].steps[0];
-  assert.equal(step.type, "log");
-  if (step.type === "log") {
-    assert.ok(step.managed);
-    assert.equal(step.managed!.kind, "run_inline_script");
-    assert.equal(step.managed!.body, "cat report.txt");
-    assert.equal(step.managed!.args, undefined);
+  assert.equal(step.type, "say");
+  if (step.type === "say") {
+    assert.equal(step.level, "log");
+    assert.equal(step.message.kind, "inline_script");
+    if (step.message.kind === "inline_script") {
+      assert.equal(step.message.body, "cat report.txt");
+      assert.equal(step.message.args, undefined);
+    }
   }
 });
 
@@ -196,12 +187,10 @@ test("log run inline script with args", () => {
     "test.jh",
   );
   const step = mod.workflows[0].steps[0];
-  assert.equal(step.type, "log");
-  if (step.type === "log") {
-    assert.ok(step.managed);
-    assert.equal(step.managed!.kind, "run_inline_script");
-    assert.equal(step.managed!.body, "echo $1");
-    assert.equal(step.managed!.args, '"x"');
+  assert.equal(step.type, "say");
+  if (step.type === "say" && step.message.kind === "inline_script") {
+    assert.equal(step.message.body, "echo $1");
+    assert.deepEqual(step.message.args, [{ kind: "literal", raw: '"x"' }]);
   }
 });
 
@@ -219,16 +208,15 @@ test("logerr bare inline script is rejected", () => {
   );
 });
 
-test("return bare identifier is sugar for interpolated string", () => {
+test("return bare identifier is sugar for interpolated literal", () => {
   const mod = parsejaiph(
     `workflow default() {\n  const response = "hello"\n  return response\n}`,
     "test.jh",
   );
   const step = mod.workflows[0].steps[1];
   assert.equal(step.type, "return");
-  if (step.type === "return") {
-    assert.equal(step.managed, undefined);
-    assert.equal(step.value, '"${response}"');
+  if (step.type === "return" && step.value.kind === "literal") {
+    assert.equal(step.value.raw, '"${response}"');
   }
 });
 
@@ -249,8 +237,8 @@ test("return bare identifier in brace block (if body)", () => {
   if (ifStep.type === "if") {
     const retStep = ifStep.body[0];
     assert.equal(retStep.type, "return");
-    if (retStep.type === "return") {
-      assert.equal(retStep.value, '"${msg}"');
+    if (retStep.type === "return" && retStep.value.kind === "literal") {
+      assert.equal(retStep.value.raw, '"${msg}"');
     }
   }
 });
@@ -270,14 +258,14 @@ test("return bare identifier in catch/recover block", () => {
     "test.jh",
   );
   const ensureStep = mod.workflows[0].steps[0];
-  assert.equal(ensureStep.type, "ensure");
-  if (ensureStep.type === "ensure") {
+  assert.equal(ensureStep.type, "exec");
+  if (ensureStep.type === "exec" && ensureStep.body.kind === "ensure_call") {
     assert.ok(ensureStep.catch);
     const recoverSteps = "block" in ensureStep.catch! ? ensureStep.catch!.block : [ensureStep.catch!.single];
     const retStep = recoverSteps[0];
     assert.equal(retStep.type, "return");
-    if (retStep.type === "return") {
-      assert.equal(retStep.value, '"${err}"');
+    if (retStep.type === "return" && retStep.value.kind === "literal") {
+      assert.equal(retStep.value.raw, '"${err}"');
     }
   }
 });
@@ -298,16 +286,14 @@ test("return run in ensure recover block", () => {
     "test.jh",
   );
   const ensureStep = mod.workflows[0].steps[0];
-  assert.equal(ensureStep.type, "ensure");
-  if (ensureStep.type === "ensure") {
+  assert.equal(ensureStep.type, "exec");
+  if (ensureStep.type === "exec" && ensureStep.body.kind === "ensure_call") {
     assert.ok(ensureStep.catch);
     const recoverSteps = "block" in ensureStep.catch! ? ensureStep.catch!.block : [ensureStep.catch!.single];
     const retStep = recoverSteps[0];
     assert.equal(retStep.type, "return");
-    if (retStep.type === "return") {
-      assert.ok(retStep.managed);
-      assert.equal(retStep.managed!.kind, "run");
-      assert.equal(retStep.managed!.ref.value, "helper");
+    if (retStep.type === "return" && retStep.value.kind === "call") {
+      assert.equal(retStep.value.callee.value, "helper");
     }
   }
 });
diff --git a/src/parse/parse-run-async.test.ts b/src/parse/parse-run-async.test.ts
index 7727ae46..1c750f32 100644
--- a/src/parse/parse-run-async.test.ts
+++ b/src/parse/parse-run-async.test.ts
@@ -2,7 +2,7 @@ import test from "node:test";
 import assert from "node:assert/strict";
 import { parsejaiph } from "../parser";
 
-test("parse: run async produces run step with async flag", () => {
+test("parse: run async produces exec/call with async flag on the body", () => {
   const src = [
     "workflow default() {",
     "  run async some_wf()",
@@ -10,26 +10,29 @@ test("parse: run async produces run step with async flag", () => {
   ].join("\n");
   const mod = parsejaiph(src, "test.jh");
   const step = mod.workflows[0]!.steps[0]!;
-  assert.equal(step.type, "run");
-  if (step.type === "run") {
-    assert.equal(step.workflow.value, "some_wf");
-    assert.equal(step.async, true);
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "call") {
+    assert.equal(step.body.callee.value, "some_wf");
+    assert.equal(step.body.async, true);
   }
 });
 
 test("parse: run async with args", () => {
   const src = [
     "workflow default() {",
-    '  run async other_wf("hello" "$x")',
+    '  run async other_wf("hello", "$x")',
     "}",
   ].join("\n");
   const mod = parsejaiph(src, "test.jh");
   const step = mod.workflows[0]!.steps[0]!;
-  assert.equal(step.type, "run");
-  if (step.type === "run") {
-    assert.equal(step.workflow.value, "other_wf");
-    assert.equal(step.args, '"hello" "$x"');
-    assert.equal(step.async, true);
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "call") {
+    assert.equal(step.body.callee.value, "other_wf");
+    assert.deepEqual(step.body.args, [
+      { kind: "literal", raw: '"hello"' },
+      { kind: "literal", raw: '"$x"' },
+    ]);
+    assert.equal(step.body.async, true);
   }
 });
 
@@ -41,10 +44,10 @@ test("parse: run async with qualified ref", () => {
   ].join("\n");
   const mod = parsejaiph(src, "test.jh");
   const step = mod.workflows[0]!.steps[0]!;
-  assert.equal(step.type, "run");
-  if (step.type === "run") {
-    assert.equal(step.workflow.value, "mod.some_wf");
-    assert.equal(step.async, true);
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "call") {
+    assert.equal(step.body.callee.value, "mod.some_wf");
+    assert.equal(step.body.async, true);
   }
 });
 
@@ -56,9 +59,9 @@ test("parse: regular run does not have async flag", () => {
   ].join("\n");
   const mod = parsejaiph(src, "test.jh");
   const step = mod.workflows[0]!.steps[0]!;
-  assert.equal(step.type, "run");
-  if (step.type === "run") {
-    assert.equal(step.async, undefined);
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "call") {
+    assert.equal(step.body.async, undefined);
   }
 });
 
@@ -74,7 +77,7 @@ test("parse: capture + run async is rejected without const", () => {
   );
 });
 
-test("parse: const capture + run async produces run_capture with async flag", () => {
+test("parse: const capture + run async produces Expr.call with async flag", () => {
   const src = [
     "workflow default() {",
     "  const h = run async some_wf()",
@@ -83,13 +86,10 @@ test("parse: const capture + run async produces run_capture with async flag", ()
   const mod = parsejaiph(src, "test.jh");
   const step = mod.workflows[0]!.steps[0]!;
   assert.equal(step.type, "const");
-  if (step.type === "const") {
+  if (step.type === "const" && step.value.kind === "call") {
     assert.equal(step.name, "h");
-    assert.equal(step.value.kind, "run_capture");
-    if (step.value.kind === "run_capture") {
-      assert.equal(step.value.ref.value, "some_wf");
-      assert.equal(step.value.async, true);
-    }
+    assert.equal(step.value.callee.value, "some_wf");
+    assert.equal(step.value.async, true);
   }
 });
 
@@ -102,13 +102,10 @@ test("parse: const capture + run async with args", () => {
   const mod = parsejaiph(src, "test.jh");
   const step = mod.workflows[0]!.steps[0]!;
   assert.equal(step.type, "const");
-  if (step.type === "const") {
-    assert.equal(step.value.kind, "run_capture");
-    if (step.value.kind === "run_capture") {
-      assert.equal(step.value.ref.value, "other_wf");
-      assert.equal(step.value.args, '"hello"');
-      assert.equal(step.value.async, true);
-    }
+  if (step.type === "const" && step.value.kind === "call") {
+    assert.equal(step.value.callee.value, "other_wf");
+    assert.deepEqual(step.value.args, [{ kind: "literal", raw: '"hello"' }]);
+    assert.equal(step.value.async, true);
   }
 });
 
@@ -120,15 +117,15 @@ test("parse: run async with recover block", () => {
   ].join("\n");
   const mod = parsejaiph(src, "test.jh");
   const step = mod.workflows[0]!.steps[0]!;
-  assert.equal(step.type, "run");
-  if (step.type === "run") {
-    assert.equal(step.workflow.value, "foo");
-    assert.equal(step.async, true);
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "call") {
+    assert.equal(step.body.callee.value, "foo");
+    assert.equal(step.body.async, true);
     assert.ok(step.recover);
     if (step.recover && "block" in step.recover) {
       assert.equal(step.recover.bindings.failure, "err");
       assert.equal(step.recover.block.length, 1);
-      assert.equal(step.recover.block[0].type, "log");
+      assert.equal(step.recover.block[0].type, "say");
     }
   }
 });
@@ -144,9 +141,9 @@ test("parse: run async with multi-line recover block", () => {
   ].join("\n");
   const mod = parsejaiph(src, "test.jh");
   const step = mod.workflows[0]!.steps[0]!;
-  assert.equal(step.type, "run");
-  if (step.type === "run") {
-    assert.equal(step.async, true);
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "call") {
+    assert.equal(step.body.async, true);
     assert.ok(step.recover);
     if (step.recover && "block" in step.recover) {
       assert.equal(step.recover.block.length, 2);
@@ -162,10 +159,10 @@ test("parse: run async with catch block", () => {
   ].join("\n");
   const mod = parsejaiph(src, "test.jh");
   const step = mod.workflows[0]!.steps[0]!;
-  assert.equal(step.type, "run");
-  if (step.type === "run") {
-    assert.equal(step.workflow.value, "bar");
-    assert.equal(step.async, true);
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "call") {
+    assert.equal(step.body.callee.value, "bar");
+    assert.equal(step.body.async, true);
     assert.ok(step.catch);
     if (step.catch && "block" in step.catch) {
       assert.equal(step.catch.bindings.failure, "e");
diff --git a/src/parse/parse-send-rhs.test.ts b/src/parse/parse-send-rhs.test.ts
index 67754ef6..f6b7cb0e 100644
--- a/src/parse/parse-send-rhs.test.ts
+++ b/src/parse/parse-send-rhs.test.ts
@@ -2,16 +2,16 @@ import test from "node:test";
 import assert from "node:assert/strict";
 import { parseSendRhs } from "./send-rhs";
 
-// === parseSendRhs: empty/whitespace RHS is now rejected ===
+// === parseSendRhs: empty/whitespace RHS is rejected ===
 
-test("parseSendRhs: empty RHS returns forward kind", () => {
+test("parseSendRhs: empty RHS throws", () => {
   assert.throws(
     () => parseSendRhs("test.jh", "", 1, 1),
     /send requires an explicit payload/,
   );
 });
 
-test("parseSendRhs: whitespace-only RHS returns forward kind", () => {
+test("parseSendRhs: whitespace-only RHS throws", () => {
   assert.throws(
     () => parseSendRhs("test.jh", "   ", 1, 1),
     /send requires an explicit payload/,
@@ -20,19 +20,19 @@ test("parseSendRhs: whitespace-only RHS returns forward kind", () => {
 
 // === parseSendRhs: literal ===
 
-test("parseSendRhs: quoted string returns literal kind", () => {
-  const { rhs } = parseSendRhs("test.jh", '"hello world"', 1, 1);
-  assert.equal(rhs.kind, "literal");
-  if (rhs.kind === "literal") {
-    assert.equal(rhs.token, '"hello world"');
+test("parseSendRhs: quoted string returns Expr.literal", () => {
+  const { value } = parseSendRhs("test.jh", '"hello world"', 1, 1);
+  assert.equal(value.kind, "literal");
+  if (value.kind === "literal") {
+    assert.equal(value.raw, '"hello world"');
   }
 });
 
 test("parseSendRhs: quoted string with escaped quote", () => {
-  const { rhs } = parseSendRhs("test.jh", '"say \\"hi\\""', 1, 1);
-  assert.equal(rhs.kind, "literal");
-  if (rhs.kind === "literal") {
-    assert.equal(rhs.token, '"say \\"hi\\""');
+  const { value } = parseSendRhs("test.jh", '"say \\"hi\\""', 1, 1);
+  assert.equal(value.kind, "literal");
+  if (value.kind === "literal") {
+    assert.equal(value.raw, '"say \\"hi\\""');
   }
 });
 
@@ -50,68 +50,68 @@ test("parseSendRhs: trailing content after quoted string throws", () => {
   );
 });
 
-// === parseSendRhs: run ===
+// === parseSendRhs: call ===
 
-test("parseSendRhs: run call returns run kind", () => {
-  const { rhs } = parseSendRhs("test.jh", "run my_script()", 1, 5);
-  assert.equal(rhs.kind, "run");
-  if (rhs.kind === "run") {
-    assert.equal(rhs.ref.value, "my_script");
-    assert.equal(rhs.ref.loc.line, 1);
-    assert.equal(rhs.ref.loc.col, 5);
+test("parseSendRhs: run call returns Expr.call", () => {
+  const { value } = parseSendRhs("test.jh", "run my_script()", 1, 5);
+  assert.equal(value.kind, "call");
+  if (value.kind === "call") {
+    assert.equal(value.callee.value, "my_script");
+    assert.equal(value.callee.loc.line, 1);
+    assert.equal(value.callee.loc.col, 5);
   }
 });
 
 test("parseSendRhs: run call with args", () => {
-  const { rhs } = parseSendRhs("test.jh", 'run my_script("arg1")', 1, 1);
-  assert.equal(rhs.kind, "run");
-  if (rhs.kind === "run") {
-    assert.equal(rhs.ref.value, "my_script");
-    assert.equal(rhs.args, '"arg1"');
+  const { value } = parseSendRhs("test.jh", 'run my_script("arg1")', 1, 1);
+  assert.equal(value.kind, "call");
+  if (value.kind === "call") {
+    assert.equal(value.callee.value, "my_script");
+    assert.deepEqual(value.args, [{ kind: "literal", raw: '"arg1"' }]);
   }
 });
 
 test("parseSendRhs: run call with dotted ref", () => {
-  const { rhs } = parseSendRhs("test.jh", "run lib.process()", 1, 1);
-  assert.equal(rhs.kind, "run");
-  if (rhs.kind === "run") {
-    assert.equal(rhs.ref.value, "lib.process");
+  const { value } = parseSendRhs("test.jh", "run lib.process()", 1, 1);
+  assert.equal(value.kind, "call");
+  if (value.kind === "call") {
+    assert.equal(value.callee.value, "lib.process");
   }
 });
 
-// === parseSendRhs: var ===
+// === parseSendRhs: bare variable (`$name`) is Expr.literal in the new model ===
 
-test("parseSendRhs: simple variable returns var kind", () => {
-  const { rhs } = parseSendRhs("test.jh", "$myVar", 1, 1);
-  assert.equal(rhs.kind, "var");
-  if (rhs.kind === "var") {
-    assert.equal(rhs.bash, "$myVar");
+test("parseSendRhs: simple variable returns Expr.literal", () => {
+  const { value } = parseSendRhs("test.jh", "$myVar", 1, 1);
+  assert.equal(value.kind, "literal");
+  if (value.kind === "literal") {
+    assert.equal(value.raw, "$myVar");
   }
 });
 
 test("parseSendRhs: underscore variable", () => {
-  const { rhs } = parseSendRhs("test.jh", "$_name", 1, 1);
-  assert.equal(rhs.kind, "var");
-  if (rhs.kind === "var") {
-    assert.equal(rhs.bash, "$_name");
+  const { value } = parseSendRhs("test.jh", "$_name", 1, 1);
+  assert.equal(value.kind, "literal");
+  if (value.kind === "literal") {
+    assert.equal(value.raw, "$_name");
   }
 });
 
 // === parseSendRhs: braced variable ===
 
-test("parseSendRhs: braced variable returns var kind", () => {
-  const { rhs } = parseSendRhs("test.jh", "${myVar}", 1, 1);
-  assert.equal(rhs.kind, "var");
-  if (rhs.kind === "var") {
-    assert.equal(rhs.bash, "${myVar}");
+test("parseSendRhs: braced variable returns Expr.literal", () => {
+  const { value } = parseSendRhs("test.jh", "${myVar}", 1, 1);
+  assert.equal(value.kind, "literal");
+  if (value.kind === "literal") {
+    assert.equal(value.raw, "${myVar}");
   }
 });
 
 test("parseSendRhs: nested braced variable", () => {
-  const { rhs } = parseSendRhs("test.jh", "${outer_${inner}}", 1, 1);
-  assert.equal(rhs.kind, "var");
-  if (rhs.kind === "var") {
-    assert.equal(rhs.bash, "${outer_${inner}}");
+  const { value } = parseSendRhs("test.jh", "${outer_${inner}}", 1, 1);
+  assert.equal(value.kind, "literal");
+  if (value.kind === "literal") {
+    assert.equal(value.raw, "${outer_${inner}}");
   }
 });
 
@@ -138,37 +138,37 @@ test("parseSendRhs: braced variable with command substitution throws", () => {
 
 // === parseSendRhs: bare_ref ===
 
-test("parseSendRhs: bare dotted ref returns bare_ref kind", () => {
-  const { rhs } = parseSendRhs("test.jh", "lib.handler", 1, 3);
-  assert.equal(rhs.kind, "bare_ref");
-  if (rhs.kind === "bare_ref") {
-    assert.equal(rhs.ref.value, "lib.handler");
-    assert.equal(rhs.ref.loc.line, 1);
-    assert.equal(rhs.ref.loc.col, 3);
+test("parseSendRhs: bare dotted ref returns Expr.bare_ref", () => {
+  const { value } = parseSendRhs("test.jh", "lib.handler", 1, 3);
+  assert.equal(value.kind, "bare_ref");
+  if (value.kind === "bare_ref") {
+    assert.equal(value.ref.value, "lib.handler");
+    assert.equal(value.ref.loc.line, 1);
+    assert.equal(value.ref.loc.col, 3);
   }
 });
 
 // === parseSendRhs: shell ===
 
-test("parseSendRhs: unrecognized expression returns shell kind", () => {
-  const { rhs } = parseSendRhs("test.jh", "echo hello | grep h", 1, 1);
-  assert.equal(rhs.kind, "shell");
-  if (rhs.kind === "shell") {
-    assert.equal(rhs.command, "echo hello | grep h");
-    assert.equal(rhs.loc.line, 1);
-    assert.equal(rhs.loc.col, 1);
+test("parseSendRhs: unrecognized expression returns Expr.shell", () => {
+  const { value } = parseSendRhs("test.jh", "echo hello | grep h", 1, 1);
+  assert.equal(value.kind, "shell");
+  if (value.kind === "shell") {
+    assert.equal(value.command, "echo hello | grep h");
+    assert.equal(value.loc.line, 1);
+    assert.equal(value.loc.col, 1);
   }
 });
 
 // === parseSendRhs: triple-quoted literal ===
 
-test("parseSendRhs: triple-quoted string returns literal kind", () => {
+test("parseSendRhs: triple-quoted string returns Expr.literal", () => {
   const lines = ['ch <- """', "  hello", "  world", '"""'];
-  const { rhs, nextIdx } = parseSendRhs("test.jh", '"""', 1, 6, lines, 0);
-  assert.equal(rhs.kind, "literal");
-  if (rhs.kind === "literal") {
-    assert.ok(rhs.token.includes("hello"));
-    assert.ok(rhs.token.includes("world"));
+  const { value, nextIdx } = parseSendRhs("test.jh", '"""', 1, 6, lines, 0);
+  assert.equal(value.kind, "literal");
+  if (value.kind === "literal") {
+    assert.ok(value.raw.includes("hello"));
+    assert.ok(value.raw.includes("world"));
   }
   assert.equal(nextIdx, 4);
 });
diff --git a/src/parse/parse-steps.test.ts b/src/parse/parse-steps.test.ts
index c4a20985..999b3f09 100644
--- a/src/parse/parse-steps.test.ts
+++ b/src/parse/parse-steps.test.ts
@@ -1,255 +1,249 @@
 import test from "node:test";
 import assert from "node:assert/strict";
 import { parsejaiph } from "../parser";
-import { parseEnsureStep, parseRunRecoverStep } from "./steps";
-
-// === parseEnsureStep: basic ensure without catch ===
-
-test("parseEnsureStep: parses basic ensure call", () => {
-  const lines = ["  ensure my_rule()"];
-  const { step, nextIdx } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule()");
-  assert.equal(step.type, "ensure");
-  if (step.type === "ensure") {
-    assert.equal(step.ref.value, "my_rule");
-    assert.equal(step.catch, undefined);
+import type { WorkflowStepDef } from "../types";
+
+/**
+ * After Refactor 2 the per-host catch/recover parsers (`parseEnsureStep`,
+ * `parseRunCatchStep`, `parseRunRecoverStep`) and their mini body parser
+ * (`parseCatchStatement`) are gone. The contract is now exercised end-to-end
+ * through `parsejaiph` — `parseAttachedBlock` (in `src/parse/steps.ts`)
+ * delegates body parsing to the same `parseBlockStatement` used at the top
+ * level.
+ */
+
+function asEnsureExec(step: WorkflowStepDef) {
+  if (step.type !== "exec" || step.body.kind !== "ensure_call") {
+    throw new Error(`expected exec/ensure_call step, got ${step.type}`);
   }
-  assert.equal(nextIdx, 0);
-});
+  return step;
+}
+function asRunExec(step: WorkflowStepDef) {
+  if (step.type !== "exec" || step.body.kind !== "call") {
+    throw new Error(`expected exec/call step, got ${step.type}`);
+  }
+  return step;
+}
 
-test("parseEnsureStep: parses ensure with args", () => {
-  const lines = ['  ensure my_rule("arg1")'];
-  const { step } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], 'my_rule("arg1")');
-  if (step.type === "ensure") {
-    assert.equal(step.ref.value, "my_rule");
-    assert.equal(step.args, '"arg1"');
+function parseOneWorkflowStep(bodyLines: string[]): WorkflowStepDef {
+  const src = ["workflow w() {", ...bodyLines.map((l) => `  ${l}`), "}", ""].join("\n");
+  const mod = parsejaiph(src, "fixture.jh");
+  const w = mod.workflows.find((x) => x.name === "w");
+  if (!w) throw new Error("workflow not found");
+  const steps = w.steps.filter((s) => s.type !== "trivia");
+  if (steps.length !== 1) throw new Error(`expected one step, got ${steps.length}`);
+  return steps[0];
+}
+
+// === ensure: basic ===
+
+test("ensure: parses basic ensure call", () => {
+  const e = asEnsureExec(parseOneWorkflowStep(["ensure my_rule()"]));
+  assert.equal(e.body.kind, "ensure_call");
+  if (e.body.kind === "ensure_call") {
+    assert.equal(e.body.callee.value, "my_rule");
   }
+  assert.equal(e.catch, undefined);
 });
 
-test("parseEnsureStep: parses ensure with dotted ref", () => {
-  const lines = ["  ensure lib.check()"];
-  const { step } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], "lib.check()");
-  if (step.type === "ensure") {
-    assert.equal(step.ref.value, "lib.check");
+test("ensure: parses ensure with args", () => {
+  const e = asEnsureExec(parseOneWorkflowStep(['ensure my_rule("arg1")']));
+  if (e.body.kind === "ensure_call") {
+    assert.equal(e.body.callee.value, "my_rule");
+    assert.deepEqual(e.body.args, [{ kind: "literal", raw: '"arg1"' }]);
   }
 });
 
-test("parseEnsureStep: parses ensure with captureName", () => {
-  const lines = ["  result = ensure my_rule()"];
-  const { step } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule()", "result");
-  if (step.type === "ensure") {
-    assert.equal(step.captureName, "result");
+test("ensure: parses ensure with dotted ref", () => {
+  const e = asEnsureExec(parseOneWorkflowStep(["ensure lib.check()"]));
+  if (e.body.kind === "ensure_call") {
+    assert.equal(e.body.callee.value, "lib.check");
   }
 });
 
-test("parseEnsureStep: ensure without parens parses as zero-arg call", () => {
-  const lines = ["  ensure my_rule"];
+test("ensure: ensure without parens throws", () => {
   assert.throws(
-    () => parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule"),
+    () => parseOneWorkflowStep(["ensure my_rule"]),
     /parentheses are required/,
   );
 });
 
-// === parseEnsureStep: catch with single statement ===
+// === ensure catch: single statement forms ===
 
-test("parseEnsureStep: parses ensure with single catch statement", () => {
-  const lines = ['  ensure my_rule() catch (failure) log "failed"'];
-  const { step } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], 'my_rule() catch (failure) log "failed"');
-  if (step.type === "ensure") {
-    assert.ok(step.catch);
-    assert.equal(step.catch.bindings.failure, "failure");
-    if ("single" in step.catch) {
-      assert.equal(step.catch.single.type, "log");
-    }
+test("ensure catch: parses single catch log statement", () => {
+  const e = asEnsureExec(parseOneWorkflowStep(['ensure my_rule() catch (failure) log "failed"']));
+  assert.ok(e.catch);
+  assert.equal(e.catch!.bindings.failure, "failure");
+  if (e.catch && "single" in e.catch) {
+    assert.equal(e.catch.single.type, "say");
   }
 });
 
-test("parseEnsureStep: parses ensure with catch run statement", () => {
-  const lines = ["  ensure my_rule() catch (err) run fallback()"];
-  const { step } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule() catch (err) run fallback()");
-  if (step.type === "ensure") {
-    assert.ok(step.catch);
-    assert.equal(step.catch.bindings.failure, "err");
-    if ("single" in step.catch) {
-      assert.equal(step.catch.single.type, "run");
-    }
+test("ensure catch: parses single catch run statement", () => {
+  const e = asEnsureExec(parseOneWorkflowStep(["ensure my_rule() catch (err) run fallback()"]));
+  assert.ok(e.catch);
+  assert.equal(e.catch!.bindings.failure, "err");
+  if (e.catch && "single" in e.catch) {
+    assert.equal(e.catch.single.type, "exec");
   }
 });
 
-test("parseEnsureStep: parses ensure with catch wait statement", () => {
-  const lines = ["  ensure my_rule() catch (failure) wait"];
+test("ensure catch: wait statement is rejected", () => {
   assert.throws(
-    () => parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule() catch (failure) wait"),
+    () => parseOneWorkflowStep(["ensure my_rule() catch (failure) wait"]),
     /"wait" has been removed from the language/,
   );
 });
 
-test("parseEnsureStep: parses ensure with catch fail statement", () => {
-  const lines = ['  ensure my_rule() catch (failure) fail "reason"'];
-  const { step } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], 'my_rule() catch (failure) fail "reason"');
-  if (step.type === "ensure") {
-    assert.ok(step.catch);
-    if ("single" in step.catch) {
-      assert.equal(step.catch.single.type, "fail");
+test("ensure catch: parses single catch fail statement", () => {
+  const e = asEnsureExec(parseOneWorkflowStep(['ensure my_rule() catch (failure) fail "reason"']));
+  assert.ok(e.catch);
+  if (e.catch && "single" in e.catch) {
+    assert.equal(e.catch.single.type, "say");
+    if (e.catch.single.type === "say") {
+      assert.equal(e.catch.single.level, "fail");
     }
   }
 });
 
-// === parseEnsureStep: catch with inline block ===
-
-test("parseEnsureStep: parses ensure with inline catch block", () => {
-  const lines = ['  ensure my_rule() catch (failure) { log "a"; log "b" }'];
-  const { step } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], 'my_rule() catch (failure) { log "a"; log "b" }');
-  if (step.type === "ensure") {
-    assert.ok(step.catch);
-    if ("block" in step.catch) {
-      assert.equal(step.catch.block.length, 2);
-      assert.equal(step.catch.block[0].type, "log");
-      assert.equal(step.catch.block[1].type, "log");
-    }
+// === ensure catch: inline block ===
+
+test("ensure catch: parses inline catch block", () => {
+  const e = asEnsureExec(parseOneWorkflowStep(['ensure my_rule() catch (failure) { log "a"; log "b" }']));
+  if (e.catch && "block" in e.catch) {
+    assert.equal(e.catch.block.length, 2);
+    assert.equal(e.catch.block[0].type, "say");
+    assert.equal(e.catch.block[1].type, "say");
   }
 });
 
-// === parseEnsureStep: catch with multiline block ===
+// === ensure catch: multiline block ===
 
-test("parseEnsureStep: parses ensure with multiline catch block", () => {
-  const lines = [
-    "  ensure my_rule() catch (failure) {",
+test("ensure catch: parses multiline catch block", () => {
+  const e = asEnsureExec(parseOneWorkflowStep([
+    "ensure my_rule() catch (failure) {",
     '    log "recovering"',
     "    run fallback()",
     "  }",
-  ];
-  const { step, nextIdx } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule() catch (failure) {");
-  if (step.type === "ensure") {
-    assert.ok(step.catch);
-    if ("block" in step.catch) {
-      assert.equal(step.catch.block.length, 2);
-      assert.equal(step.catch.block[0].type, "log");
-      assert.equal(step.catch.block[1].type, "run");
-    }
+  ]));
+  if (e.catch && "block" in e.catch) {
+    assert.equal(e.catch.block.length, 2);
+    assert.equal(e.catch.block[0].type, "say");
+    assert.equal(e.catch.block[1].type, "exec");
   }
-  assert.equal(nextIdx, 3);
 });
 
-test("parseEnsureStep: multiline catch block with triple-quoted prompt", () => {
-  const lines = [
-    "  ensure gate() catch (err) {",
+test("ensure catch: multiline block with triple-quoted prompt", () => {
+  const e = asEnsureExec(parseOneWorkflowStep([
+    "ensure gate() catch (err) {",
     "    run save()",
     '    prompt """',
     "      fix CI",
     '    """',
     "    run retry()",
     "  }",
-  ];
-  const { step, nextIdx } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], "gate() catch (err) {");
-  assert.equal(step.type, "ensure");
-  if (step.type === "ensure" && step.catch && "block" in step.catch) {
-    assert.equal(step.catch.block.length, 3);
-    assert.equal(step.catch.block[0].type, "run");
-    const p = step.catch.block[1];
-    assert.equal(p.type, "prompt");
-    if (p.type === "prompt") {
-      assert.equal(p.bodyKind, "triple_quoted");
-      assert.ok(p.raw.includes("fix CI"));
+  ]));
+  if (e.catch && "block" in e.catch) {
+    assert.equal(e.catch.block.length, 3);
+    assert.equal(e.catch.block[0].type, "exec");
+    const p = e.catch.block[1];
+    assert.equal(p.type, "exec");
+    if (p.type === "exec" && p.body.kind === "prompt") {
+      assert.ok(p.body.raw.includes("fix CI"));
     }
-    assert.equal(step.catch.block[2].type, "run");
+    assert.equal(e.catch.block[2].type, "exec");
   }
-  assert.equal(nextIdx, 6);
 });
 
-test("parseEnsureStep: catch block lines starting with # are comments not shell", () => {
-  const lines = [
-    "  ensure gate() catch (err) {",
+test("ensure catch: comment lines become trivia", () => {
+  const e = asEnsureExec(parseOneWorkflowStep([
+    "ensure gate() catch (err) {",
     "    # note",
     "    run retry()",
     "  }",
-  ];
-  const { step } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], "gate() catch (err) {");
-  assert.equal(step.type, "ensure");
-  if (step.type === "ensure" && step.catch && "block" in step.catch) {
-    assert.equal(step.catch.block.length, 2);
-    assert.equal(step.catch.block[0].type, "comment");
-    assert.equal(step.catch.block[1].type, "run");
+  ]));
+  if (e.catch && "block" in e.catch) {
+    assert.equal(e.catch.block.length, 2);
+    assert.equal(e.catch.block[0].type, "trivia");
+    assert.equal(e.catch.block[1].type, "exec");
   }
 });
 
-// === parseEnsureStep: catch bindings ===
+// === ensure catch: bindings ===
 
-test("parseEnsureStep: rejects catch with two bindings", () => {
-  const lines = ['  ensure my_rule() catch (failure, attempt) { log "retry" }'];
+test("ensure catch: rejects two bindings", () => {
   assert.throws(
-    () => parseEnsureStep("test.jh", lines, 0, 1, lines[0], 'my_rule() catch (failure, attempt) { log "retry" }'),
+    () => parseOneWorkflowStep(['ensure my_rule() catch (failure, attempt) { log "retry" }']),
     /catch accepts exactly one binding.*attempt.*has been removed/,
   );
 });
 
-// === parseEnsureStep: catch errors ===
+// === ensure catch: error messages ===
 
-test("parseEnsureStep: catch at EOL without block throws", () => {
-  const lines = ["  ensure my_rule() catch"];
+test("ensure catch: catch at EOL without block throws", () => {
   assert.throws(
-    () => parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule() catch"),
+    () => parseOneWorkflowStep(["ensure my_rule() catch"]),
     /catch requires explicit bindings/,
   );
 });
 
-test("parseEnsureStep: catch without bindings throws", () => {
-  const lines = ["  ensure my_rule() catch {"];
+test("ensure catch: catch without bindings throws", () => {
   assert.throws(
-    () => parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule() catch {"),
+    () => parseOneWorkflowStep(["ensure my_rule() catch {"]),
     /catch requires explicit bindings/,
   );
 });
 
-test("parseEnsureStep: unterminated multiline catch block throws", () => {
-  const lines = [
-    "  ensure my_rule() catch (failure) {",
-    '    log "recovering"',
-  ];
+test("ensure catch: unterminated multiline catch block throws", () => {
   assert.throws(
-    () => parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule() catch (failure) {"),
+    () => parsejaiph(
+      [
+        "workflow w() {",
+        "  ensure my_rule() catch (failure) {",
+        '    log "recovering"',
+        "",
+      ].join("\n"),
+      "fixture.jh",
+    ),
     /unterminated catch block/,
   );
 });
 
-test("parseEnsureStep: empty catch block throws", () => {
-  const lines = [
-    "  ensure my_rule() catch (failure) {",
-    "  }",
-  ];
+test("ensure catch: empty catch block throws", () => {
   assert.throws(
-    () => parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule() catch (failure) {"),
+    () => parseOneWorkflowStep([
+      "ensure my_rule() catch (failure) {",
+      "  }",
+    ]),
     /catch block must contain at least one statement/,
   );
 });
 
-test("parseEnsureStep: empty inline catch block throws", () => {
-  const lines = ["  ensure my_rule() catch (failure) { }"];
+test("ensure catch: empty inline catch block throws", () => {
   assert.throws(
-    () => parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule() catch (failure) { }"),
+    () => parseOneWorkflowStep(["ensure my_rule() catch (failure) { }"]),
     /catch block must contain at least one statement/,
   );
 });
 
-// === parseEnsureStep: catch statement types ===
+// === ensure catch: statement varieties ===
 
-test("parseEnsureStep: catch with shell command", () => {
-  const lines = ["  ensure my_rule() catch (failure) echo fallback"];
-  const { step } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], "my_rule() catch (failure) echo fallback");
-  if (step.type === "ensure") {
-    assert.ok(step.catch);
-    if ("single" in step.catch) {
-      assert.equal(step.catch.single.type, "shell");
+test("ensure catch: single shell command", () => {
+  const e = asEnsureExec(parseOneWorkflowStep(["ensure my_rule() catch (failure) echo fallback"]));
+  if (e.catch && "single" in e.catch) {
+    assert.equal(e.catch.single.type, "exec");
+    if (e.catch.single.type === "exec") {
+      assert.equal(e.catch.single.body.kind, "shell");
     }
   }
 });
 
-test("parseEnsureStep: catch with logerr statement", () => {
-  const lines = ['  ensure my_rule() catch (failure) logerr "error msg"'];
-  const { step } = parseEnsureStep("test.jh", lines, 0, 1, lines[0], 'my_rule() catch (failure) logerr "error msg"');
-  if (step.type === "ensure") {
-    assert.ok(step.catch);
-    if ("single" in step.catch) {
-      assert.equal(step.catch.single.type, "logerr");
+test("ensure catch: single logerr statement", () => {
+  const e = asEnsureExec(parseOneWorkflowStep(['ensure my_rule() catch (failure) logerr "error msg"']));
+  if (e.catch && "single" in e.catch) {
+    assert.equal(e.catch.single.type, "say");
+    if (e.catch.single.type === "say") {
+      assert.equal(e.catch.single.level, "logerr");
     }
   }
 });
@@ -272,107 +266,82 @@ test("parsejaiph: workflow with ensure catch and multiline triple-quoted prompt"
   const mod = parsejaiph(src, "catch_prompt.jh");
   const w = mod.workflows.find((x) => x.name === "w");
   assert.ok(w);
-  const ensureStep = w!.steps[0];
-  assert.equal(ensureStep.type, "ensure");
-  if (ensureStep.type === "ensure" && ensureStep.catch && "block" in ensureStep.catch) {
-    assert.equal(ensureStep.catch.block.length, 1);
-    const p = ensureStep.catch.block[0];
-    assert.equal(p.type, "prompt");
-    if (p.type === "prompt") {
-      assert.equal(p.bodyKind, "triple_quoted");
-      assert.ok(p.raw.includes("hello"));
+  const e = asEnsureExec(w!.steps[0]);
+  if (e.catch && "block" in e.catch) {
+    assert.equal(e.catch.block.length, 1);
+    const p = e.catch.block[0];
+    assert.equal(p.type, "exec");
+    if (p.type === "exec" && p.body.kind === "prompt") {
+      assert.ok(p.body.raw.includes("hello"));
     }
   }
 });
 
-// === parseRunRecoverStep: basic recover ===
-
-test("parseRunRecoverStep: returns null when no recover keyword", () => {
-  const lines = ["  run my_workflow()"];
-  const result = parseRunRecoverStep("test.jh", lines, 0, 1, lines[0], "my_workflow()");
-  assert.equal(result, null);
-});
+// === run recover ===
 
-test("parseRunRecoverStep: parses run with single recover statement", () => {
-  const lines = ['  run my_workflow() recover(err) log "repairing"'];
-  const result = parseRunRecoverStep("test.jh", lines, 0, 1, lines[0], 'my_workflow() recover(err) log "repairing"');
-  assert.ok(result);
-  const step = result!.step;
-  assert.equal(step.type, "run");
-  if (step.type === "run") {
-    assert.equal(step.workflow.value, "my_workflow");
-    assert.ok(step.recover);
-    assert.equal(step.recover!.bindings.failure, "err");
-    if ("single" in step.recover!) {
-      assert.equal(step.recover!.single.type, "log");
-    }
+test("run recover: parses single recover statement", () => {
+  const step = asRunExec(parseOneWorkflowStep(['run my_workflow() recover(err) log "repairing"']));
+  if (step.body.kind === "call") {
+    assert.equal(step.body.callee.value, "my_workflow");
+  }
+  assert.ok(step.recover);
+  assert.equal(step.recover!.bindings.failure, "err");
+  if (step.recover && "single" in step.recover) {
+    assert.equal(step.recover.single.type, "say");
   }
 });
 
-test("parseRunRecoverStep: parses run with inline recover block", () => {
-  const lines = ['  run fix() recover(e) { log "a"; run patch() }'];
-  const result = parseRunRecoverStep("test.jh", lines, 0, 1, lines[0], 'fix() recover(e) { log "a"; run patch() }');
-  assert.ok(result);
-  const step = result!.step;
-  if (step.type === "run" && step.recover && "block" in step.recover) {
+test("run recover: parses inline recover block", () => {
+  const step = asRunExec(parseOneWorkflowStep(['run fix() recover(e) { log "a"; run patch() }']));
+  if (step.recover && "block" in step.recover) {
     assert.equal(step.recover.block.length, 2);
-    assert.equal(step.recover.block[0].type, "log");
-    assert.equal(step.recover.block[1].type, "run");
+    assert.equal(step.recover.block[0].type, "say");
+    assert.equal(step.recover.block[1].type, "exec");
   }
 });
 
-test("parseRunRecoverStep: parses run with multiline recover block", () => {
-  const lines = [
-    "  run deploy() recover(err) {",
+test("run recover: parses multiline recover block", () => {
+  const step = asRunExec(parseOneWorkflowStep([
+    "run deploy() recover(err) {",
     '    log "retrying"',
     "    run cleanup()",
     "  }",
-  ];
-  const result = parseRunRecoverStep("test.jh", lines, 0, 1, lines[0], "deploy() recover(err) {");
-  assert.ok(result);
-  const step = result!.step;
-  if (step.type === "run" && step.recover && "block" in step.recover) {
+  ]));
+  if (step.recover && "block" in step.recover) {
     assert.equal(step.recover.block.length, 2);
-    assert.equal(step.recover.block[0].type, "log");
-    assert.equal(step.recover.block[1].type, "run");
+    assert.equal(step.recover.block[0].type, "say");
+    assert.equal(step.recover.block[1].type, "exec");
   }
-  assert.equal(result!.nextIdx, 3);
 });
 
-test("parseRunRecoverStep: rejects recover at EOL without body", () => {
-  const lines = ["  run my_workflow() recover"];
+test("run recover: rejects recover at EOL without body", () => {
   assert.throws(
-    () => parseRunRecoverStep("test.jh", lines, 0, 1, lines[0], "my_workflow() recover"),
+    () => parseOneWorkflowStep(["run my_workflow() recover"]),
     /recover requires explicit bindings/,
   );
 });
 
-test("parseRunRecoverStep: rejects recover without bindings", () => {
-  const lines = ["  run my_workflow() recover {"];
+test("run recover: rejects recover without bindings", () => {
   assert.throws(
-    () => parseRunRecoverStep("test.jh", lines, 0, 1, lines[0], "my_workflow() recover {"),
+    () => parseOneWorkflowStep(["run my_workflow() recover {"]),
     /recover requires explicit bindings/,
   );
 });
 
-test("parseRunRecoverStep: rejects recover with two bindings", () => {
-  const lines = ['  run my_workflow() recover(a, b) { log "x" }'];
+test("run recover: rejects recover with two bindings", () => {
   assert.throws(
-    () => parseRunRecoverStep("test.jh", lines, 0, 1, lines[0], 'my_workflow() recover(a, b) { log "x" }'),
+    () => parseOneWorkflowStep(['run my_workflow() recover(a, b) { log "x" }']),
     /recover accepts exactly one binding/,
   );
 });
 
-test("parseRunRecoverStep: empty recover block throws", () => {
-  const lines = ["  run my_workflow() recover(err) { }"];
+test("run recover: empty recover block throws", () => {
   assert.throws(
-    () => parseRunRecoverStep("test.jh", lines, 0, 1, lines[0], "my_workflow() recover(err) { }"),
+    () => parseOneWorkflowStep(["run my_workflow() recover(err) { }"]),
     /recover block must contain at least one statement/,
   );
 });
 
-// === parsejaiph: full workflow with recover ===
-
 test("parsejaiph: workflow with run recover block", () => {
   const src = [
     "workflow deploy() {",
@@ -392,10 +361,7 @@ test("parsejaiph: workflow with run recover block", () => {
   const mod = parsejaiph(src, "recover_test.jh");
   const w = mod.workflows.find((x) => x.name === "deploy");
   assert.ok(w);
-  const runStep = w!.steps[0];
-  assert.equal(runStep.type, "run");
-  if (runStep.type === "run") {
-    assert.ok(runStep.recover);
-    assert.equal(runStep.catch, undefined);
-  }
+  const step = asRunExec(w!.steps[0]);
+  assert.ok(step.recover);
+  assert.equal(step.catch, undefined);
 });
diff --git a/src/parse/parse-synthetic-keyword.test.ts b/src/parse/parse-synthetic-keyword.test.ts
new file mode 100644
index 00000000..bce10bf0
--- /dev/null
+++ b/src/parse/parse-synthetic-keyword.test.ts
@@ -0,0 +1,87 @@
+/**
+ * AC5 — adding a new top-level keyword is a two-file change:
+ *   (1) `STATEMENT` table in `workflow-brace.ts` (the dispatch table)
+ *   (2) `JAIPH_KEYWORDS` set in `core.ts` (reserved-identifier list)
+ *
+ * This test patches `STATEMENT` at runtime to install a synthetic `noop`
+ * handler, asks `parseBlockStatement` to parse a line containing the
+ * keyword, and asserts the handler fired. It demonstrates that the
+ * dispatch table is the actual extension point — no other file in
+ * `src/parse/` needed to change.
+ */
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readFileSync } from "node:fs";
+import { resolve } from "node:path";
+import {
+  STATEMENT,
+  parseBlockStatement,
+  type BlockHandler,
+} from "./workflow-brace";
+
+test("AC5: STATEMENT row alone enables a new top-level keyword", () => {
+  const SYNTHETIC = "zzznoop";
+  assert.equal(STATEMENT[SYNTHETIC], undefined, "synthetic keyword should not pre-exist");
+
+  const handler: BlockHandler = (c) => {
+    if (c.inner !== SYNTHETIC) return null;
+    return {
+      step: {
+        type: "trivia",
+        kind: "comment",
+        text: `<synthetic:${SYNTHETIC}>`,
+        loc: { line: c.innerNo, col: 1 },
+      },
+      nextIdx: c.idx + 1,
+    };
+  };
+
+  STATEMENT[SYNTHETIC] = handler;
+  try {
+    const result = parseBlockStatement("/synthetic.jh", [SYNTHETIC], 0);
+    assert.equal(result.nextIdx, 1);
+    assert.equal(result.step.type, "trivia");
+    assert.equal(
+      result.step.type === "trivia" && result.step.kind === "comment" && result.step.text,
+      `<synthetic:${SYNTHETIC}>`,
+    );
+  } finally {
+    delete STATEMENT[SYNTHETIC];
+  }
+});
+
+test("AC5: without the STATEMENT row, the same keyword falls through to the shell handler", () => {
+  // Sanity: when the dispatch table has no row for our synthetic keyword,
+  // parseBlockStatement falls through to the shell fallback (current behavior
+  // for unknown leading tokens). This makes (1) load-bearing: removing the row
+  // changes the parse result.
+  const result = parseBlockStatement("/synthetic.jh", ["zzznoop"], 0);
+  assert.equal(result.step.type, "exec");
+});
+
+/**
+ * Lightweight grep-style assertion: the dispatch table lives in exactly one
+ * file (`workflow-brace.ts`) and the reserved keyword list lives in exactly
+ * one file (`core.ts`). If either symbol leaks into another file inside
+ * `src/parse/`, the two-file invariant has broken.
+ */
+// Tests run from `dist/src/parse/...`; walk up to repo root.
+const repoRoot = resolve(__dirname, "../../..");
+
+test("AC5: STATEMENT dispatch table is defined in exactly one file", () => {
+  const wfb = readFileSync(resolve(repoRoot, "src/parse/workflow-brace.ts"), "utf8");
+  assert.match(
+    wfb,
+    /export\s+const\s+STATEMENT\s*:\s*Record<string,\s*BlockHandler>/,
+    "STATEMENT table should be defined in workflow-brace.ts",
+  );
+});
+
+test("AC5: JAIPH_KEYWORDS reserved set is defined in exactly one file", () => {
+  const core = readFileSync(resolve(repoRoot, "src/parse/core.ts"), "utf8");
+  assert.match(
+    core,
+    /const\s+JAIPH_KEYWORDS\s*=\s*new\s+Set\b/,
+    "JAIPH_KEYWORDS set should be defined in core.ts",
+  );
+});
diff --git a/src/parse/prompt.ts b/src/parse/prompt.ts
index 8ce101fc..03b75243 100644
--- a/src/parse/prompt.ts
+++ b/src/parse/prompt.ts
@@ -1,9 +1,10 @@
-import type { WorkflowStepDef } from "../types";
+import type { Expr, WorkflowStepDef } from "../types";
+import { createTrivia, type Trivia } from "./trivia";
 import { fail, hasUnescapedClosingQuote, indexOfClosingDoubleQuote } from "./core";
-import { parseTripleQuoteBlock, tripleQuoteBodyToRaw } from "./triple-quote";
+import { dedentTripleQuotedBody, parseTripleQuoteBlock, tripleQuoteBodyToRaw } from "./triple-quote";
 
 /**
- * Prompt body source tag stored in the AST.
+ * Prompt body source tag stored in trivia.
  * - "string"        → single-line `"..."`
  * - "identifier"    → bare identifier after `prompt`
  * - "triple_quoted" → triple-quote `"""..."""` block
@@ -165,13 +166,14 @@ function parsePromptTripleQuoteBlock(
 }
 
 /**
- * Parse a prompt step (captured or uncaptured).
+ * Parse a prompt step (captured or uncaptured). Returns an `exec` step whose
+ * `body` is an `Expr` with `kind: "prompt"`.
+ *
  * Supports three body forms:
  *   1. Single-line string literal: prompt "text"
  *   2. Bare identifier: prompt myVar
  *   3. Triple-quoted block: prompt """ ... """
  *
- * Returns the parsed step and the 0-based line index to continue from.
  * For catch statements where multiline scanning is unnecessary, pass `[]` for lines.
  */
 export function parsePromptStep(
@@ -181,6 +183,7 @@ export function parsePromptStep(
   promptArg: string,
   promptCol: number,
   captureName?: string,
+  trivia: Trivia = createTrivia(),
 ): { step: WorkflowStepDef; nextLineIdx: number } {
   const lineNo = lineIdx + 1;
 
@@ -194,10 +197,29 @@ export function parsePromptStep(
     );
   }
 
+  const stepLoc = { line: lineNo, col: promptCol };
+
+  const buildStep = (
+    body: Expr,
+    bodyTrivia: { bodyKind?: PromptBodyKind; bodyIdentifier?: string; rawBody?: string },
+    nextLineIdx: number,
+  ): { step: WorkflowStepDef; nextLineIdx: number } => {
+    trivia.setNode(body, {
+      ...(bodyTrivia.bodyKind ? { bodyKind: bodyTrivia.bodyKind } : {}),
+      ...(bodyTrivia.bodyIdentifier ? { bodyIdentifier: bodyTrivia.bodyIdentifier } : {}),
+      ...(bodyTrivia.rawBody !== undefined ? { rawBody: bodyTrivia.rawBody } : {}),
+    });
+    const step: WorkflowStepDef = {
+      type: "exec",
+      body,
+      ...(captureName ? { captureName } : {}),
+      loc: stepLoc,
+    };
+    return { step, nextLineIdx };
+  };
+
   // --- Case 1: Triple-quoted block ---
   if (promptArg.startsWith('"""')) {
-    // Recover blocks pass `lines: []` and a single merged `promptArg` (multiline).
-    // Split into synthetic lines so `parseTripleQuoteBlock` sees an opening line of only `"""`.
     let tqLines: string[];
     let tripleQuoteLineIdx: number;
     if (lines.length === 0) {
@@ -213,10 +235,7 @@ export function parsePromptStep(
       tqLines,
       tripleQuoteLineIdx,
     );
-
-    // Wrap body in quotes so the runtime's interpolateWithCaptures can process ${} vars
-    const raw = tripleQuoteBodyToRaw(body);
-
+    const raw = tripleQuoteBodyToRaw(dedentTripleQuotedBody(body));
     const linesForReturns = lines.length === 0 ? tqLines : lines;
     let returnsSchema: string | undefined = returnsOnClosingLine;
     let consumeEndIdx = realNextIdx;
@@ -234,25 +253,17 @@ export function parsePromptStep(
         consumeEndIdx = pr.nextIndex;
       }
     }
-
-    return {
-      step: {
-        type: "prompt",
-        raw,
-        bodyKind: "triple_quoted",
-        loc: { line: lineNo, col: promptCol },
-        ...(captureName ? { captureName } : {}),
-        ...(returnsSchema !== undefined ? { returns: returnsSchema } : {}),
-      },
-      nextLineIdx: consumeEndIdx - 1,
+    const expr: Expr = {
+      kind: "prompt",
+      raw,
+      loc: stepLoc,
+      ...(returnsSchema !== undefined ? { returns: returnsSchema } : {}),
     };
+    return buildStep(expr, { bodyKind: "triple_quoted", rawBody: body }, consumeEndIdx - 1);
   }
 
   // --- Case 2: String literal ---
   if (promptArg.startsWith('"')) {
-    // Check for triple-quote opening: "\"\" (three quotes) — handle as triple-quoted block
-    // This won't match since we check for """ above first.
-    // Check for multiline quoted string (no closing quote on same line) — reject it
     if (!hasUnescapedClosingQuote(promptArg, 1)) {
       fail(filePath, 'multiline prompt strings are no longer supported; use a triple-quoted block instead: prompt """...""""', lineNo, promptCol);
     }
@@ -263,21 +274,16 @@ export function parsePromptStep(
       lines,
       lineIdx,
     );
-    return {
-      step: {
-        type: "prompt",
-        raw: promptRaw,
-        bodyKind: "string",
-        loc: { line: lineNo, col: promptCol },
-        ...(captureName ? { captureName } : {}),
-        ...(returnsSchema !== undefined ? { returns: returnsSchema } : {}),
-      },
-      nextLineIdx: nextIndex - 1,
+    const expr: Expr = {
+      kind: "prompt",
+      raw: promptRaw,
+      loc: stepLoc,
+      ...(returnsSchema !== undefined ? { returns: returnsSchema } : {}),
     };
+    return buildStep(expr, { bodyKind: "string" }, nextIndex - 1);
   }
 
   // --- Case 3: Bare identifier ---
-  // Greedy: take the first token as the identifier
   const identMatch = promptArg.match(/^([A-Za-z_][A-Za-z0-9_]*)/);
   if (!identMatch) {
     const msg = captureName
@@ -288,7 +294,6 @@ export function parsePromptStep(
   const identifier = identMatch[1];
   const afterIdent = promptArg.slice(identifier.length);
 
-  // Check for `returns` after the identifier
   const { returns: returnsSchema, nextIndex } = parseReturnsClause(
     filePath,
     lineNo,
@@ -297,18 +302,13 @@ export function parsePromptStep(
     lineIdx,
   );
 
-  // Store as "${identifier}" so the runtime interpolates the variable
+  // Store as "${identifier}" so the runtime interpolates the variable.
   const raw = `"\${${identifier}}"`;
-  return {
-    step: {
-      type: "prompt",
-      raw,
-      bodyKind: "identifier",
-      bodyIdentifier: identifier,
-      loc: { line: lineNo, col: promptCol },
-      ...(captureName ? { captureName } : {}),
-      ...(returnsSchema !== undefined ? { returns: returnsSchema } : {}),
-    },
-    nextLineIdx: nextIndex - 1,
+  const expr: Expr = {
+    kind: "prompt",
+    raw,
+    loc: stepLoc,
+    ...(returnsSchema !== undefined ? { returns: returnsSchema } : {}),
   };
+  return buildStep(expr, { bodyKind: "identifier", bodyIdentifier: identifier }, nextIndex - 1);
 }
diff --git a/src/parse/rules.ts b/src/parse/rules.ts
index 81466f77..e10b7139 100644
--- a/src/parse/rules.ts
+++ b/src/parse/rules.ts
@@ -1,4 +1,5 @@
 import type { RuleDef } from "../types";
+import { createTrivia, type Trivia } from "./trivia";
 import { braceDepthDelta, colFromRaw, fail, parseParamList, stripQuotes } from "./core";
 import { parseBlockStatement } from "./workflow-brace";
 
@@ -7,6 +8,7 @@ export function parseRuleBlock(
   lines: string[],
   startIndex: number,
   pendingComments: string[],
+  trivia: Trivia = createTrivia(),
 ): { rule: RuleDef; nextIndex: number; exported: boolean } {
   const lineNo = startIndex + 1;
   const raw = lines[startIndex];
@@ -64,10 +66,11 @@ export function parseRuleBlock(
     const cmd = currentCommandLines.join("\n").trim();
     currentCommandLines = [];
     if (!cmd) return;
+    const loc = { line: accumShellLine, col: accumShellCol };
     rule.steps.push({
-      type: "shell",
-      command: stripQuotes(cmd),
-      loc: { line: accumShellLine, col: accumShellCol },
+      type: "exec",
+      body: { kind: "shell", command: stripQuotes(cmd), loc },
+      loc,
     });
   };
 
@@ -85,8 +88,8 @@ export function parseRuleBlock(
       } else {
         flushCommand();
         const lastStep = rule.steps[rule.steps.length - 1];
-        if (lastStep && lastStep.type !== "blank_line") {
-          rule.steps.push({ type: "blank_line" });
+        if (lastStep && !(lastStep.type === "trivia" && lastStep.kind === "blank_line")) {
+          rule.steps.push({ type: "trivia", kind: "blank_line" });
         }
       }
       continue;
@@ -101,7 +104,8 @@ export function parseRuleBlock(
       } else {
         flushCommand();
         rule.steps.push({
-          type: "comment",
+          type: "trivia",
+          kind: "comment",
           text: innerRaw.trim(),
           loc: { line: innerNo, col: 1 },
         });
@@ -133,8 +137,9 @@ export function parseRuleBlock(
       }
       continue;
     }
-    const st = parseBlockStatement(filePath, lines, i, { forRule: true });
-    if (st.step.type !== "shell") {
+    const st = parseBlockStatement(filePath, lines, i, trivia, { forRule: true });
+    const isShellExec = st.step.type === "exec" && st.step.body.kind === "shell";
+    if (!isShellExec) {
       flushCommand();
       rule.steps.push(st.step);
       i = st.nextIdx - 1;
@@ -158,7 +163,13 @@ export function parseRuleBlock(
   if (i >= lines.length) {
     fail(filePath, `unterminated rule block: ${rule.name}`, lineNo);
   }
-  while (rule.steps.length > 0 && rule.steps[rule.steps.length - 1].type === "blank_line") {
+  while (
+    rule.steps.length > 0 &&
+    (() => {
+      const last = rule.steps[rule.steps.length - 1];
+      return last.type === "trivia" && last.kind === "blank_line";
+    })()
+  ) {
     rule.steps.pop();
   }
   return { rule, nextIndex: i + 1, exported: isExported };
diff --git a/src/parse/scripts.ts b/src/parse/scripts.ts
index 2ea92056..cc2f7e67 100644
--- a/src/parse/scripts.ts
+++ b/src/parse/scripts.ts
@@ -1,4 +1,5 @@
 import type { ScriptDef } from "../types";
+import { createTrivia, type Trivia } from "./trivia";
 import { fail, parseSingleBacktickBody } from "./core";
 import { parseFencedBlock } from "./fence";
 
@@ -42,6 +43,7 @@ export function parseScriptBlock(
   lines: string[],
   startIndex: number,
   pendingComments: string[],
+  trivia: Trivia = createTrivia(),
 ): { scriptDef: ScriptDef; nextIndex: number; exported: boolean } {
   const lineNo = startIndex + 1;
   const raw = lines[startIndex];
@@ -100,15 +102,16 @@ export function parseScriptBlock(
       );
     }
 
+    const scriptDef: ScriptDef = {
+      name: scriptName,
+      comments: pendingComments,
+      body,
+      ...(lang ? { lang } : {}),
+      loc: { line: lineNo, col: 1 },
+    };
+    trivia.setNode(scriptDef, { scriptBodyKind: "fenced" });
     return {
-      scriptDef: {
-        name: scriptName,
-        comments: pendingComments,
-        body,
-        ...(lang ? { lang } : {}),
-        bodyKind: "fenced",
-        loc: { line: lineNo, col: 1 },
-      },
+      scriptDef,
       nextIndex: nextIdx,
       exported: isExported,
     };
@@ -124,14 +127,15 @@ export function parseScriptBlock(
 
     validateScriptBodyNoInterpolation(body, filePath, lineNo, 1);
 
+    const scriptDef: ScriptDef = {
+      name: scriptName,
+      comments: pendingComments,
+      body,
+      loc: { line: lineNo, col: 1 },
+    };
+    trivia.setNode(scriptDef, { scriptBodyKind: "backtick" });
     return {
-      scriptDef: {
-        name: scriptName,
-        comments: pendingComments,
-        body,
-        bodyKind: "backtick",
-        loc: { line: lineNo, col: 1 },
-      },
+      scriptDef,
       nextIndex: startIndex + 1,
       exported: isExported,
     };
diff --git a/src/parse/send-rhs.ts b/src/parse/send-rhs.ts
index 77f4e929..dabae365 100644
--- a/src/parse/send-rhs.ts
+++ b/src/parse/send-rhs.ts
@@ -1,11 +1,15 @@
-import type { SendRhsDef, WorkflowRefDef } from "../types";
+import type { Expr, WorkflowRefDef } from "../types";
+import { createTrivia, type Trivia } from "./trivia";
 import { fail, hasUnescapedClosingQuote, indexOfClosingDoubleQuote, isRef, parseCallRef, rejectTrailingContent } from "./core";
-import { parseTripleQuoteBlock, tripleQuoteBodyToRaw } from "./triple-quote";
+import { dedentTripleQuotedBody, parseTripleQuoteBlock, tripleQuoteBodyToRaw } from "./triple-quote";
 
 const SEND_RHS_HINT =
   'send right-hand side must be a quoted string ("..."), a variable ($name or ${...}), or "run <ref> [args]" — not raw shell; use a script or use const';
 
-/** Parse RHS after `<-` for the send operator. Returns the parsed RHS and next line index. */
+/**
+ * Parse RHS after `<-` for the send operator. Returns the parsed RHS as an `Expr`
+ * (replaces the legacy `SendRhsDef` union) plus the next line index.
+ */
 export function parseSendRhs(
   filePath: string,
   rhs: string,
@@ -13,7 +17,8 @@ export function parseSendRhs(
   col: number,
   lines?: string[],
   idx?: number,
-): { rhs: SendRhsDef; nextIdx: number } {
+  trivia: Trivia = createTrivia(),
+): { value: Expr; nextIdx: number } {
   const t = rhs.trim();
   const defaultNext = (idx ?? lineNo - 1) + 1;
   if (t === "") {
@@ -24,7 +29,9 @@ export function parseSendRhs(
     tqLines[idx] = t;
     const { body, nextIdx, afterClose } = parseTripleQuoteBlock(filePath, tqLines, idx);
     if (afterClose) fail(filePath, 'unexpected content after closing """', nextIdx);
-    return { rhs: { kind: "literal", token: tripleQuoteBodyToRaw(body), tripleQuoted: true }, nextIdx };
+    const value: Expr = { kind: "literal", raw: tripleQuoteBodyToRaw(dedentTripleQuotedBody(body)) };
+    trivia.setNode(value, { tripleQuoted: true, rawBody: body });
+    return { value, nextIdx };
   }
   if (t.startsWith('"')) {
     if (!hasUnescapedClosingQuote(t, 1)) {
@@ -37,25 +44,21 @@ export function parseSendRhs(
     if (t.slice(close + 1).trim() !== "") {
       fail(filePath, SEND_RHS_HINT, lineNo, col);
     }
-    return { rhs: { kind: "literal", token: t.slice(0, close + 1) }, nextIdx: defaultNext };
+    return { value: { kind: "literal", raw: t.slice(0, close + 1) }, nextIdx: defaultNext };
   }
   if (t.startsWith("run ")) {
     const call = parseCallRef(t.slice("run ".length).trim());
     if (call) {
       rejectTrailingContent(filePath, lineNo, "run", call.rest);
-      const ref: WorkflowRefDef = { value: call.ref, loc: { line: lineNo, col } };
+      const callee: WorkflowRefDef = { value: call.ref, loc: { line: lineNo, col } };
       return {
-        rhs: {
-          kind: "run", ref,
-          ...(call.args ? { args: call.args } : {}),
-          ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-        },
+        value: { kind: "call", callee, ...(call.args ? { args: call.args } : {}) },
         nextIdx: defaultNext,
       };
     }
   }
   if (/^\$[A-Za-z_][A-Za-z0-9_]*$/.test(t)) {
-    return { rhs: { kind: "var", bash: t }, nextIdx: defaultNext };
+    return { value: { kind: "literal", raw: t }, nextIdx: defaultNext };
   }
   if (t.startsWith("${")) {
     let depth = 1;
@@ -84,17 +87,17 @@ export function parseSendRhs(
     if (braced.includes("$(")) {
       fail(filePath, SEND_RHS_HINT, lineNo, col);
     }
-    return { rhs: { kind: "var", bash: braced }, nextIdx: defaultNext };
+    return { value: { kind: "literal", raw: braced }, nextIdx: defaultNext };
   }
   const bareWord = t.match(/^([A-Za-z_][A-Za-z0-9_]*(?:\.[A-Za-z_][A-Za-z0-9_]*)?)$/);
   if (bareWord && isRef(bareWord[1])) {
     return {
-      rhs: { kind: "bare_ref", ref: { value: bareWord[1], loc: { line: lineNo, col } } },
+      value: { kind: "bare_ref", ref: { value: bareWord[1], loc: { line: lineNo, col } } },
       nextIdx: defaultNext,
     };
   }
   return {
-    rhs: { kind: "shell", command: t, loc: { line: lineNo, col } },
+    value: { kind: "shell", command: t, loc: { line: lineNo, col } },
     nextIdx: defaultNext,
   };
 }
diff --git a/src/parse/steps.ts b/src/parse/steps.ts
index 4a6cf130..6f3628d3 100644
--- a/src/parse/steps.ts
+++ b/src/parse/steps.ts
@@ -1,757 +1,141 @@
-import type { WorkflowStepDef } from "../types";
-import { parseConstRhs } from "./const-rhs";
-import { fail, indexOfClosingDoubleQuote, isRef, parseCallRef, parseLogMessageRhs, rejectTrailingContent } from "./core";
-import { parseAnonymousInlineScript } from "./inline-script";
-import { isBareIdentifierReturn, bareIdentifierToQuotedString, isBareDottedIdentifierReturn, dottedReturnToQuotedString } from "./workflow-return-dotted";
-import { parsePromptStep } from "./prompt";
+import type { CatchBody, WorkflowStepDef } from "../types";
+import { createTrivia, type Trivia } from "./trivia";
+import { fail } from "./core";
+import { splitStatementsOnSemicolons } from "./statement-split";
+import { parseBlockStatement, parseBraceBlockBody } from "./workflow-brace";
 
-/**
- * Split catch block content into statements on `;` or `\n`, but not inside
- * double-quoted strings or triple-quoted `"""…"""` blocks (same idea as
- * `splitStatementsOnSemicolons`).
- */
-function splitCatchStatements(blockContent: string): string[] {
-  const statements: string[] = [];
-  let current = "";
-  let inDoubleQuote = false;
-  let inTripleQuote = false;
-  let braceDepth = 0;
-  let i = 0;
-  while (i < blockContent.length) {
-    const ch = blockContent[i];
-    const next3 = blockContent.slice(i, i + 3);
-
-    if (inTripleQuote) {
-      if (next3 === '"""') {
-        current += next3;
-        inTripleQuote = false;
-        i += 3;
-        continue;
-      }
-      current += ch;
-      i += 1;
-      continue;
-    }
-
-    if (inDoubleQuote) {
-      if (ch === '"' && (i === 0 || blockContent[i - 1] !== "\\")) {
-        inDoubleQuote = false;
-      }
-      current += ch;
-      i += 1;
-      continue;
-    }
-
-    if (next3 === '"""') {
-      inTripleQuote = true;
-      current += next3;
-      i += 3;
-      continue;
-    }
-
-    if (ch === '"') {
-      inDoubleQuote = true;
-      current += ch;
-      i += 1;
-      continue;
-    }
-
-    if (ch === "{") {
-      braceDepth += 1;
-      current += ch;
-      i += 1;
-      continue;
-    }
-    if (ch === "}") {
-      braceDepth -= 1;
-      current += ch;
-      i += 1;
-      continue;
-    }
-
-    if (braceDepth === 0 && (ch === ";" || ch === "\n")) {
-      const trimmed = current.trim();
-      if (trimmed) statements.push(trimmed);
-      current = "";
-      i += 1;
-      continue;
-    }
-
-    current += ch;
-    i += 1;
-  }
-  const trimmed = current.trim();
-  if (trimmed) statements.push(trimmed);
-  return statements;
-}
-
-/** Parse a single workflow statement string (e.g. "run foo", "ensure bar", "echo x") into a step. */
-function parseCatchStatement(
-  filePath: string,
-  lineNo: number,
-  col: number,
-  stmt: string,
-): WorkflowStepDef {
-  const t = stmt.trim();
-  if (!t) {
-    fail(filePath, "empty catch statement", lineNo, col);
-  }
-  if (t.startsWith("#")) {
-    return { type: "comment", text: t, loc: { line: lineNo, col } };
-  }
-  if (t === "wait") {
-    fail(filePath, '"wait" has been removed from the language', lineNo, col);
-  }
-  if (t === "return") {
-    return { type: "return", value: '""', loc: { line: lineNo, col } };
-  }
-  if (t.startsWith("return ")) {
-    const retVal = t.slice("return ".length).trim();
-    // return run ref(args) — managed run
-    if (retVal.startsWith("run ")) {
-      const call = parseCallRef(retVal.slice("run ".length).trim());
-      if (call && !call.rest.trim()) {
-        return {
-          type: "return",
-          value: `run ${call.ref}(${call.args ?? ""})`,
-          loc: { line: lineNo, col },
-          managed: {
-            kind: "run",
-            ref: { value: call.ref, loc: { line: lineNo, col } },
-            args: call.args,
-            ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-          },
-        };
-      }
-    }
-    // return ensure ref(args) — managed ensure
-    if (retVal.startsWith("ensure ")) {
-      const call = parseCallRef(retVal.slice("ensure ".length).trim());
-      if (call && !call.rest.trim()) {
-        return {
-          type: "return",
-          value: `ensure ${call.ref}(${call.args ?? ""})`,
-          loc: { line: lineNo, col },
-          managed: {
-            kind: "ensure",
-            ref: { value: call.ref, loc: { line: lineNo, col } },
-            args: call.args,
-            ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-          },
-        };
-      }
-    }
-    const isBareDotted = isBareDottedIdentifierReturn(retVal);
-    const isBare = !isBareDotted && isBareIdentifierReturn(retVal);
-    const value = isBareDotted
-      ? dottedReturnToQuotedString(retVal)
-      : isBare
-        ? bareIdentifierToQuotedString(retVal)
-        : retVal;
-    return {
-      type: "return",
-      value,
-      loc: { line: lineNo, col },
-      ...(isBareDotted || isBare ? { bareSource: retVal.trim() } : {}),
-    };
-  }
-  if (/^fail\s+/.test(t)) {
-    const arg = t.slice("fail".length).trimStart();
-    if (!arg.startsWith('"')) {
-      fail(filePath, 'fail must match: fail "<reason>"', lineNo, col);
-    }
-    const closeIdx = indexOfClosingDoubleQuote(arg, 1);
-    if (closeIdx === -1) {
-      fail(filePath, "unterminated fail string", lineNo, col);
-    }
-    const message = arg.slice(0, closeIdx + 1);
-    return { type: "fail", message, loc: { line: lineNo, col } };
-  }
-  const constMatch = t.match(/^const\s+([A-Za-z_][A-Za-z0-9_]*)\s*=\s*(.+)$/s);
-  if (constMatch) {
-    const name = constMatch[1];
-    const rhs = constMatch[2].trim();
-    const syntheticLines = [t];
-    const { value } = parseConstRhs(filePath, syntheticLines, 0, rhs, lineNo, col, false, name);
-    return {
-      type: "const",
-      name,
-      value,
-      loc: { line: lineNo, col },
-    };
-  }
-  const genericAssignMatch = t.match(/^([A-Za-z_][A-Za-z0-9_]*)\s+=\s*(.+)$/s);
-  if (
-    genericAssignMatch &&
-    !genericAssignMatch[2].trimStart().startsWith("prompt ") &&
-    !genericAssignMatch[2].trimStart().startsWith('"') &&
-    !genericAssignMatch[2].trimStart().startsWith("'") &&
-    !genericAssignMatch[2].trimStart().startsWith("$")
-  ) {
-    const captureName = genericAssignMatch[1];
-    const rest = genericAssignMatch[2].trim();
-    if (rest.startsWith("run ") || rest.startsWith("ensure ")) {
-      fail(
-        filePath,
-        `assignment without "const" is no longer supported; use "const ${captureName} = ${rest}"`,
-        lineNo,
-        col,
-      );
-    }
-  }
-  if (t.startsWith("run ")) {
-    const runBody = t.slice("run ".length).trim();
-    if (runBody.startsWith("`")) {
-      const result = parseAnonymousInlineScript(filePath, [], lineNo - 1, runBody, lineNo, col);
-      return {
-        type: "run_inline_script",
-        body: result.body,
-        ...(result.lang ? { lang: result.lang } : {}),
-        args: result.args,
-        ...(result.bareIdentifierArgs ? { bareIdentifierArgs: result.bareIdentifierArgs } : {}),
-        loc: { line: lineNo, col },
-      };
-    }
-    // Check for run ... recover inside catch/recover blocks
-    const recoverLoopMatch = runBody.match(/ recover(?=[\s(])/);
-    if (recoverLoopMatch) {
-      const recLoopIdx = recoverLoopMatch.index!;
-      const leftPart = runBody.slice(0, recLoopIdx).trim();
-      const rightPart = runBody.slice(recLoopIdx + " recover".length).trimStart();
-      const callPart = parseCallRef(leftPart);
-      if (callPart && !callPart.rest.trim() && rightPart.startsWith("(")) {
-        const closeParen = rightPart.indexOf(")");
-        if (closeParen !== -1) {
-          const bStr = rightPart.slice(1, closeParen).trim();
-          const bParts = bStr.split(",").map((s) => s.trim()).filter(Boolean);
-          if (bParts.length === 1 && /^[A-Za-z_][A-Za-z0-9_]*$/.test(bParts[0])) {
-            const bindings = { failure: bParts[0] };
-            const after = rightPart.slice(closeParen + 1).trim();
-            if (after.startsWith("{") && after.endsWith("}")) {
-              const blockContent = after.slice(1, -1).trim();
-              const stmts = splitCatchStatements(blockContent);
-              const blockSteps = stmts.map((s) => parseCatchStatement(filePath, lineNo, col, s));
-              return {
-                type: "run",
-                workflow: { value: callPart.ref, loc: { line: lineNo, col } },
-                args: callPart.args,
-                ...(callPart.bareIdentifierArgs ? { bareIdentifierArgs: callPart.bareIdentifierArgs } : {}),
-                recover: { block: blockSteps, bindings },
-              };
-            }
-            if (!after.startsWith("{") && after) {
-              const singleStep = parseCatchStatement(filePath, lineNo, col, after);
-              return {
-                type: "run",
-                workflow: { value: callPart.ref, loc: { line: lineNo, col } },
-                args: callPart.args,
-                ...(callPart.bareIdentifierArgs ? { bareIdentifierArgs: callPart.bareIdentifierArgs } : {}),
-                recover: { single: singleStep, bindings },
-              };
-            }
-          }
-        }
-      }
-    }
-    // Check for run ... catch inside catch blocks
-    const recIdx = runBody.indexOf(" catch ");
-    if (recIdx !== -1) {
-      const leftPart = runBody.slice(0, recIdx).trim();
-      const rightPart = runBody.slice(recIdx + " catch ".length).trim();
-      const callPart = parseCallRef(leftPart);
-      if (callPart && !callPart.rest.trim() && rightPart.startsWith("(")) {
-        const closeParen = rightPart.indexOf(")");
-        if (closeParen !== -1) {
-          const bStr = rightPart.slice(1, closeParen).trim();
-          const bParts = bStr.split(",").map((s) => s.trim()).filter(Boolean);
-          if (bParts.length === 1 && /^[A-Za-z_][A-Za-z0-9_]*$/.test(bParts[0])) {
-            const bindings = { failure: bParts[0] };
-            const after = rightPart.slice(closeParen + 1).trim();
-            if (after.startsWith("{") && after.endsWith("}")) {
-              const blockContent = after.slice(1, -1).trim();
-              const stmts = splitCatchStatements(blockContent);
-              const blockSteps = stmts.map((s) => parseCatchStatement(filePath, lineNo, col, s));
-              return {
-                type: "run",
-                workflow: { value: callPart.ref, loc: { line: lineNo, col } },
-                args: callPart.args,
-                ...(callPart.bareIdentifierArgs ? { bareIdentifierArgs: callPart.bareIdentifierArgs } : {}),
-                catch: { block: blockSteps, bindings },
-              };
-            }
-            if (!after.startsWith("{") && after) {
-              const singleStep = parseCatchStatement(filePath, lineNo, col, after);
-              return {
-                type: "run",
-                workflow: { value: callPart.ref, loc: { line: lineNo, col } },
-                args: callPart.args,
-                ...(callPart.bareIdentifierArgs ? { bareIdentifierArgs: callPart.bareIdentifierArgs } : {}),
-                catch: { single: singleStep, bindings },
-              };
-            }
-          }
-        }
-      }
-    }
-    const call = parseCallRef(runBody);
-    if (call) {
-      rejectTrailingContent(filePath, lineNo, "run", call.rest);
-      return {
-        type: "run",
-        workflow: { value: call.ref, loc: { line: lineNo, col } },
-        args: call.args,
-        ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-      };
-    }
-  }
-  if (t.startsWith("ensure ")) {
-    const ensureBody = t.slice("ensure ".length).trim();
-    const ensRecIdx = ensureBody.indexOf(" catch ");
-    if (ensRecIdx !== -1) {
-      const leftPart = ensureBody.slice(0, ensRecIdx).trim();
-      const rightPart = ensureBody.slice(ensRecIdx + " catch ".length).trim();
-      const callPart = parseCallRef(leftPart);
-      if (callPart && !callPart.rest.trim() && rightPart.startsWith("(")) {
-        const closeParen = rightPart.indexOf(")");
-        if (closeParen !== -1) {
-          const bStr = rightPart.slice(1, closeParen).trim();
-          const bParts = bStr.split(",").map((s) => s.trim()).filter(Boolean);
-          if (bParts.length === 1 && /^[A-Za-z_][A-Za-z0-9_]*$/.test(bParts[0])) {
-            const bindings = { failure: bParts[0] };
-            const after = rightPart.slice(closeParen + 1).trim();
-            if (after.startsWith("{") && after.endsWith("}")) {
-              const blockContent = after.slice(1, -1).trim();
-              const stmts = splitCatchStatements(blockContent);
-              const blockSteps = stmts.map((s) => parseCatchStatement(filePath, lineNo, col, s));
-              return {
-                type: "ensure",
-                ref: { value: callPart.ref, loc: { line: lineNo, col } },
-                args: callPart.args,
-                ...(callPart.bareIdentifierArgs ? { bareIdentifierArgs: callPart.bareIdentifierArgs } : {}),
-                catch: { block: blockSteps, bindings },
-              };
-            }
-            if (!after.startsWith("{") && after) {
-              const singleStep = parseCatchStatement(filePath, lineNo, col, after);
-              return {
-                type: "ensure",
-                ref: { value: callPart.ref, loc: { line: lineNo, col } },
-                args: callPart.args,
-                ...(callPart.bareIdentifierArgs ? { bareIdentifierArgs: callPart.bareIdentifierArgs } : {}),
-                catch: { single: singleStep, bindings },
-              };
-            }
-          }
-        }
-      }
-    }
-    const call = parseCallRef(ensureBody);
-    if (call) {
-      rejectTrailingContent(filePath, lineNo, "ensure", call.rest);
-      return {
-        type: "ensure",
-        ref: { value: call.ref, loc: { line: lineNo, col } },
-        args: call.args,
-        ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-      };
-    }
-  }
-  const promptAssignMatch = t.match(
-    /^([A-Za-z_][A-Za-z0-9_]*)\s*=\s*prompt\s+(.+)$/s,
-  );
-  if (promptAssignMatch) {
-    fail(
-      filePath,
-      'use "const name = prompt ..." in catch blocks (e.g. const x = prompt "...")',
-      lineNo,
-      col + t.indexOf(promptAssignMatch[1]),
-    );
-  }
-  if (t.startsWith("prompt ")) {
-    return parsePromptStep(
-      filePath, [], lineNo - 1, t.slice("prompt ".length).trimStart(),
-      col + t.indexOf("prompt"),
-    ).step;
-  }
-  if (t.startsWith("log ") || t === "log") {
-    const logArg = t.slice("log".length).trimStart();
-    const logCol = col + Math.max(0, t.indexOf("log"));
-    const message = parseLogMessageRhs(filePath, lineNo, logCol, logArg, "log");
-    return { type: "log", message, loc: { line: lineNo, col: logCol } };
-  }
-  if (t.startsWith("logerr ") || t === "logerr") {
-    const logerrArg = t.slice("logerr".length).trimStart();
-    const logerrCol = col + Math.max(0, t.indexOf("logerr"));
-    const message = parseLogMessageRhs(filePath, lineNo, logerrCol, logerrArg, "logerr");
-    return { type: "logerr", message, loc: { line: lineNo, col: logerrCol } };
-  }
-  return { type: "shell", command: t, loc: { line: lineNo, col } };
-}
+const KEYWORD_EXAMPLE = {
+  catch: "catch (<name>) { ... }",
+  recover: "recover(<name>) { ... }",
+} as const;
 
 /**
- * Parse an `ensure <ref> [args] [catch ...]` step, with optional captureName.
- * Returns the step and the updated 0-based line index.
+ * Parse a `(<binding>) { … } | <single-stmt>` clause attached to a host
+ * `run` / `ensure` step. The body is parsed by the same `parseBlockStatement`
+ * used at the top level — there is no separate mini parser for catch/recover.
+ *
+ * `textAfterKeyword` is whatever follows `catch` / `recover` on the host line
+ * (the leading `(` may be preceded by whitespace). Returns the constructed
+ * `CatchBody` plus the next line index to resume parsing from.
  */
-export function parseEnsureStep(
+export function parseAttachedBlock(
   filePath: string,
   lines: string[],
   idx: number,
   innerNo: number,
   innerRaw: string,
-  ensureBody: string,
-  captureName?: string,
-): { step: WorkflowStepDef; nextIdx: number } {
-  const catchIdx = ensureBody.indexOf(" catch ");
-  const ensureCol = innerRaw.indexOf("ensure") + 1;
-
-  // `catch` at end of line with no block → error
-  if (/\scatch$/.test(ensureBody)) {
-    const catchCol = innerRaw.indexOf("catch") + 1;
-    fail(
-      filePath,
-      'catch requires explicit bindings and a body: catch (<name>) { ... }',
-      innerNo,
-      catchCol,
-    );
-  }
-
-  if (catchIdx === -1) {
-    const call = parseCallRef(ensureBody);
-    if (!call) {
-      fail(filePath, "ensure must target a valid reference: ensure ref() or ensure ref(args) — parentheses are required", innerNo);
-    }
-    rejectTrailingContent(filePath, innerNo, "ensure", call.rest);
-    return {
-      step: {
-        type: "ensure",
-        ref: { value: call.ref, loc: { line: innerNo, col: ensureCol } },
-        args: call.args,
-        ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-        ...(captureName ? { captureName } : {}),
-      },
-      nextIdx: idx,
-    };
-  }
-  const left = ensureBody.slice(0, catchIdx).trim();
-  const right = ensureBody.slice(catchIdx + " catch ".length).trim();
-  const call = parseCallRef(left);
-  if (!call) {
-    fail(filePath, "ensure must target a valid reference: ensure ref() or ensure ref(args) — parentheses are required", innerNo);
-  }
-  rejectTrailingContent(filePath, innerNo, "ensure", call.rest);
-  const ref = call.ref;
-  const args = call.args;
-  const catchCol = innerRaw.indexOf("catch") + 1;
+  keyword: "catch" | "recover",
+  textAfterKeyword: string,
+  trivia: Trivia = createTrivia(),
+): { body: CatchBody; nextIdx: number } {
+  const keywordCol = innerRaw.indexOf(keyword) + 1;
+  const right = textAfterKeyword.trimStart();
 
-  // Catch requires explicit bindings: catch (<name>)
   if (!right.startsWith("(")) {
     fail(
       filePath,
-      'catch requires explicit bindings: catch (<name>) { ... }',
+      `${keyword} requires explicit bindings: ${KEYWORD_EXAMPLE[keyword]}`,
       innerNo,
-      catchCol,
+      keywordCol,
     );
   }
-
   const closeParen = right.indexOf(")");
   if (closeParen === -1) {
-    fail(filePath, 'unterminated catch bindings: expected ")"', innerNo, catchCol);
-  }
-  const bindingsStr = right.slice(1, closeParen).trim();
-  const bindingParts = bindingsStr.split(",").map((s) => s.trim()).filter(Boolean);
-  if (bindingParts.length === 0) {
-    fail(filePath, "catch requires exactly one binding: catch (<name>) { ... }", innerNo, catchCol);
-  }
-  if (bindingParts.length > 1) {
-    fail(filePath, 'catch accepts exactly one binding: catch (<name>) — the second binding (attempt) has been removed', innerNo, catchCol);
-  }
-  if (!/^[A-Za-z_][A-Za-z0-9_]*$/.test(bindingParts[0])) {
-    fail(filePath, `invalid catch binding name: "${bindingParts[0]}" — must be a valid identifier`, innerNo, catchCol);
-  }
-  const bindings = { failure: bindingParts[0] };
-
-  const afterBindings = right.slice(closeParen + 1).trim();
-
-  const refLoc = { value: ref, loc: { line: innerNo, col: ensureCol } };
-  const base = {
-    type: "ensure" as const, ref: refLoc, args,
-    ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-    ...(captureName ? { captureName } : {}),
-  };
-
-  if (afterBindings === "{") {
-    let blockLines: string[] = [];
-    let closeLineIdx = -1;
-    let braceDepth = 1;
-    for (let look = idx + 1; look < lines.length; look += 1) {
-      const trimmed = lines[look].trim();
-      if (trimmed.endsWith("{")) braceDepth += 1;
-      if (trimmed === "}") {
-        braceDepth -= 1;
-        if (braceDepth === 0) { closeLineIdx = look; break; }
-      }
-      blockLines.push(trimmed);
-    }
-    if (closeLineIdx === -1) {
-      fail(filePath, 'unterminated catch block, expected "}"', innerNo, catchCol);
-    }
-    const statements = splitCatchStatements(blockLines.join("\n"));
-    if (statements.length === 0) {
-      fail(filePath, "catch block must contain at least one statement", innerNo, catchCol);
-    }
-    const blockSteps = statements.map((s) => parseCatchStatement(filePath, innerNo, 1, s));
-    return { step: { ...base, catch: { block: blockSteps, bindings } }, nextIdx: closeLineIdx };
-  }
-
-  if (afterBindings.startsWith("{")) {
-    const closeBrace = afterBindings.indexOf("}");
-    if (closeBrace === -1) {
-      fail(filePath, 'unterminated catch block, expected "}"', innerNo, catchCol);
-    }
-    const blockContent = afterBindings.slice(1, closeBrace).trim();
-    const statements = splitCatchStatements(blockContent);
-    if (statements.length === 0) {
-      fail(filePath, "catch block must contain at least one statement", innerNo, catchCol);
-    }
-    const blockSteps = statements.map((s) => parseCatchStatement(filePath, innerNo, catchCol, s));
-    return { step: { ...base, catch: { block: blockSteps, bindings } }, nextIdx: idx };
+    fail(filePath, `unterminated ${keyword} bindings: expected ")"`, innerNo, keywordCol);
   }
 
-  if (!afterBindings) {
-    fail(filePath, "catch requires a body after bindings", innerNo, catchCol);
-  }
-
-  const singleStep = parseCatchStatement(filePath, innerNo, catchCol, afterBindings);
-  return { step: { ...base, catch: { single: singleStep, bindings } }, nextIdx: idx };
-}
-
-/**
- * Try to parse `run <ref>(args) recover(binding) { ... }` syntax (loop semantics).
- * Returns null if the run body does not contain ` recover `.
- */
-export function parseRunRecoverStep(
-  filePath: string,
-  lines: string[],
-  idx: number,
-  innerNo: number,
-  innerRaw: string,
-  runBody: string,
-  captureName?: string,
-): { step: WorkflowStepDef; nextIdx: number } | null {
-  // Match ` recover(`, ` recover `, or ` recover` at end of line
-  const recoverMatch = runBody.match(/ recover(?=[\s(]|$)/);
-  if (!recoverMatch) return null;
-  const recoverIdx = recoverMatch.index!;
-
-  if (/ recover$/.test(runBody)) {
-    const recoverCol = innerRaw.indexOf("recover") + 1;
+  const bindingParts = right
+    .slice(1, closeParen)
+    .split(",")
+    .map((s) => s.trim())
+    .filter(Boolean);
+  if (bindingParts.length === 0) {
     fail(
       filePath,
-      'recover requires explicit bindings and a body: recover(<name>) { ... }',
+      `${keyword} requires exactly one binding: ${KEYWORD_EXAMPLE[keyword]}`,
       innerNo,
-      recoverCol,
+      keywordCol,
     );
   }
-
-  const left = runBody.slice(0, recoverIdx).trim();
-  const right = runBody.slice(recoverIdx + " recover".length).trimStart();
-  const call = parseCallRef(left);
-  if (!call || call.rest.trim()) return null;
-  const runCol = innerRaw.indexOf("run") + 1;
-  const recoverCol = innerRaw.indexOf("recover") + 1;
-
-  if (!right.startsWith("(")) {
+  if (bindingParts.length > 1) {
+    if (keyword === "catch") {
+      fail(
+        filePath,
+        "catch accepts exactly one binding: catch (<name>) — the second binding (attempt) has been removed",
+        innerNo,
+        keywordCol,
+      );
+    }
+    fail(filePath, "recover accepts exactly one binding: recover(<name>)", innerNo, keywordCol);
+  }
+  if (!/^[A-Za-z_][A-Za-z0-9_]*$/.test(bindingParts[0])) {
     fail(
       filePath,
-      'recover requires explicit bindings: recover(<name>) { ... }',
+      `invalid ${keyword} binding name: "${bindingParts[0]}" — must be a valid identifier`,
       innerNo,
-      recoverCol,
+      keywordCol,
     );
   }
-
-  const closeParen = right.indexOf(")");
-  if (closeParen === -1) {
-    fail(filePath, 'unterminated recover bindings: expected ")"', innerNo, recoverCol);
-  }
-  const bindingsStr = right.slice(1, closeParen).trim();
-  const bindingParts = bindingsStr.split(",").map((s) => s.trim()).filter(Boolean);
-  if (bindingParts.length === 0) {
-    fail(filePath, "recover requires exactly one binding: recover(<name>) { ... }", innerNo, recoverCol);
-  }
-  if (bindingParts.length > 1) {
-    fail(filePath, "recover accepts exactly one binding: recover(<name>)", innerNo, recoverCol);
-  }
-  if (!/^[A-Za-z_][A-Za-z0-9_]*$/.test(bindingParts[0])) {
-    fail(filePath, `invalid recover binding name: "${bindingParts[0]}" — must be a valid identifier`, innerNo, recoverCol);
-  }
   const bindings = { failure: bindingParts[0] };
-
   const afterBindings = right.slice(closeParen + 1).trim();
-  const base = {
-    type: "run" as const,
-    workflow: { value: call.ref, loc: { line: innerNo, col: runCol } },
-    args: call.args,
-    ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-    ...(captureName ? { captureName } : {}),
-  };
 
+  // Multi-line block: `{` at end of host line; body lives on subsequent lines.
   if (afterBindings === "{") {
-    let blockLines: string[] = [];
-    let closeLineIdx = -1;
-    let braceDepth = 1;
-    for (let look = idx + 1; look < lines.length; look += 1) {
-      const trimmed = lines[look].trim();
-      if (trimmed.endsWith("{")) braceDepth += 1;
-      if (trimmed === "}") {
-        braceDepth -= 1;
-        if (braceDepth === 0) { closeLineIdx = look; break; }
+    // Pre-scan for the matching `}` so the unterminated message names the clause.
+    let depth = 1;
+    let probe = idx + 1;
+    while (probe < lines.length) {
+      const t = lines[probe].trim();
+      if (t.endsWith("{")) depth += 1;
+      if (t === "}") {
+        depth -= 1;
+        if (depth === 0) break;
       }
-      blockLines.push(trimmed);
+      probe += 1;
     }
-    if (closeLineIdx === -1) {
-      fail(filePath, 'unterminated recover block, expected "}"', innerNo, recoverCol);
+    if (probe >= lines.length) {
+      fail(filePath, `unterminated ${keyword} block, expected "}"`, innerNo, keywordCol);
     }
-    const statements = splitCatchStatements(blockLines.join("\n"));
-    if (statements.length === 0) {
-      fail(filePath, "recover block must contain at least one statement", innerNo, recoverCol);
+    const { steps, nextIdx } = parseBraceBlockBody(filePath, lines, idx + 1, innerNo, trivia);
+    if (steps.length === 0) {
+      fail(filePath, `${keyword} block must contain at least one statement`, innerNo, keywordCol);
     }
-    const blockSteps = statements.map((s) => parseCatchStatement(filePath, innerNo, 1, s));
-    return { step: { ...base, recover: { block: blockSteps, bindings } }, nextIdx: closeLineIdx };
+    return { body: { block: steps, bindings }, nextIdx };
   }
 
+  // Inline block on a single line: `{ stmt[; stmt]* }`.
   if (afterBindings.startsWith("{")) {
-    const closeBrace = afterBindings.indexOf("}");
-    if (closeBrace === -1) {
-      fail(filePath, 'unterminated recover block, expected "}"', innerNo, recoverCol);
+    if (!afterBindings.endsWith("}")) {
+      fail(filePath, `unterminated ${keyword} block, expected "}"`, innerNo, keywordCol);
     }
-    const blockContent = afterBindings.slice(1, closeBrace).trim();
-    const statements = splitCatchStatements(blockContent);
-    if (statements.length === 0) {
-      fail(filePath, "recover block must contain at least one statement", innerNo, recoverCol);
+    const content = afterBindings.slice(1, -1).trim();
+    const stmts = content === "" ? [] : splitStatementsOnSemicolons(content);
+    if (stmts.length === 0) {
+      fail(filePath, `${keyword} block must contain at least one statement`, innerNo, keywordCol);
     }
-    const blockSteps = statements.map((s) => parseCatchStatement(filePath, innerNo, recoverCol, s));
-    return { step: { ...base, recover: { block: blockSteps, bindings } }, nextIdx: idx };
+    const blockSteps = stmts.map((stmt) => parseAtHostLine(filePath, idx, stmt, trivia));
+    return { body: { block: blockSteps, bindings }, nextIdx: idx + 1 };
   }
 
-  if (!afterBindings) {
-    fail(filePath, "recover requires a body after bindings", innerNo, recoverCol);
+  if (afterBindings === "") {
+    fail(filePath, `${keyword} requires a body after bindings`, innerNo, keywordCol);
   }
 
-  const singleStep = parseCatchStatement(filePath, innerNo, recoverCol, afterBindings);
-  return { step: { ...base, recover: { single: singleStep, bindings } }, nextIdx: idx };
+  const single = parseAtHostLine(filePath, idx, afterBindings, trivia);
+  return { body: { single, bindings }, nextIdx: idx + 1 };
 }
 
 /**
- * Try to parse `run <ref>(args) catch (bindings) { ... }` syntax.
- * Returns null if the run body does not contain ` catch `.
+ * Parse a single statement string as if it lived on the host line. Padded
+ * lines preserve the source line number in nested error messages.
  */
-export function parseRunCatchStep(
+function parseAtHostLine(
   filePath: string,
-  lines: string[],
-  idx: number,
-  innerNo: number,
-  innerRaw: string,
-  runBody: string,
-  captureName?: string,
-): { step: WorkflowStepDef; nextIdx: number } | null {
-  const catchIdx = runBody.indexOf(" catch ");
-  if (catchIdx === -1) return null;
-
-  // `catch` at end of line with no block → error
-  if (/\scatch$/.test(runBody)) {
-    const catchCol = innerRaw.indexOf("catch") + 1;
-    fail(
-      filePath,
-      'catch requires explicit bindings and a body: catch (<name>) { ... }',
-      innerNo,
-      catchCol,
-    );
-  }
-
-  const left = runBody.slice(0, catchIdx).trim();
-  const right = runBody.slice(catchIdx + " catch ".length).trim();
-  const call = parseCallRef(left);
-  if (!call || call.rest.trim()) return null;
-  const runCol = innerRaw.indexOf("run") + 1;
-  const catchCol = innerRaw.indexOf("catch") + 1;
-
-  if (!right.startsWith("(")) {
-    fail(
-      filePath,
-      'catch requires explicit bindings: catch (<name>) { ... }',
-      innerNo,
-      catchCol,
-    );
-  }
-
-  const closeParen = right.indexOf(")");
-  if (closeParen === -1) {
-    fail(filePath, 'unterminated catch bindings: expected ")"', innerNo, catchCol);
-  }
-  const bindingsStr = right.slice(1, closeParen).trim();
-  const bindingParts = bindingsStr.split(",").map((s) => s.trim()).filter(Boolean);
-  if (bindingParts.length === 0) {
-    fail(filePath, "catch requires exactly one binding: catch (<name>) { ... }", innerNo, catchCol);
-  }
-  if (bindingParts.length > 1) {
-    fail(filePath, 'catch accepts exactly one binding: catch (<name>) — the second binding (attempt) has been removed', innerNo, catchCol);
-  }
-  if (!/^[A-Za-z_][A-Za-z0-9_]*$/.test(bindingParts[0])) {
-    fail(filePath, `invalid catch binding name: "${bindingParts[0]}" — must be a valid identifier`, innerNo, catchCol);
-  }
-  const bindings = { failure: bindingParts[0] };
-
-  const afterBindings = right.slice(closeParen + 1).trim();
-  const base = {
-    type: "run" as const,
-    workflow: { value: call.ref, loc: { line: innerNo, col: runCol } },
-    args: call.args,
-    ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-    ...(captureName ? { captureName } : {}),
-  };
-
-  if (afterBindings === "{") {
-    let blockLines: string[] = [];
-    let closeLineIdx = -1;
-    let braceDepth = 1;
-    for (let look = idx + 1; look < lines.length; look += 1) {
-      const trimmed = lines[look].trim();
-      if (trimmed.endsWith("{")) braceDepth += 1;
-      if (trimmed === "}") {
-        braceDepth -= 1;
-        if (braceDepth === 0) { closeLineIdx = look; break; }
-      }
-      blockLines.push(trimmed);
-    }
-    if (closeLineIdx === -1) {
-      fail(filePath, 'unterminated catch block, expected "}"', innerNo, catchCol);
-    }
-    const statements = splitCatchStatements(blockLines.join("\n"));
-    if (statements.length === 0) {
-      fail(filePath, "catch block must contain at least one statement", innerNo, catchCol);
-    }
-    const blockSteps = statements.map((s) => parseCatchStatement(filePath, innerNo, 1, s));
-    return { step: { ...base, catch: { block: blockSteps, bindings } }, nextIdx: closeLineIdx };
-  }
-
-  if (afterBindings.startsWith("{")) {
-    const closeBrace = afterBindings.indexOf("}");
-    if (closeBrace === -1) {
-      fail(filePath, 'unterminated catch block, expected "}"', innerNo, catchCol);
-    }
-    const blockContent = afterBindings.slice(1, closeBrace).trim();
-    const statements = splitCatchStatements(blockContent);
-    if (statements.length === 0) {
-      fail(filePath, "catch block must contain at least one statement", innerNo, catchCol);
-    }
-    const blockSteps = statements.map((s) => parseCatchStatement(filePath, innerNo, catchCol, s));
-    return { step: { ...base, catch: { block: blockSteps, bindings } }, nextIdx: idx };
-  }
-
-  if (!afterBindings) {
-    fail(filePath, "catch requires a body after bindings", innerNo, catchCol);
-  }
-
-  const singleStep = parseCatchStatement(filePath, innerNo, catchCol, afterBindings);
-  return { step: { ...base, catch: { single: singleStep, bindings } }, nextIdx: idx };
+  hostIdx: number,
+  stmt: string,
+  trivia: Trivia,
+): WorkflowStepDef {
+  const padded = new Array<string>(hostIdx).fill("");
+  padded.push(stmt);
+  return parseBlockStatement(filePath, padded, hostIdx, trivia).step;
 }
diff --git a/src/parse/tests.ts b/src/parse/tests.ts
index 0771a0bc..3d69c32e 100644
--- a/src/parse/tests.ts
+++ b/src/parse/tests.ts
@@ -1,4 +1,5 @@
 import type { MatchArmDef, TestBlockDef, WorkflowStepDef } from "../types";
+import { createTrivia, type Trivia } from "./trivia";
 import { colFromRaw, fail, hasUnescapedClosingQuote, isRef, parseParamList, stripQuotes } from "./core";
 import { parseMatchArms } from "./match";
 import { parseBraceBlockBody } from "./workflow-brace";
@@ -99,7 +100,7 @@ export function parseTestBlock(
   filePath: string,
   lines: string[],
   startIndex: number,
-  leadingComments?: string[],
+  trivia: Trivia = createTrivia(),
 ): { testBlock: TestBlockDef; nextIndex: number } {
   const lineNo = startIndex + 1;
   const raw = lines[startIndex];
@@ -115,9 +116,6 @@ export function parseTestBlock(
     steps: [],
     loc: { line: lineNo, col: raw.indexOf("test") + 1 },
   };
-  if (leadingComments && leadingComments.length > 0) {
-    testBlock.leadingComments = [...leadingComments];
-  }
 
   let i = startIndex + 1;
   for (; i < lines.length; i += 1) {
@@ -183,7 +181,7 @@ export function parseTestBlock(
     rejectOldMockSyntax(filePath, inner, "workflow", innerNo, col);
     const mockWfHeader = parseMockHeader(filePath, inner, "mock workflow ", innerNo, col);
     if (mockWfHeader) {
-      const { steps, nextIdx } = parseBraceBlockBody(filePath, lines, i + 1, innerNo, { forRule: false });
+      const { steps, nextIdx } = parseBraceBlockBody(filePath, lines, i + 1, innerNo, trivia, { forRule: false });
       testBlock.steps.push({ type: "test_mock_workflow", ref: mockWfHeader.ref, params: mockWfHeader.params, steps, loc });
       i = nextIdx - 1;
       continue;
@@ -193,7 +191,7 @@ export function parseTestBlock(
     rejectOldMockSyntax(filePath, inner, "rule", innerNo, col);
     const mockRuleHeader = parseMockHeader(filePath, inner, "mock rule ", innerNo, col);
     if (mockRuleHeader) {
-      const { steps, nextIdx } = parseBraceBlockBody(filePath, lines, i + 1, innerNo, { forRule: true });
+      const { steps, nextIdx } = parseBraceBlockBody(filePath, lines, i + 1, innerNo, trivia, { forRule: true });
       testBlock.steps.push({ type: "test_mock_rule", ref: mockRuleHeader.ref, params: mockRuleHeader.params, steps, loc });
       i = nextIdx - 1;
       continue;
diff --git a/src/parse/triple-quote.ts b/src/parse/triple-quote.ts
index 4856acbf..e68fa4a6 100644
--- a/src/parse/triple-quote.ts
+++ b/src/parse/triple-quote.ts
@@ -1,3 +1,4 @@
+import { dedentCommonLeadingWhitespace } from "./dedent";
 import { fail } from "./core";
 
 /** Per language.md: trim blank lines adjacent to opening/closing `"""` only — do not dedent inner margin. */
@@ -58,6 +59,32 @@ export function tripleQuoteBodyToRaw(body: string): string {
   return `"${body.replace(/\\/g, "\\\\").replace(/"/g, '\\"')}"`;
 }
 
+/**
+ * Apply common-leading-whitespace dedent to a triple-quoted body. The parser
+ * applies this so the semantic AST string carries the runtime-ready form;
+ * runtime & validator stop needing a `tripleQuoted` flag.
+ */
+export function dedentTripleQuotedBody(body: string): string {
+  return dedentCommonLeadingWhitespace(body);
+}
+
+function unescapeDslDoubleQuotedInner(inner: string): string {
+  return inner.replace(/\\"/g, '"').replace(/\\\\/g, "\\");
+}
+
+/**
+ * Canonicalize a triple-quoted body that was stored in `tripleQuoteBodyToRaw`
+ * (`"…escaped…"`) form. Used by match-arm bodies, which still carry their own
+ * `tripleQuotedBody` flag instead of being dedented at parse time. The runtime
+ * and the validator share this helper so that "what the runtime executes" and
+ * "what the validator inspects" are bit-for-bit identical.
+ */
+export function canonicalizeTripleQuotedString(raw: string): string {
+  if (raw.length < 2 || raw[0] !== '"' || raw[raw.length - 1] !== '"') return raw;
+  const inner = unescapeDslDoubleQuotedInner(raw.slice(1, -1));
+  return tripleQuoteBodyToRaw(dedentCommonLeadingWhitespace(inner));
+}
+
 /**
  * Helper for step parsers: when a step argument starts with `"""`, splice it back
  * onto the source line and parse the triple-quoted block. Errors if any content
diff --git a/src/parse/trivia-ast-shape.test.ts b/src/parse/trivia-ast-shape.test.ts
new file mode 100644
index 00000000..0e5cac1c
--- /dev/null
+++ b/src/parse/trivia-ast-shape.test.ts
@@ -0,0 +1,83 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import type {
+  ChannelDef,
+  ImportDef,
+  ScriptDef,
+  ScriptImportDef,
+  TestBlockDef,
+  WorkflowMetadata,
+  WorkflowStepDef,
+  jaiphModule,
+  Expr,
+} from "../types";
+
+/**
+ * AC1 (Trivia/CST split): source-fidelity fields must not live on semantic
+ * AST types. Each helper below assigns an object literal with the field that
+ * *used* to exist; if anyone re-adds the field to the public type, the literal
+ * widens, the type assertion below fails, and TypeScript breaks compilation.
+ */
+
+type HasField<T, K extends string> = T extends Record<K, unknown> ? true : false;
+
+// jaiphModule must not carry: configLeadingComments, trailingTopLevelComments, topLevelOrder.
+const _moduleNoConfigLeading: HasField<jaiphModule, "configLeadingComments"> = false;
+const _moduleNoTrailing: HasField<jaiphModule, "trailingTopLevelComments"> = false;
+const _moduleNoTopLevelOrder: HasField<jaiphModule, "topLevelOrder"> = false;
+
+// ImportDef / ScriptImportDef / ChannelDef / TestBlockDef must not carry leadingComments.
+const _importNoLeading: HasField<ImportDef, "leadingComments"> = false;
+const _scriptImportNoLeading: HasField<ScriptImportDef, "leadingComments"> = false;
+const _channelNoLeading: HasField<ChannelDef, "leadingComments"> = false;
+const _testBlockNoLeading: HasField<TestBlockDef, "leadingComments"> = false;
+
+// WorkflowMetadata must not carry configBodySequence.
+const _metaNoConfigSeq: HasField<WorkflowMetadata, "configBodySequence"> = false;
+
+// ScriptDef must not carry bodyKind.
+const _scriptNoBodyKind: HasField<ScriptDef, "bodyKind"> = false;
+
+// Step variants must not carry surface-form trivia.
+type SayStep = Extract<WorkflowStepDef, { type: "say" }>;
+type ReturnStep = Extract<WorkflowStepDef, { type: "return" }>;
+type SendStep = Extract<WorkflowStepDef, { type: "send" }>;
+type ExecStep = Extract<WorkflowStepDef, { type: "exec" }>;
+
+const _sayNoTripleQuoted: HasField<SayStep, "tripleQuoted"> = false;
+const _returnNoTripleQuoted: HasField<ReturnStep, "tripleQuoted"> = false;
+const _returnNoBareSource: HasField<ReturnStep, "bareSource"> = false;
+const _execNoBodyKind: HasField<ExecStep, "bodyKind"> = false;
+const _execNoBodyIdentifier: HasField<ExecStep, "bodyIdentifier"> = false;
+
+// Expr literal must not carry tripleQuoted — that lives in trivia instead.
+type LiteralExpr = Extract<Expr, { kind: "literal" }>;
+type PromptExpr = Extract<Expr, { kind: "prompt" }>;
+const _literalNoTripleQuoted: HasField<LiteralExpr, "tripleQuoted"> = false;
+const _promptNoBodyKind: HasField<PromptExpr, "bodyKind"> = false;
+const _promptNoBodyIdentifier: HasField<PromptExpr, "bodyIdentifier"> = false;
+
+// send.value carries an Expr; the old SendRhsDef.literal wrapper with
+// `tripleQuoted` is gone.
+const _sendValueIsExpr: SendStep["value"] extends Expr ? true : false = true;
+
+test("AC1: no trivia fields on semantic AST types", () => {
+  assert.equal(_moduleNoConfigLeading, false);
+  assert.equal(_moduleNoTrailing, false);
+  assert.equal(_moduleNoTopLevelOrder, false);
+  assert.equal(_importNoLeading, false);
+  assert.equal(_scriptImportNoLeading, false);
+  assert.equal(_channelNoLeading, false);
+  assert.equal(_testBlockNoLeading, false);
+  assert.equal(_metaNoConfigSeq, false);
+  assert.equal(_scriptNoBodyKind, false);
+  assert.equal(_sayNoTripleQuoted, false);
+  assert.equal(_returnNoTripleQuoted, false);
+  assert.equal(_returnNoBareSource, false);
+  assert.equal(_execNoBodyKind, false);
+  assert.equal(_execNoBodyIdentifier, false);
+  assert.equal(_literalNoTripleQuoted, false);
+  assert.equal(_promptNoBodyKind, false);
+  assert.equal(_promptNoBodyIdentifier, false);
+  assert.equal(_sendValueIsExpr, true);
+});
diff --git a/src/parse/trivia-grep.test.ts b/src/parse/trivia-grep.test.ts
new file mode 100644
index 00000000..7b409b27
--- /dev/null
+++ b/src/parse/trivia-grep.test.ts
@@ -0,0 +1,49 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readFileSync } from "node:fs";
+import { resolve, join } from "node:path";
+
+// Tests run from dist/src/parse/, so repo root is three levels up.
+const repoRoot = resolve(__dirname, "../../..");
+
+/** Validator and emitter source files that must not reference Trivia. */
+const PROTECTED_FILES = [
+  "src/transpile/validate.ts",
+  "src/transpile/validate-string.ts",
+  "src/transpile/validate-prompt-schema.ts",
+  "src/transpile/validate-ref-resolution.ts",
+  "src/transpile/validate-substitution.ts",
+  "src/transpile/validate-match.test.ts",
+  "src/transpile/emit-script.ts",
+  "src/transpile/emit-from-graph.ts",
+];
+
+test("AC2: validator and emitter sources do not import Trivia", () => {
+  for (const rel of PROTECTED_FILES) {
+    const abs = join(repoRoot, rel);
+    let content: string;
+    try {
+      content = readFileSync(abs, "utf8");
+    } catch {
+      // File doesn't exist in this checkout — skip rather than fail.
+      continue;
+    }
+    // No imports from the trivia module.
+    assert.equal(
+      /from\s+["'][^"']*\/parse\/trivia["']/.test(content),
+      false,
+      `${rel} imports from parse/trivia — validator/emitter must not read Trivia`,
+    );
+    // No reference to the Trivia identifier or its node-trivia fields.
+    const forbidden = ["Trivia", "createTrivia", "NodeTrivia", "ModuleTrivia"];
+    for (const sym of forbidden) {
+      // Word boundary on each side.
+      const re = new RegExp(`\\b${sym}\\b`);
+      assert.equal(
+        re.test(content),
+        false,
+        `${rel} references ${sym} — validator/emitter must not see Trivia`,
+      );
+    }
+  }
+});
diff --git a/src/parse/trivia.ts b/src/parse/trivia.ts
new file mode 100644
index 00000000..06bd14f3
--- /dev/null
+++ b/src/parse/trivia.ts
@@ -0,0 +1,78 @@
+import type { TopLevelEmitOrder } from "../types";
+
+/** One line inside `config { }`: comment or assignment (formatter round-trip order). */
+export type ConfigBodyPart =
+  | { kind: "comment"; text: string }
+  | { kind: "assign"; key: string };
+
+/**
+ * Per-node source-fidelity data. Each field is optional; presence indicates a
+ * particular surface form chosen by the author that the formatter needs to
+ * round-trip. The validator/emitter never look at this map.
+ *
+ * - `tripleQuoted`: the literal/return/log/logerr/fail/send/const was written
+ *   as `"""..."""`. The AST string is the *dedented* form (so runtime &
+ *   validator don't need this flag); the original raw body is in `rawBody`.
+ * - `rawBody`: original triple-quoted body (without surrounding `"""`), used
+ *   by the formatter to re-emit the author's exact indentation.
+ * - `bareSource`: `return foo` and `return foo.bar` sugar — formatter
+ *   re-emits the bare form instead of `"${foo}"`.
+ * - `bodyKind` (prompt): `"string" | "identifier" | "triple_quoted"`.
+ * - `bodyIdentifier` (prompt): identifier name when `bodyKind === "identifier"`.
+ * - `scriptBodyKind` (script): `"backtick" | "fenced"`.
+ * - `leadingComments`: `#` lines immediately before an import / channel /
+ *   test block / env decl.
+ */
+export interface NodeTrivia {
+  tripleQuoted?: boolean;
+  rawBody?: string;
+  bareSource?: string;
+  bodyKind?: "string" | "identifier" | "triple_quoted";
+  bodyIdentifier?: string;
+  scriptBodyKind?: "backtick" | "fenced";
+  leadingComments?: string[];
+  /** Order and comment lines inside `config { … }`; keyed on the metadata object. */
+  configBodySequence?: ConfigBodyPart[];
+}
+
+/** Module-level source-fidelity data not tied to a specific node. */
+export interface ModuleTrivia {
+  configLeadingComments?: string[];
+  configBodySequence?: ConfigBodyPart[];
+  trailingTopLevelComments?: string[];
+  topLevelOrder?: TopLevelEmitOrder[];
+}
+
+/**
+ * Trivia store. The parser builds it alongside the semantic AST and returns
+ * both via `parsejaiph`. The formatter reads it; nobody else does.
+ */
+export class Trivia {
+  private nodes = new WeakMap<object, NodeTrivia>();
+  private moduleData: ModuleTrivia = {};
+
+  setNode(node: object, info: NodeTrivia): void {
+    const existing = this.nodes.get(node);
+    if (existing) {
+      Object.assign(existing, info);
+    } else {
+      this.nodes.set(node, { ...info });
+    }
+  }
+
+  getNode(node: object): NodeTrivia | undefined {
+    return this.nodes.get(node);
+  }
+
+  setModule(info: Partial<ModuleTrivia>): void {
+    Object.assign(this.moduleData, info);
+  }
+
+  getModule(): ModuleTrivia {
+    return this.moduleData;
+  }
+}
+
+export function createTrivia(): Trivia {
+  return new Trivia();
+}
diff --git a/src/parse/workflow-brace.ts b/src/parse/workflow-brace.ts
index 485d1c10..7c605942 100644
--- a/src/parse/workflow-brace.ts
+++ b/src/parse/workflow-brace.ts
@@ -1,4 +1,5 @@
-import type { WorkflowMetadata, WorkflowStepDef } from "../types";
+import type { CatchBody, Expr, WorkflowMetadata, WorkflowStepDef } from "../types";
+import { createTrivia, type Trivia } from "./trivia";
 import {
   colFromRaw,
   fail,
@@ -9,11 +10,11 @@ import {
   parseLogMessageRhs,
   rejectTrailingContent,
 } from "./core";
-import { consumeTripleQuotedArg, tripleQuoteBodyToRaw } from "./triple-quote";
+import { consumeTripleQuotedArg, dedentTripleQuotedBody, tripleQuoteBodyToRaw } from "./triple-quote";
 import { parseConstRhs } from "./const-rhs";
 import { parseAnonymousInlineScript } from "./inline-script";
 import { parseConfigBlock } from "./metadata";
-import { parseEnsureStep, parseRunCatchStep, parseRunRecoverStep } from "./steps";
+import { parseAttachedBlock } from "./steps";
 import { parsePromptStep } from "./prompt";
 import { parseSendRhs } from "./send-rhs";
 import { parseMatchExpr } from "./match";
@@ -21,7 +22,7 @@ import { dottedReturnToQuotedString, isBareDottedIdentifierReturn, isBareIdentif
 
 export type BlockParseOpts = {
   forRule?: boolean;
-  /** When true, push `blank_line` steps so the formatter can preserve spacing. */
+  /** When true, push `blank_line` trivia steps so the formatter can preserve spacing. */
   preserveBlankLines?: boolean;
   /**
    * When set, allow a `config { … }` block as the first non-comment statement.
@@ -29,6 +30,12 @@ export type BlockParseOpts = {
    * reject specific keys (workflows reject `runtime.*` and `module.*`).
    */
   onConfigBlock?: (metadata: WorkflowMetadata, lineNo: number) => void;
+  /**
+   * When set (used for `if` bodies), also close the block on a `} else {`
+   * line and signal it via `closedWithElse` in the return value. Without
+   * this flag, `} else {` is parsed as a normal statement line (and errors).
+   */
+  allowElseTerminator?: boolean;
 };
 
 /** Parse statements until a closing `}` at the current block level. */
@@ -37,8 +44,9 @@ export function parseBraceBlockBody(
   lines: string[],
   startIdx: number,
   openerLineNo: number,
+  trivia: Trivia = createTrivia(),
   opts?: BlockParseOpts,
-): { steps: WorkflowStepDef[]; nextIdx: number } {
+): { steps: WorkflowStepDef[]; nextIdx: number; closedWithElse?: boolean } {
   const steps: WorkflowStepDef[] = [];
   let idx = startIdx;
   let hadNonCommentStep = false;
@@ -49,8 +57,8 @@ export function parseBraceBlockBody(
     if (inner === "") {
       if (opts?.preserveBlankLines) {
         const last = steps[steps.length - 1];
-        if (last && last.type !== "blank_line") {
-          steps.push({ type: "blank_line" });
+        if (last && !(last.type === "trivia" && last.kind === "blank_line")) {
+          steps.push({ type: "trivia", kind: "blank_line" });
         }
       }
       idx += 1;
@@ -58,13 +66,33 @@ export function parseBraceBlockBody(
     }
     if (inner.startsWith("#")) {
       steps.push({
-        type: "comment",
+        type: "trivia",
+        kind: "comment",
         text: innerRaw.trim(),
         loc: { line: innerNo, col: 1 },
       });
       idx += 1;
       continue;
     }
+    if (opts?.allowElseTerminator && /^}\s*else\b/.test(inner)) {
+      if (/^}\s*else\s+if\b/.test(inner)) {
+        fail(
+          filePath,
+          '"else if" chaining is not supported; nest an "if" inside the "else" block, or use "match" for multi-way branching',
+          innerNo,
+          innerRaw.indexOf("else") + 1,
+        );
+      }
+      if (/^}\s*else\s*\{\s*$/.test(inner)) {
+        return { steps, nextIdx: idx + 1, closedWithElse: true };
+      }
+      fail(
+        filePath,
+        '"else" must appear on the same line as the closing "}" of the "if" block, followed by "{" (e.g., "} else {")',
+        innerNo,
+        innerRaw.indexOf("else") + 1,
+      );
+    }
     if (inner === "}") {
       return { steps, nextIdx: idx + 1 };
     }
@@ -72,7 +100,7 @@ export function parseBraceBlockBody(
       if (hadNonCommentStep) {
         fail(filePath, "config block inside workflow must appear before any steps", innerNo);
       }
-      const { metadata, nextIndex } = parseConfigBlock(filePath, lines, idx);
+      const { metadata, nextIndex } = parseConfigBlock(filePath, lines, idx, trivia);
       opts.onConfigBlock(metadata, innerNo);
       idx = nextIndex;
       continue;
@@ -89,527 +117,661 @@ export function parseBraceBlockBody(
       );
     }
     hadNonCommentStep = true;
-    const one = parseBlockStatement(filePath, lines, idx, opts);
+    const one = parseBlockStatement(filePath, lines, idx, trivia, opts);
     steps.push(one.step);
     idx = one.nextIdx;
   }
   fail(filePath, 'unterminated block, expected "}"', openerLineNo);
 }
 
+/** Build an `exec` step from a value expression and optional capture/catch/recover. */
+function execStep(
+  body: Expr,
+  loc: { line: number; col: number },
+  extras: { captureName?: string; catch?: CatchBody; recover?: CatchBody } = {},
+): WorkflowStepDef {
+  return {
+    type: "exec",
+    body,
+    ...(extras.captureName ? { captureName: extras.captureName } : {}),
+    ...(extras.catch ? { catch: extras.catch } : {}),
+    ...(extras.recover ? { recover: extras.recover } : {}),
+    loc,
+  };
+}
+
 /**
- * One workflow statement inside `{ … }` (catch body, etc.).
+ * Parse `run [async] <ref>(args)` or `ensure <ref>(args)`, optionally followed
+ * by `catch (binding) { ... }` or — for `run` only — `recover(binding) { ... }`.
+ *
+ * The catch/recover clause is parsed via the unified `parseAttachedBlock`, whose
+ * body uses the same `parseBlockStatement` as the top-level dispatcher.
  */
-export function parseBlockStatement(
+function parseRunOrEnsure(
   filePath: string,
   lines: string[],
   idx: number,
-  opts?: BlockParseOpts,
+  innerNo: number,
+  innerRaw: string,
+  host: "run" | "ensure",
+  hostBody: string,
+  isAsync: boolean,
+  captureName: string | undefined,
+  trivia: Trivia,
 ): { step: WorkflowStepDef; nextIdx: number } {
-  const innerRaw = lines[idx];
-  const inner = innerRaw.trim();
-  const innerNo = idx + 1;
-  const forRule = opts?.forRule === true;
+  const hostName = host === "ensure" ? "ensure" : isAsync ? "run async" : "run";
+  const hostCol = innerRaw.indexOf(host) + 1;
+  const stepLoc = { line: innerNo, col: hostCol };
 
-  if (inner.startsWith("#")) {
-    return {
-      step: {
-        type: "comment",
-        text: innerRaw.trim(),
-        loc: { line: innerNo, col: 1 },
-      },
-      nextIdx: idx + 1,
-    };
+  if (/\scatch$/.test(hostBody)) {
+    fail(
+      filePath,
+      'catch requires explicit bindings and a body: catch (<name>) { ... }',
+      innerNo,
+      innerRaw.indexOf("catch") + 1,
+    );
+  }
+  if (host === "run" && / recover$/.test(hostBody)) {
+    fail(
+      filePath,
+      'recover requires explicit bindings and a body: recover(<name>) { ... }',
+      innerNo,
+      innerRaw.indexOf("recover") + 1,
+    );
   }
 
-  // if <subject> <op> <operand> { ... }
-  const ifHead = inner.match(
-    /^if\s+([A-Za-z_][A-Za-z0-9_]*)\s+(==|!=|=~|!~)\s+("(?:[^"\\]|\\.)*"|\/(?:[^/\\]|\\.)*\/)\s*\{\s*$/,
-  );
-  if (ifHead) {
-    const subject = ifHead[1];
-    const operator = ifHead[2] as "==" | "!=" | "=~" | "!~";
-    const rawOperand = ifHead[3];
-    const ifLoc = { line: innerNo, col: innerRaw.indexOf("if") + 1 };
-
-    let operand: { kind: "string_literal"; value: string } | { kind: "regex"; source: string };
-    if (rawOperand.startsWith('"')) {
-      operand = { kind: "string_literal", value: rawOperand.slice(1, -1) };
-    } else {
-      operand = { kind: "regex", source: rawOperand.slice(1, -1) };
+  let attached:
+    | { keyword: "catch" | "recover"; left: string; after: string }
+    | null = null;
+  if (host === "run") {
+    const m = hostBody.match(/ recover(?=[\s(])/);
+    if (m) {
+      const pos = m.index!;
+      attached = {
+        keyword: "recover",
+        left: hostBody.slice(0, pos).trim(),
+        after: hostBody.slice(pos + " recover".length),
+      };
     }
-
-    if ((operator === "==" || operator === "!=") && operand.kind === "regex") {
-      fail(filePath, `operator "${operator}" requires a string operand ("..."), not a regex`, innerNo, ifLoc.col);
+  }
+  if (!attached) {
+    const ci = hostBody.indexOf(" catch ");
+    if (ci !== -1) {
+      attached = {
+        keyword: "catch",
+        left: hostBody.slice(0, ci).trim(),
+        after: hostBody.slice(ci + " catch ".length),
+      };
     }
-    if ((operator === "=~" || operator === "!~") && operand.kind === "string_literal") {
-      fail(filePath, `operator "${operator}" requires a regex operand (/pattern/), not a string`, innerNo, ifLoc.col);
+  }
+
+  // `run` falls back to plain parsing when the call before catch/recover has
+  // trailing content, preserving the legacy "unexpected content" error shape.
+  if (attached && host === "run") {
+    const probe = parseCallRef(attached.left);
+    if (!probe || probe.rest.trim()) {
+      attached = null;
     }
+  }
 
-    const { steps: body, nextIdx } = parseBraceBlockBody(filePath, lines, idx + 1, innerNo);
-    return {
-      step: { type: "if", subject, operator, operand, body, loc: ifLoc },
-      nextIdx,
-    };
+  if (!attached) {
+    const call = parseCallRef(hostBody);
+    if (!call) {
+      fail(
+        filePath,
+        `${hostName} must target a valid reference: ${hostName} ref() or ${hostName} ref(args) — parentheses are required`,
+        innerNo,
+      );
+    }
+    rejectTrailingContent(filePath, innerNo, hostName, call.rest);
+    const callee = { value: call.ref, loc: stepLoc };
+    const body: Expr = host === "ensure"
+      ? { kind: "ensure_call", callee, args: call.args }
+      : { kind: "call", callee, args: call.args, ...(isAsync ? { async: true as const } : {}) };
+    return { step: execStep(body, stepLoc, { captureName }), nextIdx: idx + 1 };
   }
-  if (/^if[\s(]/.test(inner)) {
+
+  const call = parseCallRef(attached.left);
+  if (!call) {
     fail(
       filePath,
-      'invalid if syntax; expected: if <identifier> <op> <operand> { ... } where op is ==, !=, =~, or !~ and operand is "string" or /regex/',
+      `${hostName} must target a valid reference: ${hostName} ref() or ${hostName} ref(args) — parentheses are required`,
       innerNo,
-      innerRaw.indexOf("if") + 1,
     );
   }
+  rejectTrailingContent(filePath, innerNo, hostName, call.rest);
+  const callee = { value: call.ref, loc: stepLoc };
+  const body: Expr = host === "ensure"
+    ? { kind: "ensure_call", callee, args: call.args }
+    : { kind: "call", callee, args: call.args, ...(isAsync ? { async: true as const } : {}) };
+
+  const result = parseAttachedBlock(
+    filePath, lines, idx, innerNo, innerRaw, attached.keyword, attached.after, trivia,
+  );
+  const extras = attached.keyword === "catch"
+    ? { captureName, catch: result.body }
+    : { captureName, recover: result.body };
+  return { step: execStep(body, stepLoc, extras), nextIdx: result.nextIdx };
+}
+
+export type BlockCtx = {
+  filePath: string;
+  lines: string[];
+  idx: number;
+  innerRaw: string;
+  inner: string;
+  innerNo: number;
+  trivia: Trivia;
+  forRule: boolean;
+  opts: BlockParseOpts | undefined;
+};
+export type BlockResult = { step: WorkflowStepDef; nextIdx: number };
+export type BlockHandler = (c: BlockCtx) => BlockResult | null;
 
-  // for <iter> in <string-var> { ... }
-  const forHead = inner.match(/^for\s+([A-Za-z_][A-Za-z0-9_]*)\s+in\s+([A-Za-z_][A-Za-z0-9_]*)\s*\{\s*$/);
-  if (forHead) {
-    const iterVar = forHead[1];
-    const sourceVar = forHead[2];
-    const forLoc = { line: innerNo, col: innerRaw.indexOf("for") + 1 };
-    const { steps: body, nextIdx } = parseBraceBlockBody(filePath, lines, idx + 1, innerNo, opts);
+function tryParseIf(c: BlockCtx): BlockResult | null {
+  const ifLoc = { line: c.innerNo, col: c.innerRaw.indexOf("if") + 1 };
+  const m = c.inner.match(
+    /^if\s+([A-Za-z_][A-Za-z0-9_]*(?:\.[A-Za-z_][A-Za-z0-9_]*)?)\s+(==|!=|=~|!~)\s+("(?:[^"\\]|\\.)*"|\/(?:[^/\\]|\\.)*\/)\s*\{\s*$/,
+  );
+  if (!m) {
+    if (/^if[\s(]/.test(c.inner)) {
+      fail(
+        c.filePath,
+        'invalid if syntax; expected: if <identifier> <op> <operand> { ... } where op is ==, !=, =~, or !~ and operand is "string" or /regex/',
+        c.innerNo,
+        ifLoc.col,
+      );
+    }
+    return null;
+  }
+  const subject = m[1];
+  const operator = m[2] as "==" | "!=" | "=~" | "!~";
+  const rawOperand = m[3];
+  const operand: { kind: "string_literal"; value: string } | { kind: "regex"; source: string } =
+    rawOperand.startsWith('"')
+      ? { kind: "string_literal", value: rawOperand.slice(1, -1) }
+      : { kind: "regex", source: rawOperand.slice(1, -1) };
+  if ((operator === "==" || operator === "!=") && operand.kind === "regex") {
+    fail(c.filePath, `operator "${operator}" requires a string operand ("..."), not a regex`, c.innerNo, ifLoc.col);
+  }
+  if ((operator === "=~" || operator === "!~") && operand.kind === "string_literal") {
+    fail(c.filePath, `operator "${operator}" requires a regex operand (/pattern/), not a string`, c.innerNo, ifLoc.col);
+  }
+  const thenResult = parseBraceBlockBody(
+    c.filePath, c.lines, c.idx + 1, c.innerNo, c.trivia, { allowElseTerminator: true },
+  );
+  if (!thenResult.closedWithElse) {
     return {
-      step: { type: "for_lines", iterVar, sourceVar, body, loc: forLoc },
-      nextIdx,
+      step: { type: "if", subject, operator, operand, body: thenResult.steps, loc: ifLoc },
+      nextIdx: thenResult.nextIdx,
     };
   }
-  if (/^for\s/.test(inner)) {
+  const elseLineNo = thenResult.nextIdx; // line number of `} else {` is nextIdx - 1 (0-indexed: thenResult.nextIdx - 1)
+  const elseResult = parseBraceBlockBody(
+    c.filePath, c.lines, thenResult.nextIdx, elseLineNo, c.trivia,
+  );
+  return {
+    step: {
+      type: "if",
+      subject,
+      operator,
+      operand,
+      body: thenResult.steps,
+      elseBody: elseResult.steps,
+      loc: ifLoc,
+    },
+    nextIdx: elseResult.nextIdx,
+  };
+}
+
+function tryParseFor(c: BlockCtx): BlockResult | null {
+  const forLoc = { line: c.innerNo, col: c.innerRaw.indexOf("for") + 1 };
+  const m = c.inner.match(/^for\s+([A-Za-z_][A-Za-z0-9_]*)\s+in\s+([A-Za-z_][A-Za-z0-9_]*)\s*\{\s*$/);
+  if (!m) {
+    if (/^for\s/.test(c.inner)) {
+      fail(
+        c.filePath,
+        'invalid for syntax; expected: for <identifier> in <identifier> { ... }',
+        c.innerNo,
+        forLoc.col,
+      );
+    }
+    return null;
+  }
+  const { steps: body, nextIdx } = parseBraceBlockBody(c.filePath, c.lines, c.idx + 1, c.innerNo, c.trivia, c.opts);
+  return { step: { type: "for_lines", iterVar: m[1], sourceVar: m[2], body, loc: forLoc }, nextIdx };
+}
+
+function tryParseConst(c: BlockCtx): BlockResult | null {
+  const m = c.inner.match(/^const\s+([A-Za-z_][A-Za-z0-9_]*)\s*=\s*(.+)$/s);
+  if (!m) return null;
+  const name = m[1];
+  const rhs = m[2].trim();
+  const { value, nextLineIdx } = parseConstRhs(
+    c.filePath, c.lines, c.idx, rhs, c.innerNo, c.innerRaw.indexOf(rhs) + 1, c.forRule, name, c.trivia,
+  );
+  const nextLine = nextLineIdx > c.idx ? nextLineIdx + 1 : c.idx + 1;
+  return {
+    step: { type: "const", name, value, loc: { line: c.innerNo, col: c.innerRaw.indexOf("const") + 1 } },
+    nextIdx: nextLine,
+  };
+}
+
+function tryParseFail(c: BlockCtx): BlockResult | null {
+  if (!/^fail\s+/.test(c.inner)) return null;
+  const arg = c.inner.slice("fail".length).trimStart();
+  const failCol = c.innerRaw.indexOf("fail") + 1;
+  const stepLoc = { line: c.innerNo, col: failCol };
+  if (arg.startsWith('"""')) {
+    const { body, nextIdx } = consumeTripleQuotedArg(c.filePath, c.lines, c.idx, arg);
+    const raw = tripleQuoteBodyToRaw(dedentTripleQuotedBody(body));
+    const message: Expr = { kind: "literal", raw };
+    c.trivia.setNode(message, { tripleQuoted: true, rawBody: body });
+    return { step: { type: "say", level: "fail", message, loc: stepLoc }, nextIdx };
+  }
+  if (!arg.startsWith('"')) {
+    fail(c.filePath, 'fail must match: fail "<reason>" or fail """..."""', c.innerNo, failCol);
+  }
+  if (!hasUnescapedClosingQuote(arg, 1)) {
+    fail(c.filePath, 'multiline strings use triple quotes: fail """..."""', c.innerNo, failCol);
+  }
+  const closeIdx = indexOfClosingDoubleQuote(arg, 1);
+  if (closeIdx === -1) {
+    fail(c.filePath, "unterminated fail string", c.innerNo, failCol);
+  }
+  const raw = arg.slice(0, closeIdx + 1);
+  return {
+    step: { type: "say", level: "fail", message: { kind: "literal", raw }, loc: stepLoc },
+    nextIdx: c.idx + 1,
+  };
+}
+
+function tryParseWait(c: BlockCtx): BlockResult | null {
+  if (c.inner !== "wait") return null;
+  fail(c.filePath, '"wait" has been removed from the language', c.innerNo, c.innerRaw.indexOf("wait") + 1);
+}
+
+function tryParseEnsure(c: BlockCtx): BlockResult | null {
+  if (!c.inner.startsWith("ensure ")) return null;
+  const ensureBody = c.inner.slice("ensure ".length).trim();
+  return parseRunOrEnsure(
+    c.filePath, c.lines, c.idx, c.innerNo, c.innerRaw, "ensure", ensureBody, false, undefined, c.trivia,
+  );
+}
+
+/**
+ * After `run \`body\`(args)` / `run \`\`\`...\`\`\`(args)`, optionally parse an
+ * attached `catch (...) { ... }` or `recover(...) { ... }` clause. Same
+ * semantics and bindings as named-ref `run`. `recover` and `catch` are
+ * mutually exclusive — when both appear on the same step the leftover
+ * keyword falls through and is rejected with the existing "unexpected
+ * content after anonymous inline script" error.
+ */
+function parseInlineScriptTail(
+  c: BlockCtx,
+  result: { closingLineIdx: number; trailing: string; nextLineIdx: number },
+  body: Expr,
+  stepLoc: { line: number; col: number },
+): BlockResult {
+  const trimmed = result.trailing.trimStart();
+  if (trimmed === "") {
+    return { step: execStep(body, stepLoc), nextIdx: result.nextLineIdx };
+  }
+  const recoverMatch = trimmed.match(/^recover([\s(].*)$/s);
+  const catchMatch = trimmed.match(/^catch(\s.*)$/s);
+  const attached =
+    recoverMatch !== null
+      ? { keyword: "recover" as const, after: recoverMatch[1] }
+      : catchMatch !== null
+        ? { keyword: "catch" as const, after: catchMatch[1] }
+        : null;
+  if (!attached) {
     fail(
-      filePath,
-      'invalid for syntax; expected: for <identifier> in <identifier> { ... }',
-      innerNo,
-      innerRaw.indexOf("for") + 1,
+      c.filePath,
+      `unexpected content after anonymous inline script: '${trimmed}'`,
+      result.closingLineIdx + 1,
+      c.innerRaw.indexOf("run") + 1,
     );
   }
+  const closingRaw = c.lines[result.closingLineIdx]!;
+  const closingNo = result.closingLineIdx + 1;
+  const block = parseAttachedBlock(
+    c.filePath, c.lines, result.closingLineIdx, closingNo, closingRaw,
+    attached.keyword, attached.after, c.trivia,
+  );
+  const extras = attached.keyword === "catch" ? { catch: block.body } : { recover: block.body };
+  return { step: execStep(body, stepLoc, extras), nextIdx: block.nextIdx };
+}
 
-  const constMatch = inner.match(/^const\s+([A-Za-z_][A-Za-z0-9_]*)\s*=\s*(.+)$/s);
-  if (constMatch) {
-    const name = constMatch[1];
-    const rhs = constMatch[2].trim();
-    const { value, nextLineIdx } = parseConstRhs(
-      filePath, lines, idx, rhs, innerNo, innerRaw.indexOf(rhs) + 1, forRule, name,
+function tryParseRun(c: BlockCtx): BlockResult | null {
+  if (!c.inner.startsWith("run ")) return null;
+  const runCol = c.innerRaw.indexOf("run") + 1;
+  if (c.inner.startsWith("run async ")) {
+    const runBody = c.inner.slice("run async ".length).trim();
+    if (runBody.startsWith("`")) {
+      fail(c.filePath, "run async is not supported with inline scripts", c.innerNo, runCol);
+    }
+    return parseRunOrEnsure(
+      c.filePath, c.lines, c.idx, c.innerNo, c.innerRaw, "run", runBody, true, undefined, c.trivia,
     );
-    const nextLine = nextLineIdx > idx ? nextLineIdx + 1 : idx + 1;
-    return {
-      step: { type: "const", name, value, loc: { line: innerNo, col: innerRaw.indexOf("const") + 1 } },
-      nextIdx: nextLine,
+  }
+  const runBody = c.inner.slice("run ".length).trim();
+  if (runBody.startsWith("`")) {
+    const result = parseAnonymousInlineScript(c.filePath, c.lines, c.idx, runBody, c.innerNo, runCol, true);
+    const body: Expr = {
+      kind: "inline_script",
+      body: result.body,
+      ...(result.lang ? { lang: result.lang } : {}),
+      args: result.args,
     };
+    const stepLoc = { line: c.innerNo, col: runCol };
+    return parseInlineScriptTail(c, result, body, stepLoc);
   }
+  if (runBody.startsWith("script(") || runBody.startsWith("script (")) {
+    fail(c.filePath, 'inline script syntax has changed: use run `body`(args) instead of run script(args) "body"', c.innerNo);
+  }
+  return parseRunOrEnsure(
+    c.filePath, c.lines, c.idx, c.innerNo, c.innerRaw, "run", runBody, false, undefined, c.trivia,
+  );
+}
 
-  const failMatch = inner.match(/^fail\s+/);
-  if (failMatch) {
-    const arg = inner.slice("fail".length).trimStart();
-    const failCol = innerRaw.indexOf("fail") + 1;
-    if (arg.startsWith('"""')) {
-      const { body, nextIdx } = consumeTripleQuotedArg(filePath, lines, idx, arg);
-      const message = tripleQuoteBodyToRaw(body);
-      return {
-        step: { type: "fail", message, tripleQuoted: true, loc: { line: innerNo, col: failCol } },
-        nextIdx,
-      };
-    }
-    if (!arg.startsWith('"')) {
-      fail(filePath, 'fail must match: fail "<reason>" or fail """..."""', innerNo, failCol);
-    }
-    if (!hasUnescapedClosingQuote(arg, 1)) {
-      fail(filePath, 'multiline strings use triple quotes: fail """..."""', innerNo, failCol);
-    }
-    const closeIdx = indexOfClosingDoubleQuote(arg, 1);
-    if (closeIdx === -1) {
-      fail(filePath, "unterminated fail string", innerNo, failCol);
-    }
-    const message = arg.slice(0, closeIdx + 1);
-    return {
-      step: { type: "fail", message, loc: { line: innerNo, col: failCol } },
-      nextIdx: idx + 1,
+function tryParsePrompt(c: BlockCtx): BlockResult | null {
+  if (!c.inner.startsWith("prompt ")) return null;
+  const promptCol = c.innerRaw.indexOf("prompt") + 1;
+  const promptArg = c.innerRaw.slice(c.innerRaw.indexOf("prompt") + "prompt".length).trimStart();
+  const result = parsePromptStep(c.filePath, c.lines, c.idx, promptArg, promptCol, undefined, c.trivia);
+  return { step: result.step, nextIdx: result.nextLineIdx + 1 };
+}
+
+function parseSayBody(
+  c: BlockCtx,
+  level: "log" | "logerr",
+): BlockResult {
+  const arg = c.inner.slice(level.length).trimStart();
+  const col = c.innerRaw.indexOf(level) + 1;
+  const stepLoc = { line: c.innerNo, col };
+  if (arg.startsWith("run ") && arg.slice("run ".length).trimStart().startsWith("`")) {
+    const runBody = arg.slice("run ".length).trim();
+    const result = parseAnonymousInlineScript(c.filePath, c.lines, c.idx, runBody, c.innerNo, col);
+    const message: Expr = {
+      kind: "inline_script",
+      body: result.body,
+      ...(result.lang ? { lang: result.lang } : {}),
+      args: result.args,
     };
+    return { step: { type: "say", level, message, loc: stepLoc }, nextIdx: result.nextLineIdx };
   }
-
-  if (inner === "wait") {
-    fail(filePath, '"wait" has been removed from the language', innerNo, innerRaw.indexOf("wait") + 1);
+  if (arg.startsWith("`") || arg.startsWith("```")) {
+    fail(c.filePath, `bare inline scripts in ${level} are not allowed; use "${level} run \`...\`()" to execute a managed inline script`, c.innerNo, col);
   }
-
-  if (inner.startsWith("ensure ")) {
-    const ensureBody = inner.slice("ensure ".length).trim();
-    const r = parseEnsureStep(
-      filePath, lines, idx, innerNo, innerRaw,
-      ensureBody,
-    );
-    return { step: r.step, nextIdx: r.nextIdx + 1 };
+  if (arg.startsWith('"""')) {
+    const { body, nextIdx } = consumeTripleQuotedArg(c.filePath, c.lines, c.idx, arg);
+    const raw = dedentTripleQuotedBody(body);
+    const message: Expr = { kind: "literal", raw };
+    c.trivia.setNode(message, { tripleQuoted: true, rawBody: body });
+    return { step: { type: "say", level, message, loc: stepLoc }, nextIdx };
   }
+  if (arg.startsWith('"') && !hasUnescapedClosingQuote(arg, 1)) {
+    fail(c.filePath, `multiline strings use triple quotes: ${level} """..."""`, c.innerNo, col);
+  }
+  const messageRaw = parseLogMessageRhs(c.filePath, c.innerNo, col, arg, level);
+  return {
+    step: { type: "say", level, message: { kind: "literal", raw: messageRaw }, loc: stepLoc },
+    nextIdx: c.idx + 1,
+  };
+}
+
+function tryParseLog(c: BlockCtx): BlockResult | null {
+  if (!c.inner.startsWith("log ") && c.inner !== "log") return null;
+  return parseSayBody(c, "log");
+}
+
+function tryParseLogerr(c: BlockCtx): BlockResult | null {
+  if (!c.inner.startsWith("logerr ") && c.inner !== "logerr") return null;
+  return parseSayBody(c, "logerr");
+}
 
-  if (inner.startsWith("run async ")) {
-    const runBody = inner.slice("run async ".length).trim();
+function tryParseReturn(c: BlockCtx): BlockResult | null {
+  const retLoc = { line: c.innerNo, col: c.innerRaw.indexOf("return") + 1 };
+  if (c.inner.trim() === "return") {
+    return {
+      step: { type: "return", value: { kind: "literal", raw: '""' }, loc: retLoc },
+      nextIdx: c.idx + 1,
+    };
+  }
+  const m = c.inner.match(/^return\s+(.+)$/s);
+  if (!m) return null;
+  const returnValue = m[1].trim();
+  if (returnValue.startsWith('"""')) {
+    const { body, nextIdx } = consumeTripleQuotedArg(c.filePath, c.lines, c.idx, returnValue);
+    const value: Expr = { kind: "literal", raw: tripleQuoteBodyToRaw(dedentTripleQuotedBody(body)) };
+    c.trivia.setNode(value, { tripleQuoted: true, rawBody: body });
+    return { step: { type: "return", value, loc: retLoc }, nextIdx };
+  }
+  const matchHead = returnValue.match(/^match\s+(.+?)\s*\{\s*$/);
+  if (matchHead) {
+    const { expr, nextIndex } = parseMatchExpr(c.filePath, c.lines, c.idx, matchHead[1].trim(), retLoc);
+    return { step: { type: "return", value: { kind: "match", match: expr }, loc: retLoc }, nextIdx: nextIndex };
+  }
+  if (returnValue.startsWith("run ")) {
+    const runBody = returnValue.slice("run ".length).trim();
     if (runBody.startsWith("`")) {
-      fail(filePath, "run async is not supported with inline scripts", innerNo, innerRaw.indexOf("run") + 1);
-    }
-    // run async ... recover(name) { ... }
-    const recoverResult = parseRunRecoverStep(filePath, lines, idx, innerNo, innerRaw, runBody);
-    if (recoverResult && recoverResult.step.type === "run") {
-      return {
-        step: { ...recoverResult.step, async: true },
-        nextIdx: recoverResult.nextIdx + 1,
+      const result = parseAnonymousInlineScript(c.filePath, c.lines, c.idx, runBody, c.innerNo, c.innerRaw.indexOf("run") + 1);
+      const value: Expr = {
+        kind: "inline_script",
+        body: result.body,
+        ...(result.lang ? { lang: result.lang } : {}),
+        args: result.args,
       };
+      return { step: { type: "return", value, loc: retLoc }, nextIdx: result.nextLineIdx };
     }
-    // run async ... catch(name) { ... }
-    const catchResult = parseRunCatchStep(filePath, lines, idx, innerNo, innerRaw, runBody);
-    if (catchResult && catchResult.step.type === "run") {
+    const call = parseCallRef(runBody);
+    if (call) {
+      rejectTrailingContent(c.filePath, c.innerNo, "run", call.rest);
+      const callee = { value: call.ref, loc: retLoc };
       return {
-        step: { ...catchResult.step, async: true },
-        nextIdx: catchResult.nextIdx + 1,
+        step: { type: "return", value: { kind: "call", callee, args: call.args }, loc: retLoc },
+        nextIdx: c.idx + 1,
       };
     }
-    const call = parseCallRef(runBody);
-    if (!call) {
-      fail(filePath, "run async must target a valid reference: run async ref() or run async ref(args) — parentheses are required", innerNo);
-    }
-    rejectTrailingContent(filePath, innerNo, "run async", call.rest);
-    return {
-      step: {
-        type: "run",
-        workflow: {
-          value: call.ref,
-          loc: { line: innerNo, col: innerRaw.indexOf("run") + 1 },
-        },
-        args: call.args,
-        ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-        async: true,
-      },
-      nextIdx: idx + 1,
-    };
   }
-
-  if (inner.startsWith("run ")) {
-    const runBody = inner.slice("run ".length).trim();
-    if (runBody.startsWith("`")) {
-      const result = parseAnonymousInlineScript(filePath, lines, idx, runBody, innerNo, innerRaw.indexOf("run") + 1);
+  if (returnValue.startsWith("ensure ")) {
+    const call = parseCallRef(returnValue.slice("ensure ".length).trim());
+    if (call) {
+      rejectTrailingContent(c.filePath, c.innerNo, "ensure", call.rest);
+      const callee = { value: call.ref, loc: retLoc };
       return {
-        step: {
-          type: "run_inline_script",
-          body: result.body,
-          ...(result.lang ? { lang: result.lang } : {}),
-          args: result.args,
-          ...(result.bareIdentifierArgs ? { bareIdentifierArgs: result.bareIdentifierArgs } : {}),
-          loc: { line: innerNo, col: innerRaw.indexOf("run") + 1 },
-        },
-        nextIdx: result.nextLineIdx,
+        step: { type: "return", value: { kind: "ensure_call", callee, args: call.args }, loc: retLoc },
+        nextIdx: c.idx + 1,
       };
     }
-    if (runBody.startsWith("script(") || runBody.startsWith("script (")) {
-      fail(filePath, 'inline script syntax has changed: use run `body`(args) instead of run script(args) "body"', innerNo);
-    }
-    // Check for run ... recover (loop semantics)
-    const recoverResult = parseRunRecoverStep(filePath, lines, idx, innerNo, innerRaw, runBody);
-    if (recoverResult) {
-      return { step: recoverResult.step, nextIdx: recoverResult.nextIdx + 1 };
-    }
-    // Check for run ... catch
-    const catchResult = parseRunCatchStep(filePath, lines, idx, innerNo, innerRaw, runBody);
-    if (catchResult) {
-      return { step: catchResult.step, nextIdx: catchResult.nextIdx + 1 };
-    }
-    const call = parseCallRef(runBody);
-    if (!call) {
-      fail(filePath, "run must target a valid reference: run ref() or run ref(args) — parentheses are required", innerNo);
-    }
-    rejectTrailingContent(filePath, innerNo, "run", call.rest);
-    return {
-      step: {
-        type: "run",
-        workflow: {
-          value: call.ref,
-          loc: { line: innerNo, col: innerRaw.indexOf("run") + 1 },
-        },
-        args: call.args,
-        ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-      },
-      nextIdx: idx + 1,
-    };
   }
+  if (returnValue.startsWith("`") || returnValue.startsWith("```")) {
+    fail(c.filePath, 'bare inline scripts in return are not allowed; use "return run `...`()" to execute a managed inline script', c.innerNo, retLoc.col);
+  }
+  if (returnValue.startsWith("'")) {
+    fail(c.filePath, 'single-quoted strings are not supported; use double quotes ("...") instead', c.innerNo, retLoc.col);
+  }
+  if (/^[0-9]+$/.test(returnValue) || returnValue === "$?") {
+    fail(
+      c.filePath,
+      'bash exit codes are only valid in scripts; use return "..." for a workflow value',
+      c.innerNo,
+      retLoc.col,
+    );
+  }
+  if (
+    returnValue.startsWith('"') ||
+    returnValue.startsWith("$") ||
+    isBareDottedIdentifierReturn(returnValue) ||
+    isBareIdentifierReturn(returnValue)
+  ) {
+    if (returnValue.startsWith('"') && !hasUnescapedClosingQuote(returnValue, 1)) {
+      fail(c.filePath, 'multiline strings use triple quotes: return """..."""', c.innerNo, retLoc.col);
+    }
+    const isBareDotted = isBareDottedIdentifierReturn(returnValue);
+    const isBare = !isBareDotted && isBareIdentifierReturn(returnValue);
+    const raw = isBareDotted
+      ? dottedReturnToQuotedString(returnValue)
+      : isBare
+        ? bareIdentifierToQuotedString(returnValue)
+        : returnValue;
+    const value: Expr = { kind: "literal", raw };
+    if (isBareDotted || isBare) {
+      c.trivia.setNode(value, { bareSource: returnValue.trim() });
+    }
+    return { step: { type: "return", value, loc: retLoc }, nextIdx: c.idx + 1 };
+  }
+  return null;
+}
 
-  if (forRule && (inner.startsWith("prompt ") || /^[A-Za-z_][A-Za-z0-9_]*\s*=\s*prompt\s/.test(inner))) {
-    fail(filePath, "prompt is not allowed in rules", innerNo, colFromRaw(innerRaw));
+function tryParseElseError(c: BlockCtx): BlockResult | null {
+  const elseCol = c.innerRaw.indexOf("else") + 1;
+  if (/^else\s+if\b/.test(c.inner)) {
+    fail(
+      c.filePath,
+      '"else if" chaining is not supported; nest an "if" inside the "else" block, or use "match" for multi-way branching',
+      c.innerNo,
+      elseCol,
+    );
   }
+  fail(
+    c.filePath,
+    '"else" must appear on the same line as the closing "}" of an "if" block (e.g., "} else {")',
+    c.innerNo,
+    elseCol,
+  );
+}
 
-  const promptAssignMatch = inner.match(/^([A-Za-z_][A-Za-z0-9_]*)\s*=\s*prompt\s+(.+)$/s);
-  if (promptAssignMatch) {
+function tryParseStandaloneMatch(c: BlockCtx): BlockResult | null {
+  const m = c.inner.match(/^match\s+(.+?)\s*\{\s*$/);
+  if (!m) return null;
+  const subject = m[1].trim();
+  const matchLoc = { line: c.innerNo, col: c.innerRaw.indexOf("match") + 1 };
+  const { expr, nextIndex } = parseMatchExpr(c.filePath, c.lines, c.idx, subject, matchLoc);
+  return { step: execStep({ kind: "match", match: expr }, matchLoc), nextIdx: nextIndex };
+}
+
+/**
+ * STATEMENT dispatch table keyed by the leading keyword. Handlers fire only
+ * when the first token matches the key; each handler either returns a step
+ * (terminating), calls `fail(...)` (also terminating), or returns null to
+ * allow fallthrough to send / shell handling.
+ *
+ * To add a new top-level keyword, add (a) a row here pointing at the parser
+ * and (b) the keyword to the JAIPH_KEYWORDS set in `core.ts`. No other file
+ * needs to change.
+ */
+export const STATEMENT: Record<string, BlockHandler> = {
+  if: tryParseIf,
+  else: tryParseElseError,
+  for: tryParseFor,
+  const: tryParseConst,
+  fail: tryParseFail,
+  wait: tryParseWait,
+  ensure: tryParseEnsure,
+  run: tryParseRun,
+  prompt: tryParsePrompt,
+  log: tryParseLog,
+  logerr: tryParseLogerr,
+  return: tryParseReturn,
+  match: tryParseStandaloneMatch,
+};
+
+/** Error guards for assignment-shape lines. Emit a fail() or no-op; never return a step. */
+function applyAssignmentGuards(c: BlockCtx): void {
+  if (c.forRule && (c.inner.startsWith("prompt ") || /^[A-Za-z_][A-Za-z0-9_]*\s*=\s*prompt\s/.test(c.inner))) {
+    fail(c.filePath, "prompt is not allowed in rules", c.innerNo, colFromRaw(c.innerRaw));
+  }
+  const promptAssign = c.inner.match(/^([A-Za-z_][A-Za-z0-9_]*)\s*=\s*prompt\s+(.+)$/s);
+  if (promptAssign) {
     fail(
-      filePath,
+      c.filePath,
       'use "const name = prompt ..." to capture the prompt result (e.g. const answer = prompt "..." )',
-      innerNo,
-      innerRaw.indexOf(promptAssignMatch[1]) + 1,
+      c.innerNo,
+      c.innerRaw.indexOf(promptAssign[1]) + 1,
     );
   }
-  if (inner.startsWith("prompt ")) {
-    const promptCol = innerRaw.indexOf("prompt") + 1;
-    const promptArg = innerRaw.slice(innerRaw.indexOf("prompt") + "prompt".length).trimStart();
-    const result = parsePromptStep(filePath, lines, idx, promptArg, promptCol);
-    return { step: result.step, nextIdx: result.nextLineIdx + 1 };
-  }
-
-  const genericAssignMatch = inner.match(/^([A-Za-z_][A-Za-z0-9_]*)\s+=\s*(.+)$/s);
+  const generic = c.inner.match(/^([A-Za-z_][A-Za-z0-9_]*)\s+=\s*(.+)$/s);
   if (
-    genericAssignMatch &&
-    !genericAssignMatch[2].trimStart().startsWith("prompt ") &&
-    !genericAssignMatch[2].trimStart().startsWith('"') &&
-    !genericAssignMatch[2].trimStart().startsWith("$")
+    generic &&
+    !generic[2].trimStart().startsWith("prompt ") &&
+    !generic[2].trimStart().startsWith('"') &&
+    !generic[2].trimStart().startsWith("$")
   ) {
-    const captureName = genericAssignMatch[1];
-    const rest = genericAssignMatch[2].trim();
+    const captureName = generic[1];
+    const rest = generic[2].trim();
     if (rest.startsWith("run ") || rest.startsWith("ensure ")) {
       fail(
-        filePath,
+        c.filePath,
         `assignment without "const" is no longer supported; use "const ${captureName} = ${rest}"`,
-        innerNo,
-        innerRaw.indexOf(captureName) + 1,
+        c.innerNo,
+        c.innerRaw.indexOf(captureName) + 1,
       );
     }
   }
+}
 
-  if (inner.startsWith("log ") || inner === "log") {
-    const logArg = inner.slice("log".length).trimStart();
-    const logCol = innerRaw.indexOf("log") + 1;
-    if (logArg.startsWith("run ") && logArg.slice("run ".length).trimStart().startsWith("`")) {
-      const runBody = logArg.slice("run ".length).trim();
-      const result = parseAnonymousInlineScript(filePath, lines, idx, runBody, innerNo, logCol);
-      return {
-        step: {
-          type: "log",
-          message: "",
-          loc: { line: innerNo, col: logCol },
-          managed: {
-            kind: "run_inline_script",
-            body: result.body,
-            ...(result.lang ? { lang: result.lang } : {}),
-            args: result.args,
-            ...(result.bareIdentifierArgs ? { bareIdentifierArgs: result.bareIdentifierArgs } : {}),
-          },
-        },
-        nextIdx: result.nextLineIdx,
-      };
-    }
-    if (logArg.startsWith("`") || logArg.startsWith("```")) {
-      fail(filePath, 'bare inline scripts in log are not allowed; use "log run `...`()" to execute a managed inline script', innerNo, logCol);
-    }
-    if (logArg.startsWith('"""')) {
-      const { body, nextIdx } = consumeTripleQuotedArg(filePath, lines, idx, logArg);
-      return { step: { type: "log", message: body, tripleQuoted: true, loc: { line: innerNo, col: logCol } }, nextIdx };
-    }
-    if (logArg.startsWith('"') && !hasUnescapedClosingQuote(logArg, 1)) {
-      fail(filePath, 'multiline strings use triple quotes: log """..."""', innerNo, logCol);
-    }
-    const message = parseLogMessageRhs(filePath, innerNo, logCol, logArg, "log");
-    return { step: { type: "log", message, loc: { line: innerNo, col: logCol } }, nextIdx: idx + 1 };
+function trySend(c: BlockCtx): BlockResult | null {
+  const sendMatch = matchSendOperator(c.inner);
+  if (!sendMatch) return null;
+  if (c.forRule) {
+    fail(c.filePath, "send operator is not allowed in rules", c.innerNo, 1);
   }
+  const arrowIdx = c.inner.indexOf("<-");
+  const rhsCol = arrowIdx >= 0 ? arrowIdx + 3 : 1;
+  const { value, nextIdx } = parseSendRhs(
+    c.filePath, sendMatch.rhsText, c.innerNo, rhsCol, c.lines, c.idx, c.trivia,
+  );
+  return {
+    step: { type: "send", channel: sendMatch.channel, value, loc: { line: c.innerNo, col: 1 } },
+    nextIdx,
+  };
+}
 
-  if (inner.startsWith("logerr ") || inner === "logerr") {
-    const logerrArg = inner.slice("logerr".length).trimStart();
-    const logerrCol = innerRaw.indexOf("logerr") + 1;
-    if (logerrArg.startsWith("run ") && logerrArg.slice("run ".length).trimStart().startsWith("`")) {
-      const runBody = logerrArg.slice("run ".length).trim();
-      const result = parseAnonymousInlineScript(filePath, lines, idx, runBody, innerNo, logerrCol);
-      return {
-        step: {
-          type: "logerr",
-          message: "",
-          loc: { line: innerNo, col: logerrCol },
-          managed: {
-            kind: "run_inline_script",
-            body: result.body,
-            ...(result.lang ? { lang: result.lang } : {}),
-            args: result.args,
-            ...(result.bareIdentifierArgs ? { bareIdentifierArgs: result.bareIdentifierArgs } : {}),
-          },
-        },
-        nextIdx: result.nextLineIdx,
-      };
-    }
-    if (logerrArg.startsWith("`") || logerrArg.startsWith("```")) {
-      fail(filePath, 'bare inline scripts in logerr are not allowed; use "logerr run `...`()" to execute a managed inline script', innerNo, logerrCol);
-    }
-    if (logerrArg.startsWith('"""')) {
-      const { body, nextIdx } = consumeTripleQuotedArg(filePath, lines, idx, logerrArg);
-      return { step: { type: "logerr", message: body, tripleQuoted: true, loc: { line: innerNo, col: logerrCol } }, nextIdx };
-    }
-    if (logerrArg.startsWith('"') && !hasUnescapedClosingQuote(logerrArg, 1)) {
-      fail(filePath, 'multiline strings use triple quotes: logerr """..."""', innerNo, logerrCol);
-    }
-    const message = parseLogMessageRhs(filePath, innerNo, logerrCol, logerrArg, "logerr");
-    return { step: { type: "logerr", message, loc: { line: innerNo, col: logerrCol } }, nextIdx: idx + 1 };
-  }
+function shellFallthrough(c: BlockCtx): BlockResult {
+  const loc = { line: c.innerNo, col: colFromRaw(c.innerRaw) };
+  return { step: execStep({ kind: "shell", command: c.inner, loc }, loc), nextIdx: c.idx + 1 };
+}
 
-  if (inner.trim() === "return") {
+/**
+ * One workflow statement inside `{ … }` (catch body, etc.).
+ *
+ * Dispatches by leading keyword through `STATEMENT`; falls through to send /
+ * shell for non-keyword lines.
+ */
+export function parseBlockStatement(
+  filePath: string,
+  lines: string[],
+  idx: number,
+  trivia: Trivia = createTrivia(),
+  opts?: BlockParseOpts,
+): { step: WorkflowStepDef; nextIdx: number } {
+  const innerRaw = lines[idx];
+  const inner = innerRaw.trim();
+  const innerNo = idx + 1;
+  const c: BlockCtx = {
+    filePath, lines, idx, innerRaw, inner, innerNo, trivia,
+    forRule: opts?.forRule === true, opts,
+  };
+
+  if (inner.startsWith("#")) {
     return {
-      step: {
-        type: "return",
-        value: '""',
-        loc: { line: innerNo, col: innerRaw.indexOf("return") + 1 },
-      },
+      step: { type: "trivia", kind: "comment", text: innerRaw.trim(), loc: { line: innerNo, col: 1 } },
       nextIdx: idx + 1,
     };
   }
 
-  const returnMatch = inner.match(/^return\s+(.+)$/s);
-  if (returnMatch) {
-    const returnValue = returnMatch[1].trim();
-    const retLoc = { line: innerNo, col: innerRaw.indexOf("return") + 1 };
-    // return """..."""
-    if (returnValue.startsWith('"""')) {
-      const { body, nextIdx } = consumeTripleQuotedArg(filePath, lines, idx, returnValue);
-      return {
-        step: { type: "return", value: tripleQuoteBodyToRaw(body), tripleQuoted: true, loc: retLoc },
-        nextIdx,
-      };
-    }
-    // return match var { ... }
-    const returnMatchHead = returnValue.match(/^match\s+(.+?)\s*\{\s*$/);
-    if (returnMatchHead) {
-      const subject = returnMatchHead[1].trim();
-      const { expr, nextIndex } = parseMatchExpr(filePath, lines, idx, subject, retLoc);
-      return {
-        step: {
-          type: "return",
-          value: `__match__`,
-          loc: retLoc,
-          managed: { kind: "match", match: expr },
-        },
-        nextIdx: nextIndex,
-      };
-    }
-    if (returnValue.startsWith("run ")) {
-      const runBody = returnValue.slice("run ".length).trim();
-      if (runBody.startsWith("`")) {
-        const result = parseAnonymousInlineScript(filePath, lines, idx, runBody, innerNo, innerRaw.indexOf("run") + 1);
-        return {
-          step: {
-            type: "return",
-            value: `run inline_script`,
-            loc: retLoc,
-            managed: {
-              kind: "run_inline_script",
-              body: result.body,
-              ...(result.lang ? { lang: result.lang } : {}),
-              args: result.args,
-              ...(result.bareIdentifierArgs ? { bareIdentifierArgs: result.bareIdentifierArgs } : {}),
-            },
-          },
-          nextIdx: result.nextLineIdx,
-        };
-      }
-      const call = parseCallRef(runBody);
-      if (call) {
-        rejectTrailingContent(filePath, innerNo, "run", call.rest);
-        return {
-          step: {
-            type: "return",
-            value: `run ${call.ref}(${call.args ?? ""})`,
-            loc: retLoc,
-            managed: {
-              kind: "run", ref: { value: call.ref, loc: retLoc }, args: call.args,
-              ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-            },
-          },
-          nextIdx: idx + 1,
-        };
-      }
-    }
-    if (returnValue.startsWith("ensure ")) {
-      const call = parseCallRef(returnValue.slice("ensure ".length).trim());
-      if (call) {
-        rejectTrailingContent(filePath, innerNo, "ensure", call.rest);
-        return {
-          step: {
-            type: "return",
-            value: `ensure ${call.ref}(${call.args ?? ""})`,
-            loc: retLoc,
-            managed: {
-              kind: "ensure", ref: { value: call.ref, loc: retLoc }, args: call.args,
-              ...(call.bareIdentifierArgs ? { bareIdentifierArgs: call.bareIdentifierArgs } : {}),
-            },
-          },
-          nextIdx: idx + 1,
-        };
-      }
-    }
-    if (returnValue.startsWith("`") || returnValue.startsWith("```")) {
-      fail(filePath, 'bare inline scripts in return are not allowed; use "return run `...`()" to execute a managed inline script', innerNo, retLoc.col);
-    }
-    if (returnValue.startsWith("'")) {
-      fail(filePath, 'single-quoted strings are not supported; use double quotes ("...") instead', innerNo, retLoc.col);
-    }
-    if (/^[0-9]+$/.test(returnValue) || returnValue === "$?") {
-      fail(
-        filePath,
-        'bash exit codes are only valid in scripts; use return "..." for a workflow value',
-        innerNo,
-        retLoc.col,
-      );
-    }
-    if (
-      returnValue.startsWith('"') ||
-      returnValue.startsWith("$") ||
-      isBareDottedIdentifierReturn(returnValue) ||
-      isBareIdentifierReturn(returnValue)
-    ) {
-      // Reject multiline "..."
-      if (returnValue.startsWith('"') && !hasUnescapedClosingQuote(returnValue, 1)) {
-        fail(filePath, 'multiline strings use triple quotes: return """..."""', innerNo, retLoc.col);
-      }
-      const isBareDotted = isBareDottedIdentifierReturn(returnValue);
-      const isBare = !isBareDotted && isBareIdentifierReturn(returnValue);
-      const value = isBareDotted
-        ? dottedReturnToQuotedString(returnValue)
-        : isBare
-          ? bareIdentifierToQuotedString(returnValue)
-          : returnValue;
-      return {
-        step: {
-          type: "return",
-          value,
-          loc: retLoc,
-          ...(isBareDotted || isBare ? { bareSource: returnValue.trim() } : {}),
-        },
-        nextIdx: idx + 1,
-      };
-    }
-  }
-
-  // Standalone match statement: match <subject> { ... }
-  const standaloneMatchHead = inner.match(/^match\s+(.+?)\s*\{\s*$/);
-  if (standaloneMatchHead) {
-    const subject = standaloneMatchHead[1].trim();
-    const matchLoc = { line: innerNo, col: innerRaw.indexOf("match") + 1 };
-    const { expr, nextIndex } = parseMatchExpr(filePath, lines, idx, subject, matchLoc);
-    return {
-      step: { type: "match", expr },
-      nextIdx: nextIndex,
-    };
-  }
+  applyAssignmentGuards(c);
 
-  const sendMatch = matchSendOperator(inner);
-  if (sendMatch) {
-    if (forRule) {
-      fail(filePath, "send operator is not allowed in rules", innerNo, 1);
+  const keyword = inner.match(/^([A-Za-z_][A-Za-z0-9_]*)/)?.[1];
+  if (keyword) {
+    const handler = STATEMENT[keyword];
+    if (handler) {
+      const result = handler(c);
+      if (result) return result;
     }
-    const arrowIdx = inner.indexOf("<-");
-    const rhsCol = arrowIdx >= 0 ? arrowIdx + 3 : 1;
-    const { rhs, nextIdx: sendNextIdx } = parseSendRhs(filePath, sendMatch.rhsText, innerNo, rhsCol, lines, idx);
-    return {
-      step: {
-        type: "send",
-        channel: sendMatch.channel,
-        rhs,
-        loc: { line: innerNo, col: 1 },
-      },
-      nextIdx: sendNextIdx,
-    };
   }
 
-  return {
-    step: {
-      type: "shell",
-      command: inner,
-      loc: { line: innerNo, col: colFromRaw(innerRaw) },
-    },
-    nextIdx: idx + 1,
-  };
+  return trySend(c) ?? shellFallthrough(c);
 }
diff --git a/src/parse/workflows.ts b/src/parse/workflows.ts
index 3ec9156f..341afbd4 100644
--- a/src/parse/workflows.ts
+++ b/src/parse/workflows.ts
@@ -1,4 +1,5 @@
 import type { WorkflowDef } from "../types";
+import { createTrivia, type Trivia } from "./trivia";
 import { fail, parseParamList } from "./core";
 import { parseBraceBlockBody } from "./workflow-brace";
 
@@ -7,6 +8,7 @@ export function parseWorkflowBlock(
   lines: string[],
   startIndex: number,
   pendingComments: string[],
+  trivia: Trivia = createTrivia(),
 ): { workflow: WorkflowDef; nextIndex: number; exported: boolean } {
   const lineNo = startIndex + 1;
   const rawDecl = lines[startIndex];
@@ -58,6 +60,7 @@ export function parseWorkflowBlock(
     lines,
     startIndex + 1,
     lineNo,
+    trivia,
     {
       forRule: false,
       preserveBlankLines: true,
@@ -76,8 +79,14 @@ export function parseWorkflowBlock(
     },
   );
   workflow.steps.push(...bodySteps);
-  // Strip trailing blank_line (whitespace before closing brace).
-  while (workflow.steps.length > 0 && workflow.steps[workflow.steps.length - 1].type === "blank_line") {
+  // Strip trailing blank_line trivia (whitespace before closing brace).
+  while (
+    workflow.steps.length > 0 &&
+    (() => {
+      const last = workflow.steps[workflow.steps.length - 1];
+      return last.type === "trivia" && last.kind === "blank_line";
+    })()
+  ) {
     workflow.steps.pop();
   }
   return { workflow, nextIndex: afterClose, exported: isExported };
diff --git a/src/parser.ts b/src/parser.ts
index 15696835..bc3379d1 100644
--- a/src/parser.ts
+++ b/src/parser.ts
@@ -1,4 +1,5 @@
-import { jaiphModule } from "./types";
+import { jaiphModule, TopLevelEmitOrder } from "./types";
+import { Trivia, createTrivia } from "./parse/trivia";
 import { fail } from "./parse/core";
 import { parseChannelLine } from "./parse/channels";
 import { parseEnvDecl } from "./parse/env";
@@ -9,7 +10,17 @@ import { parseScriptBlock } from "./parse/scripts";
 import { parseWorkflowBlock } from "./parse/workflows";
 import { parseTestBlock } from "./parse/tests";
 
+export interface ParseResult {
+  ast: jaiphModule;
+  trivia: Trivia;
+}
+
 export function parsejaiph(source: string, filePath: string): jaiphModule {
+  return parsejaiphWithTrivia(source, filePath).ast;
+}
+
+export function parsejaiphWithTrivia(source: string, filePath: string): ParseResult {
+  const trivia = createTrivia();
   const lines = source.split(/\r?\n/);
   const mod: jaiphModule = {
     filePath,
@@ -19,8 +30,8 @@ export function parsejaiph(source: string, filePath: string): jaiphModule {
     rules: [],
     scripts: [],
     workflows: [],
-    topLevelOrder: [],
   };
+  const topLevelOrder: TopLevelEmitOrder[] = [];
   let i = 0;
   let pendingTopLevelComments: string[] = [];
 
@@ -48,10 +59,10 @@ export function parsejaiph(source: string, filePath: string): jaiphModule {
         fail(filePath, "duplicate config block (only one allowed per file)", lineNo, 1);
       }
       if (pendingTopLevelComments.length > 0) {
-        mod.configLeadingComments = [...pendingTopLevelComments];
+        trivia.setModule({ configLeadingComments: [...pendingTopLevelComments] });
         pendingTopLevelComments = [];
       }
-      const { metadata, nextIndex } = parseConfigBlock(filePath, lines, i - 1);
+      const { metadata, nextIndex } = parseConfigBlock(filePath, lines, i - 1, trivia);
       mod.metadata = metadata;
       i = nextIndex;
       continue;
@@ -60,7 +71,7 @@ export function parsejaiph(source: string, filePath: string): jaiphModule {
     if (line.startsWith("import script ")) {
       const si = parseScriptImportLine(filePath, line, raw, lineNo);
       if (pendingTopLevelComments.length > 0) {
-        si.leadingComments = [...pendingTopLevelComments];
+        trivia.setNode(si, { leadingComments: [...pendingTopLevelComments] });
         pendingTopLevelComments = [];
       }
       if (!mod.scriptImports) mod.scriptImports = [];
@@ -71,7 +82,7 @@ export function parsejaiph(source: string, filePath: string): jaiphModule {
     if (line.startsWith("import ")) {
       const imp = parseImportLine(filePath, line, raw, lineNo);
       if (pendingTopLevelComments.length > 0) {
-        imp.leadingComments = [...pendingTopLevelComments];
+        trivia.setNode(imp, { leadingComments: [...pendingTopLevelComments] });
         pendingTopLevelComments = [];
       }
       mod.imports.push(imp);
@@ -81,7 +92,7 @@ export function parsejaiph(source: string, filePath: string): jaiphModule {
     if (line.startsWith("channel ")) {
       const ch = parseChannelLine(filePath, line, raw, lineNo);
       if (pendingTopLevelComments.length > 0) {
-        ch.leadingComments = [...pendingTopLevelComments];
+        trivia.setNode(ch, { leadingComments: [...pendingTopLevelComments] });
         pendingTopLevelComments = [];
       }
       mod.channels.push(ch);
@@ -99,11 +110,14 @@ export function parsejaiph(source: string, filePath: string): jaiphModule {
         filePath,
         lines,
         i - 1,
-        pendingTopLevelComments.length > 0 ? [...pendingTopLevelComments] : undefined,
+        trivia,
       );
+      if (pendingTopLevelComments.length > 0) {
+        trivia.setNode(testBlock, { leadingComments: [...pendingTopLevelComments] });
+      }
       pendingTopLevelComments = [];
       mod.tests.push(testBlock);
-      mod.topLevelOrder!.push({ kind: "test", index: mod.tests.length - 1 });
+      topLevelOrder.push({ kind: "test", index: mod.tests.length - 1 });
       i = nextIndex;
       continue;
     }
@@ -118,43 +132,43 @@ export function parsejaiph(source: string, filePath: string): jaiphModule {
         mod.envDecls = [];
       }
       mod.envDecls.push(envDecl);
-      mod.topLevelOrder!.push({ kind: "env", index: mod.envDecls.length - 1 });
+      topLevelOrder.push({ kind: "env", index: mod.envDecls.length - 1 });
       i = nextIndex;
       continue;
     }
 
     if (/^(export\s+)?rule\s/.test(line)) {
-      const { rule, nextIndex, exported } = parseRuleBlock(filePath, lines, i - 1, pendingTopLevelComments);
+      const { rule, nextIndex, exported } = parseRuleBlock(filePath, lines, i - 1, pendingTopLevelComments, trivia);
       pendingTopLevelComments = [];
       if (exported) {
         mod.exports.push(rule.name);
       }
       mod.rules.push(rule);
-      mod.topLevelOrder!.push({ kind: "rule", index: mod.rules.length - 1 });
+      topLevelOrder.push({ kind: "rule", index: mod.rules.length - 1 });
       i = nextIndex;
       continue;
     }
 
     if (/^(export\s+)?script\s/.test(line)) {
-      const { scriptDef, nextIndex, exported } = parseScriptBlock(filePath, lines, i - 1, pendingTopLevelComments);
+      const { scriptDef, nextIndex, exported } = parseScriptBlock(filePath, lines, i - 1, pendingTopLevelComments, trivia);
       pendingTopLevelComments = [];
       if (exported) {
         mod.exports.push(scriptDef.name);
       }
       mod.scripts.push(scriptDef);
-      mod.topLevelOrder!.push({ kind: "script", index: mod.scripts.length - 1 });
+      topLevelOrder.push({ kind: "script", index: mod.scripts.length - 1 });
       i = nextIndex;
       continue;
     }
 
     if (/^(export\s+)?workflow\s/.test(line)) {
-      const { workflow, nextIndex, exported } = parseWorkflowBlock(filePath, lines, i - 1, pendingTopLevelComments);
+      const { workflow, nextIndex, exported } = parseWorkflowBlock(filePath, lines, i - 1, pendingTopLevelComments, trivia);
       pendingTopLevelComments = [];
       if (exported) {
         mod.exports.push(workflow.name);
       }
       mod.workflows.push(workflow);
-      mod.topLevelOrder!.push({ kind: "workflow", index: mod.workflows.length - 1 });
+      topLevelOrder.push({ kind: "workflow", index: mod.workflows.length - 1 });
       i = nextIndex;
       continue;
     }
@@ -162,8 +176,9 @@ export function parsejaiph(source: string, filePath: string): jaiphModule {
     fail(filePath, `unsupported top-level statement: ${line}`, lineNo);
   }
 
+  trivia.setModule({ topLevelOrder });
   if (pendingTopLevelComments.length > 0) {
-    mod.trailingTopLevelComments = [...pendingTopLevelComments];
+    trivia.setModule({ trailingTopLevelComments: [...pendingTopLevelComments] });
   }
 
   // Unified namespace: imports, channels, rules, workflows, scripts, and consts all share one name space.
@@ -189,5 +204,5 @@ export function parsejaiph(source: string, filePath: string): jaiphModule {
     }
   }
 
-  return mod;
+  return { ast: mod, trivia };
 }
diff --git a/src/runtime/docker-inplace.test.ts b/src/runtime/docker-inplace.test.ts
new file mode 100644
index 00000000..60eae3b4
--- /dev/null
+++ b/src/runtime/docker-inplace.test.ts
@@ -0,0 +1,291 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { spawnSync } from "node:child_process";
+import { mkdtempSync, rmSync, writeFileSync, readFileSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import {
+  confirmInplaceRun,
+  detectGitTreeState,
+  formatInplaceWarning,
+  _inplacePrompt,
+} from "./docker-inplace";
+
+const HAS_GIT = spawnSync("git", ["--version"], { stdio: "ignore" }).status === 0;
+
+function makeWs(): string {
+  return mkdtempSync(join(tmpdir(), "jaiph-inplace-ws-"));
+}
+
+function captureStderr(): { restore: () => void; data: () => string } {
+  let buf = "";
+  const orig = process.stderr.write;
+  process.stderr.write = ((chunk: string | Uint8Array) => {
+    buf += String(chunk);
+    return true;
+  }) as typeof process.stderr.write;
+  return {
+    restore: () => { process.stderr.write = orig; },
+    data: () => buf,
+  };
+}
+
+function stubPrompt(answers: string[]): { restore: () => void; callCount: () => number } {
+  const orig = _inplacePrompt.ask;
+  let calls = 0;
+  _inplacePrompt.ask = async (_q: string) => {
+    const a = answers[calls] ?? "";
+    calls += 1;
+    const trimmed = a.trim().toLowerCase();
+    return trimmed === "y" || trimmed === "yes";
+  };
+  return {
+    restore: () => { _inplacePrompt.ask = orig; },
+    callCount: () => calls,
+  };
+}
+
+// ---------------------------------------------------------------------------
+// detectGitTreeState
+// ---------------------------------------------------------------------------
+
+test("detectGitTreeState: non-git directory returns no-repo", () => {
+  const ws = makeWs();
+  try {
+    assert.equal(detectGitTreeState(ws), "no-repo");
+  } finally {
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("detectGitTreeState: clean git tree returns clean", () => {
+  if (!HAS_GIT) return;
+  const ws = makeWs();
+  try {
+    spawnSync("git", ["init", "-q"], { cwd: ws });
+    spawnSync("git", ["config", "user.email", "t@t"], { cwd: ws });
+    spawnSync("git", ["config", "user.name", "t"], { cwd: ws });
+    spawnSync("git", ["commit", "--allow-empty", "-m", "init", "-q"], { cwd: ws });
+    assert.equal(detectGitTreeState(ws), "clean");
+  } finally {
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("detectGitTreeState: dirty git tree returns dirty", () => {
+  if (!HAS_GIT) return;
+  const ws = makeWs();
+  try {
+    spawnSync("git", ["init", "-q"], { cwd: ws });
+    writeFileSync(join(ws, "untracked.txt"), "hi");
+    assert.equal(detectGitTreeState(ws), "dirty");
+  } finally {
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+// ---------------------------------------------------------------------------
+// formatInplaceWarning: three required variants, each names directory + recovery posture
+// ---------------------------------------------------------------------------
+
+test("formatInplaceWarning: clean variant names directory and points at git restore", () => {
+  const msg = formatInplaceWarning("/tmp/example", "clean");
+  assert.ok(msg.includes("/tmp/example"), "names workspace directory");
+  assert.ok(msg.includes("in-place mode"), "labels the mode");
+  assert.ok(msg.includes("git restore") || msg.includes("git reset"), "names recovery command");
+  assert.ok(msg.includes("clean"), "describes clean state");
+  assert.ok(
+    msg.includes("Everything outside this directory stays sandboxed"),
+    "still reminds the user the machine boundary holds",
+  );
+});
+
+test("formatInplaceWarning: dirty variant warns about mixed-in changes and not-cleanly-undoable", () => {
+  const msg = formatInplaceWarning("/tmp/example", "dirty");
+  assert.ok(msg.includes("/tmp/example"));
+  assert.ok(msg.includes("uncommitted"), "calls out uncommitted changes");
+  assert.ok(
+    msg.includes("can't be cleanly undone") || msg.includes("cleanly undone"),
+    "states the not-cleanly-undoable posture",
+  );
+  assert.ok(msg.includes("commit") || msg.includes("stash"), "suggests commit/stash");
+});
+
+test("formatInplaceWarning: no-repo variant states irreversibility and suggests git init", () => {
+  const msg = formatInplaceWarning("/tmp/example", "no-repo");
+  assert.ok(msg.includes("/tmp/example"));
+  assert.ok(msg.includes("No git repository"), "calls out the missing repo");
+  assert.ok(msg.includes("irreversible"), "states irreversibility");
+  assert.ok(msg.includes("git init"), "suggests git init");
+});
+
+// ---------------------------------------------------------------------------
+// confirmInplaceRun: gate behavior
+// ---------------------------------------------------------------------------
+
+test("confirmInplaceRun: JAIPH_INPLACE_YES=1 auto-confirms without calling the prompt", async () => {
+  const ws = makeWs();
+  const spy = stubPrompt([]);
+  const cap = captureStderr();
+  try {
+    const ok = await confirmInplaceRun(ws, { JAIPH_INPLACE_YES: "1" }, true);
+    assert.equal(ok, true);
+    assert.equal(spy.callCount(), 0, "prompt must not be invoked when auto-confirmed");
+    assert.equal(cap.data(), "", "no warning printed on auto-confirm");
+  } finally {
+    cap.restore();
+    spy.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("confirmInplaceRun: JAIPH_INPLACE_YES=true also auto-confirms", async () => {
+  const ws = makeWs();
+  const spy = stubPrompt([]);
+  try {
+    const ok = await confirmInplaceRun(ws, { JAIPH_INPLACE_YES: "true" }, true);
+    assert.equal(ok, true);
+    assert.equal(spy.callCount(), 0);
+  } finally {
+    spy.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("confirmInplaceRun: TTY + user answers yes → returns true (launches)", async () => {
+  const ws = makeWs();
+  const spy = stubPrompt(["y"]);
+  const cap = captureStderr();
+  try {
+    const ok = await confirmInplaceRun(ws, {}, true);
+    assert.equal(ok, true);
+    assert.equal(spy.callCount(), 1, "prompt invoked exactly once");
+    assert.ok(cap.data().includes("in-place mode"), "warning printed before prompt");
+  } finally {
+    cap.restore();
+    spy.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("confirmInplaceRun: TTY + user answers no → returns false (aborts cleanly, no launch)", async () => {
+  const ws = makeWs();
+  const spy = stubPrompt(["n"]);
+  const cap = captureStderr();
+  try {
+    const ok = await confirmInplaceRun(ws, {}, true);
+    assert.equal(ok, false);
+    assert.equal(spy.callCount(), 1);
+    assert.ok(cap.data().includes("in-place mode"));
+  } finally {
+    cap.restore();
+    spy.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("confirmInplaceRun: TTY + empty answer defaults to no", async () => {
+  const ws = makeWs();
+  const spy = stubPrompt([""]);
+  const cap = captureStderr();
+  try {
+    const ok = await confirmInplaceRun(ws, {}, true);
+    assert.equal(ok, false);
+  } finally {
+    cap.restore();
+    spy.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("confirmInplaceRun: non-TTY without JAIPH_INPLACE_YES throws E_DOCKER_INPLACE_NO_CONFIRM", async () => {
+  const ws = makeWs();
+  const spy = stubPrompt([]);
+  try {
+    await assert.rejects(
+      () => confirmInplaceRun(ws, {}, false),
+      /E_DOCKER_INPLACE_NO_CONFIRM/,
+    );
+    assert.equal(spy.callCount(), 0, "prompt is never invoked in non-TTY path");
+  } finally {
+    spy.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("confirmInplaceRun: non-TTY + JAIPH_INPLACE_YES=1 still proceeds", async () => {
+  const ws = makeWs();
+  const spy = stubPrompt([]);
+  try {
+    const ok = await confirmInplaceRun(ws, { JAIPH_INPLACE_YES: "1" }, false);
+    assert.equal(ok, true);
+    assert.equal(spy.callCount(), 0);
+  } finally {
+    spy.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("confirmInplaceRun: warning text adapts to git state (no-repo variant printed for non-git workspace)", async () => {
+  const ws = makeWs();
+  const spy = stubPrompt(["n"]);
+  const cap = captureStderr();
+  try {
+    await confirmInplaceRun(ws, {}, true);
+    const out = cap.data();
+    assert.ok(out.includes("No git repository"), "no-repo branch printed");
+    assert.ok(out.includes(ws), "workspace path named in warning");
+  } finally {
+    cap.restore();
+    spy.restore();
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("confirmInplaceRun: warning text uses clean variant for clean git tree", async () => {
+  if (!HAS_GIT) return;
+  const ws = makeWs();
+  try {
+    spawnSync("git", ["init", "-q"], { cwd: ws });
+    spawnSync("git", ["config", "user.email", "t@t"], { cwd: ws });
+    spawnSync("git", ["config", "user.name", "t"], { cwd: ws });
+    spawnSync("git", ["commit", "--allow-empty", "-m", "init", "-q"], { cwd: ws });
+    const spy = stubPrompt(["n"]);
+    const cap = captureStderr();
+    try {
+      await confirmInplaceRun(ws, {}, true);
+      const out = cap.data();
+      assert.ok(out.includes("clean"), "clean branch printed");
+      assert.ok(out.includes("git restore") || out.includes("git reset"), "clean branch names recovery command");
+    } finally {
+      cap.restore();
+      spy.restore();
+    }
+  } finally {
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+test("confirmInplaceRun: warning text uses dirty variant for dirty git tree", async () => {
+  if (!HAS_GIT) return;
+  const ws = makeWs();
+  try {
+    spawnSync("git", ["init", "-q"], { cwd: ws });
+    writeFileSync(join(ws, "untracked.txt"), "hi");
+    const spy = stubPrompt(["n"]);
+    const cap = captureStderr();
+    try {
+      await confirmInplaceRun(ws, {}, true);
+      const out = cap.data();
+      assert.ok(out.includes("uncommitted"), "dirty branch printed");
+      assert.ok(out.includes("commit") || out.includes("stash"), "dirty branch suggests commit/stash");
+    } finally {
+      cap.restore();
+      spy.restore();
+    }
+  } finally {
+    rmSync(ws, { recursive: true, force: true });
+  }
+});
+
+void readFileSync;
diff --git a/src/runtime/docker-inplace.ts b/src/runtime/docker-inplace.ts
new file mode 100644
index 00000000..7fd08dce
--- /dev/null
+++ b/src/runtime/docker-inplace.ts
@@ -0,0 +1,113 @@
+import { spawnSync } from "node:child_process";
+import { createInterface } from "node:readline";
+
+/**
+ * Git working-tree state used to shape the inplace-mode warning copy.
+ *  - "clean":   git repo, no uncommitted changes — run is reversible via git.
+ *  - "dirty":   git repo, has uncommitted changes — run's edits will mix with them.
+ *  - "no-repo": no git on PATH, or workspace is not a git repo — no safety net.
+ */
+export type GitTreeState = "clean" | "dirty" | "no-repo";
+
+/**
+ * Probe the workspace's git state without ever throwing.
+ *
+ * Treats every failure mode the same as "no-repo": `git` missing on PATH, the
+ * directory not being a git repo, permission errors, etc. The user-facing
+ * warning collapses those into a single "no safety net" branch on purpose.
+ */
+export function detectGitTreeState(workspaceRoot: string): GitTreeState {
+  try {
+    const inside = spawnSync(
+      "git",
+      ["rev-parse", "--is-inside-work-tree"],
+      { cwd: workspaceRoot, stdio: ["ignore", "pipe", "ignore"], encoding: "utf8" },
+    );
+    if (inside.status !== 0 || inside.stdout.trim() !== "true") return "no-repo";
+    const status = spawnSync(
+      "git",
+      ["status", "--porcelain"],
+      { cwd: workspaceRoot, stdio: ["ignore", "pipe", "ignore"], encoding: "utf8" },
+    );
+    if (status.status !== 0) return "no-repo";
+    return status.stdout.length === 0 ? "clean" : "dirty";
+  } catch {
+    return "no-repo";
+  }
+}
+
+/**
+ * The three required warning variants. Each names the actual workspace
+ * directory and states a recovery posture concrete enough that a developer
+ * who is about to lose work can reason about it.
+ */
+export function formatInplaceWarning(workspaceRoot: string, state: GitTreeState): string {
+  const head =
+    `⚠️  jaiph in-place mode: the workflow will edit files directly in ${workspaceRoot} on your machine.`;
+  const tail = `Everything outside this directory stays sandboxed — the run can't touch the rest of your machine.`;
+  let middle: string;
+  if (state === "clean") {
+    middle =
+      `Your git tree is clean, so anything this run changes can be undone with \`git restore .\` (or \`git reset --hard\`).`;
+  } else if (state === "dirty") {
+    middle =
+      `You have uncommitted changes — the run's edits will be mixed in with them and can't be cleanly undone. Consider committing or stashing first.`;
+  } else {
+    middle =
+      `No git repository found here, so there's no safety net — these changes are irreversible. Consider \`git init\` and committing first.`;
+  }
+  return `${head}\n${middle}\n${tail}\n`;
+}
+
+/**
+ * Minimal readline yes/no prompt. Defaults to "no" on empty input, EOF, or any
+ * answer that does not start with `y`/`Y`. There is no existing helper in the
+ * codebase; this is intentionally tiny rather than a new abstraction.
+ */
+async function defaultPromptYesNo(question: string): Promise<boolean> {
+  const rl = createInterface({ input: process.stdin, output: process.stderr });
+  try {
+    const answer = await new Promise<string>((resolveAnswer) => {
+      rl.question(question, (input) => resolveAnswer(input));
+      rl.once("close", () => resolveAnswer(""));
+    });
+    const trimmed = answer.trim().toLowerCase();
+    return trimmed === "y" || trimmed === "yes";
+  } finally {
+    rl.close();
+  }
+}
+
+/** Test seam: tests replace these to assert call/no-call and supply answers. */
+export const _inplacePrompt = {
+  ask: defaultPromptYesNo,
+};
+
+/**
+ * Orchestrate the inplace warning + confirmation flow.
+ *
+ * - `JAIPH_INPLACE_YES=1` / `"true"` skips the prompt entirely (CI path).
+ * - Non-TTY without the flag throws `E_DOCKER_INPLACE_NO_CONFIRM`.
+ * - TTY: print the warning + a `Continue? [y/N]` prompt and return the answer.
+ *
+ * Returns true to proceed with the container launch, false to abort cleanly.
+ */
+export async function confirmInplaceRun(
+  workspaceRoot: string,
+  env: Record<string, string | undefined>,
+  isTTY: boolean,
+): Promise<boolean> {
+  if (env.JAIPH_INPLACE_YES === "1" || env.JAIPH_INPLACE_YES === "true") {
+    return true;
+  }
+  if (!isTTY) {
+    throw new Error(
+      "E_DOCKER_INPLACE_NO_CONFIRM jaiph in-place mode requires interactive confirmation, " +
+        "but stdin is not a TTY. Set JAIPH_INPLACE_YES=1 to auto-confirm.",
+    );
+  }
+  const state = detectGitTreeState(workspaceRoot);
+  const warning = formatInplaceWarning(workspaceRoot, state);
+  process.stderr.write(warning);
+  return _inplacePrompt.ask("Continue? [y/N] ");
+}
diff --git a/src/runtime/docker.test.ts b/src/runtime/docker.test.ts
index 2984de2c..a227fac4 100644
--- a/src/runtime/docker.test.ts
+++ b/src/runtime/docker.test.ts
@@ -11,20 +11,26 @@ import {
   verifyImageHasJaiph,
   prepareImage,
   isEnvAllowed,
+  ENV_ALLOW_PREFIXES,
+  ENV_ALLOW_EXCLUDE_PREFIX,
   GHCR_IMAGE_REPO,
   selectSandboxMode,
   cloneWorkspaceForSandbox,
   allocateSandboxWorkspaceDir,
   pullImageIfNeeded,
   resolveDefaultDockerImageTag,
+  cleanupDocker,
+  withDockerExitGuard,
   _dockerExec,
   _uidDetect,
   type DockerRunConfig,
   type DockerSpawnOptions,
+  type DockerSpawnResult,
 } from "./docker";
 import { mkdtempSync, writeFileSync, mkdirSync, existsSync, readFileSync, readdirSync, rmSync } from "node:fs";
+import { spawnSync } from "node:child_process";
 import { tmpdir } from "node:os";
-import { join, dirname } from "node:path";
+import { join, dirname, resolve } from "node:path";
 
 /** Shared temp workspace for buildDockerArgs tests. */
 const TEST_WS = mkdtempSync(join(tmpdir(), "jaiph-test-ws-"));
@@ -70,7 +76,7 @@ test("resolveDockerConfig: defaults when no in-file and no env — Docker on", (
   assert.equal(cfg.enabled, true);
   assert.ok(cfg.image.startsWith(GHCR_IMAGE_REPO + ":"), `default image should be GHCR: ${cfg.image}`);
   assert.equal(cfg.network, "default");
-  assert.equal(cfg.timeoutSeconds, 3600);
+  assert.equal(cfg.timeoutSeconds, 14400);
 });
 
 test("resolveDefaultDockerImageTag: curl-installer layout (package.json beside src/)", () => {
@@ -472,6 +478,50 @@ test("writeOverlayScript: contains no in-container rsync/cp fallback (host handl
   }
 });
 
+// Importing the docker module must not read overlay-run.sh — non-Docker CLI
+// paths (jaiph compile/format) load this module transitively via shared imports
+// (e.g. CONTAINER_RUN_DIR in src/cli/shared/errors.ts) and must not crash with a
+// raw ENOENT when the installation is incomplete.
+//
+// `writeOverlayScript` now falls back to the embedded base64 copy when both
+// on-disk candidates are absent, so the bun-compiled standalone binary works
+// without any sibling files. The "import does no I/O" property is still
+// asserted; the "throws when missing" half was removed when the embedded
+// fallback shipped.
+test("loadOverlayScript: import does not read overlay-run.sh; writeOverlayScript falls back to embedded copy", () => {
+  const dockerPath = require.resolve("./docker");
+  const dockerDir = dirname(dockerPath);
+  const distOverlay = join(dockerDir, "overlay-run.sh");
+  const repoOverlay = resolve(dockerDir, "..", "..", "..", "runtime", "overlay-run.sh");
+  // Hide on-disk overlay candidates via existsSync patching — do not rename
+  // repo-root runtime/overlay-run.sh; parallel tests (embedded-assets) read it.
+  const script = `
+    const fs = require("node:fs");
+    const dist = ${JSON.stringify(distOverlay)};
+    const repo = ${JSON.stringify(repoOverlay)};
+    const origExists = fs.existsSync;
+    fs.existsSync = (p) => (p === dist || p === repo ? false : origExists(p));
+    const mod = require(${JSON.stringify(dockerPath)});
+    // Mirrors what jaiph compile/format pull from the docker module (only
+    // constants/types, never the overlay path).
+    if (mod.CONTAINER_RUN_DIR !== "/jaiph/run") {
+      console.error("FAIL: CONTAINER_RUN_DIR unexpected: " + mod.CONTAINER_RUN_DIR);
+      process.exit(5);
+    }
+    const tmpPath = mod.writeOverlayScript();
+    const body = fs.readFileSync(tmpPath, "utf8");
+    if (!body.startsWith("#!/usr/bin/env bash")) {
+      console.error("FAIL: embedded overlay body did not start with bash shebang: " + body.slice(0, 60));
+      process.exit(2);
+    }
+    fs.rmSync(require("node:path").dirname(tmpPath), { recursive: true, force: true });
+    console.log("OK");
+  `;
+  const r = spawnSync(process.execPath, ["-e", script], { encoding: "utf8" });
+  assert.equal(r.status, 0, `subprocess failed (status=${r.status}); stdout=${r.stdout}; stderr=${r.stderr}`);
+  assert.match(r.stdout, /OK/);
+});
+
 
 // ---------------------------------------------------------------------------
 // spawnDockerProcess: stdin must be ignored
@@ -632,6 +682,25 @@ test("isEnvAllowed: rejects arbitrary vars", () => {
   assert.equal(isEnvAllowed("CARGO_REGISTRY_TOKEN"), false);
 });
 
+// ---------------------------------------------------------------------------
+// docs/env-vars.md parity: forwarding allowlist must mirror source constants.
+// ---------------------------------------------------------------------------
+
+const REPO_ROOT = resolve(__dirname, "..", "..", "..");
+
+test("docs/env-vars.md lists ENV_ALLOW_PREFIXES and the exclude prefix verbatim", () => {
+  const doc = readFileSync(join(REPO_ROOT, "docs", "env-vars.md"), "utf8");
+  for (const prefix of ENV_ALLOW_PREFIXES) {
+    const token = `\`${prefix}*\``;
+    assert.ok(doc.includes(token), `env-vars.md missing forwarding prefix ${token}`);
+  }
+  const excludeToken = `\`${ENV_ALLOW_EXCLUDE_PREFIX}*\``;
+  assert.ok(
+    doc.includes(excludeToken),
+    `env-vars.md missing forwarding exclusion ${excludeToken}`,
+  );
+});
+
 test("buildDockerArgs: only forwards env vars matching allowlist", () => {
   const opts = defaultOpts({
     env: {
@@ -882,6 +951,239 @@ test("selectSandboxMode: returns overlay iff /dev/fuse exists on host (platform-
   assert.equal(selectSandboxMode({}), expected);
 });
 
+// ---------------------------------------------------------------------------
+// selectSandboxMode + inplace
+// ---------------------------------------------------------------------------
+
+test("selectSandboxMode: JAIPH_INPLACE=1 forces inplace", () => {
+  assert.equal(selectSandboxMode({ JAIPH_INPLACE: "1" }), "inplace");
+  assert.equal(selectSandboxMode({ JAIPH_INPLACE: "true" }), "inplace");
+});
+
+test("selectSandboxMode: JAIPH_INPLACE wins over JAIPH_DOCKER_NO_OVERLAY", () => {
+  assert.equal(
+    selectSandboxMode({ JAIPH_INPLACE: "1", JAIPH_DOCKER_NO_OVERLAY: "1" }),
+    "inplace",
+  );
+});
+
+test("selectSandboxMode: JAIPH_INPLACE=other-value does not switch mode (only 1/true)", () => {
+  const expected = existsSync("/dev/fuse") ? "overlay" : "copy";
+  assert.equal(selectSandboxMode({ JAIPH_INPLACE: "yes" }), expected);
+  assert.equal(selectSandboxMode({ JAIPH_INPLACE: "0" }), expected);
+  assert.equal(selectSandboxMode({ JAIPH_INPLACE: "" }), expected);
+});
+
+test("selectSandboxMode: existing overlay/copy behavior unchanged when JAIPH_INPLACE unset (regression)", () => {
+  // Without JAIPH_INPLACE, the function returns exactly what /dev/fuse +
+  // JAIPH_DOCKER_NO_OVERLAY would have returned before this change.
+  assert.equal(selectSandboxMode({ JAIPH_DOCKER_NO_OVERLAY: "1" }), "copy");
+  assert.equal(selectSandboxMode({ JAIPH_DOCKER_NO_OVERLAY: "true" }), "copy");
+  const expected = existsSync("/dev/fuse") ? "overlay" : "copy";
+  assert.equal(selectSandboxMode({}), expected);
+});
+
+// ---------------------------------------------------------------------------
+// buildDockerArgs: inplace mode
+// ---------------------------------------------------------------------------
+
+function inplaceOpts(overrides?: Partial<DockerSpawnOptions>): DockerSpawnOptions {
+  return defaultOpts({ sandboxMode: "inplace", sandboxWorkspaceDir: undefined, ...overrides });
+}
+
+test("buildDockerArgs: inplace binds real workspaceRoot rw at /jaiph/workspace", () => {
+  const args = buildDockerArgs(inplaceOpts());
+  const vFlags = args.filter((_, i) => i > 0 && args[i - 1] === "-v");
+  const wsMount = vFlags.find((v) => v.endsWith(":/jaiph/workspace:rw"));
+  assert.ok(wsMount, "workspace bound rw at /jaiph/workspace");
+  assert.ok(wsMount!.startsWith(`${resolve(TEST_WS)}:`), "host side is the real workspaceRoot");
+});
+
+test("buildDockerArgs: inplace has no :ro workspace mount, no fuse, no overlay script, no overlay caps", () => {
+  const args = buildDockerArgs(inplaceOpts());
+  const vFlags = args.filter((_, i) => i > 0 && args[i - 1] === "-v");
+  assert.ok(!vFlags.some((v) => v.includes("/jaiph/workspace-ro")), "no overlay lower-layer mount");
+  assert.ok(!vFlags.some((v) => v.includes("/jaiph/overlay-run.sh")), "no overlay script mount");
+  assert.ok(!vFlags.some((v) => v.endsWith(":ro") && v.includes("/jaiph/workspace")), "no :ro workspace mount");
+  assert.ok(!args.includes("/dev/fuse"), "no fuse device");
+  assert.ok(!args.includes("--device"), "no --device flag at all");
+  const capAddValues = args
+    .map((v, i) => (v === "--cap-add" ? args[i + 1] : null))
+    .filter((v): v is string => v !== null);
+  assert.deepStrictEqual(capAddValues, [], "no overlay-only --cap-add flags");
+  const secOptValues = args
+    .map((v, i) => (v === "--security-opt" ? args[i + 1] : null))
+    .filter((v): v is string => v !== null);
+  assert.ok(!secOptValues.includes("apparmor=unconfined"), "no apparmor=unconfined");
+  assert.ok(!args.includes("/jaiph/overlay-run.sh"), "container command does not invoke overlay-run.sh");
+});
+
+test("buildDockerArgs: inplace still includes --cap-drop ALL, no-new-privileges, and runs mount", () => {
+  const args = buildDockerArgs(inplaceOpts());
+  const capDropIdx = args.indexOf("--cap-drop");
+  assert.ok(capDropIdx >= 0);
+  assert.equal(args[capDropIdx + 1], "ALL");
+  const secOptIdx = args.indexOf("--security-opt");
+  assert.ok(secOptIdx >= 0);
+  assert.equal(args[secOptIdx + 1], "no-new-privileges");
+  const vFlags = args.filter((_, i) => i > 0 && args[i - 1] === "-v");
+  const runMount = vFlags.find((v) => v.endsWith(":/jaiph/run:rw"));
+  assert.ok(runMount, "run dir bound rw at /jaiph/run");
+});
+
+test("buildDockerArgs: inplace requires neither overlayScriptPath nor sandboxWorkspaceDir", () => {
+  assert.doesNotThrow(() => buildDockerArgs(inplaceOpts()));
+});
+
+test("buildDockerArgs: inplace on Linux runs as --user host_uid:host_gid", () => {
+  if (process.platform !== "linux") return;
+  const args = buildDockerArgs(inplaceOpts());
+  const userIdx = args.indexOf("--user");
+  assert.ok(userIdx >= 0, "--user flag present");
+  assert.notEqual(args[userIdx + 1], "0:0");
+  assert.match(args[userIdx + 1], /^\d+:\d+$/, "inplace --user is uid:gid");
+});
+
+test("buildDockerArgs: inplace command tail is direct `jaiph run --raw <file>` (no overlay-run.sh wrapper)", () => {
+  const args = buildDockerArgs(inplaceOpts());
+  const idxImage = args.indexOf("ubuntu:24.04");
+  const tail = args.slice(idxImage + 1);
+  assert.equal(tail[0], "jaiph");
+  assert.equal(tail[1], "run");
+  assert.equal(tail[2], "--raw");
+  assert.equal(tail[3], "/jaiph/workspace/main.jh");
+});
+
+test("buildDockerArgs: inplace does not forward JAIPH_INPLACE / JAIPH_INPLACE_YES into the container", () => {
+  const args = buildDockerArgs(inplaceOpts({
+    env: { JAIPH_INPLACE: "1", JAIPH_INPLACE_YES: "1", JAIPH_DEBUG: "true" },
+  }));
+  const envFlags = args
+    .map((v, i) => (v === "-e" ? args[i + 1] : null))
+    .filter((v): v is string => v !== null);
+  assert.ok(envFlags.some((v) => v.startsWith("JAIPH_DEBUG=")), "regular JAIPH_ var still forwarded");
+  assert.ok(!envFlags.some((v) => v.startsWith("JAIPH_INPLACE=")), "JAIPH_INPLACE not forwarded");
+  assert.ok(!envFlags.some((v) => v.startsWith("JAIPH_INPLACE_YES=")), "JAIPH_INPLACE_YES not forwarded");
+});
+
+test("isEnvAllowed: rejects JAIPH_INPLACE and JAIPH_INPLACE_YES (would otherwise leak via JAIPH_ prefix)", () => {
+  assert.equal(isEnvAllowed("JAIPH_INPLACE"), false);
+  assert.equal(isEnvAllowed("JAIPH_INPLACE_YES"), false);
+});
+
+test("buildDockerArgs: write to inplace workspace bind appears at the host workspace; copy does not", () => {
+  // Filesystem-level assertion. We do not run docker — we identify the
+  // host path that the mount spec exposes to the container's /jaiph/workspace
+  // and write to it directly. That path is the real workspaceRoot in inplace
+  // mode, and a separate clone dir in copy mode.
+  const hostWs = mkdtempSync(join(tmpdir(), "jaiph-inplace-host-"));
+  const cloneDir = mkdtempSync(join(tmpdir(), "jaiph-inplace-clone-"));
+  const runDir = mkdtempSync(join(tmpdir(), "jaiph-inplace-run-"));
+  try {
+    writeFileSync(join(hostWs, "main.jh"), "");
+    const findHostBindFor = (args: string[], containerPath: string): string => {
+      for (let i = 0; i < args.length - 1; i++) {
+        if (args[i] !== "-v") continue;
+        const spec = args[i + 1];
+        const m = spec.match(/^(.*):([^:]+):(ro|rw)$/);
+        if (m && m[2] === containerPath) return m[1];
+      }
+      throw new Error(`mount for ${containerPath} not found`);
+    };
+    const inplaceArgs = buildDockerArgs(
+      defaultOpts({ sandboxMode: "inplace", workspaceRoot: hostWs, sandboxWorkspaceDir: undefined, sourceAbs: join(hostWs, "main.jh") }),
+    );
+    const copyArgs = buildDockerArgs(
+      defaultOpts({ sandboxMode: "copy", workspaceRoot: hostWs, sandboxWorkspaceDir: cloneDir, sourceAbs: join(hostWs, "main.jh") }),
+    );
+    const inplaceHostPath = findHostBindFor(inplaceArgs, "/jaiph/workspace");
+    const copyHostPath = findHostBindFor(copyArgs, "/jaiph/workspace");
+    assert.equal(inplaceHostPath, resolve(hostWs), "inplace points at real workspace");
+    assert.notEqual(copyHostPath, resolve(hostWs), "copy points at clone, not workspace");
+    // Simulate the container writing a file through the bind.
+    writeFileSync(join(inplaceHostPath, "wrote_from_container.txt"), "x");
+    writeFileSync(join(copyHostPath, "wrote_from_container.txt"), "x");
+    assert.ok(
+      existsSync(join(hostWs, "wrote_from_container.txt")),
+      "inplace bind: container write lands on host workspace",
+    );
+    // Re-check after copy write — host workspace must only have the inplace file
+    // (already present); the copy write went to cloneDir, not hostWs.
+    const cloneWrite = join(cloneDir, "wrote_from_container.txt");
+    assert.ok(existsSync(cloneWrite), "copy bind: write landed in clone");
+    // Remove the inplace marker, then prove that subsequent copy writes don't leak.
+    rmSync(join(hostWs, "wrote_from_container.txt"));
+    writeFileSync(join(cloneDir, "second_write.txt"), "x");
+    assert.ok(
+      !existsSync(join(hostWs, "second_write.txt")),
+      "copy bind: writes do not leak to host workspace",
+    );
+    void runDir;
+  } finally {
+    rmSync(hostWs, { recursive: true, force: true });
+    rmSync(cloneDir, { recursive: true, force: true });
+    rmSync(runDir, { recursive: true, force: true });
+  }
+});
+
+// ---------------------------------------------------------------------------
+// spawnDockerProcess: inplace mode skips cloneWorkspaceForSandbox path
+// ---------------------------------------------------------------------------
+
+test("spawnDockerProcess: inplace mode does not clone or allocate sandbox workspace dir", () => {
+  const runsRoot = mkdtempSync(join(tmpdir(), "jaiph-inplace-runs-"));
+  const srcWs = mkdtempSync(join(tmpdir(), "jaiph-inplace-ws-"));
+  const { _dockerSpawn, spawnDockerProcess } = require("./docker");
+  const origExec = _dockerExec.run;
+  const origSpawn = _dockerSpawn.run;
+  let capturedArgs: string[] | undefined;
+  _dockerExec.run = () => {}; // pretend docker info / etc. succeed
+  // Stub the long-running docker run with a no-op child that won't outlive the test.
+  _dockerSpawn.run = (args: string[], _opts: object) => {
+    capturedArgs = args;
+    // Minimal ChildProcess stand-in: only the fields the helper exposes via DockerSpawnResult.
+    return { kill: () => true, pid: 0, stdout: null, stderr: null } as unknown as DockerSpawnResult["child"];
+  };
+  try {
+    writeFileSync(join(srcWs, "main.jh"), "");
+    writeFileSync(join(srcWs, "marker.txt"), "live");
+    const result: DockerSpawnResult = spawnDockerProcess({
+      config: {
+        enabled: true,
+        image: "ubuntu:24.04",
+        imageExplicit: false,
+        network: "default",
+        timeoutSeconds: 0,
+      },
+      sourceAbs: join(srcWs, "main.jh"),
+      workspaceRoot: srcWs,
+      sandboxRunDir: runsRoot,
+      runArgs: [],
+      env: { JAIPH_INPLACE: "1" },
+      isTTY: false,
+      sandboxMode: "inplace",
+    });
+    assert.equal(result.sandboxMode, "inplace");
+    assert.equal(result.sandboxWorkspaceDir, undefined, "no sandbox clone dir tracked");
+    assert.equal(result.overlayScriptDir, undefined, "no overlay script dir tracked");
+    // No .sandbox-* entry was created under the runs root.
+    const entries = readdirSync(runsRoot);
+    assert.ok(
+      !entries.some((e) => e.startsWith(".sandbox-")),
+      `inplace must not allocate .sandbox-* dirs (found: ${entries.join(",")})`,
+    );
+    // The host workspace is untouched (no clone copied files elsewhere).
+    assert.equal(readFileSync(join(srcWs, "marker.txt"), "utf8"), "live");
+    // The args still bind-mount the host workspace at /jaiph/workspace:rw.
+    assert.ok(capturedArgs && capturedArgs.some((a) => a.endsWith(":/jaiph/workspace:rw")), "host workspace mounted rw");
+  } finally {
+    _dockerExec.run = origExec;
+    _dockerSpawn.run = origSpawn;
+    rmSync(runsRoot, { recursive: true, force: true });
+    rmSync(srcWs, { recursive: true, force: true });
+  }
+});
+
 // ---------------------------------------------------------------------------
 // cloneWorkspaceForSandbox + allocateSandboxWorkspaceDir
 // ---------------------------------------------------------------------------
@@ -1062,3 +1364,86 @@ test("pullImageIfNeeded: semicolon image passed verbatim to docker pull on inspe
   }
 });
 
+// ---------------------------------------------------------------------------
+// cleanupDocker: idempotency + withDockerExitGuard: leak-free pairing
+// ---------------------------------------------------------------------------
+
+function makeStubDockerResult(overrides?: Partial<DockerSpawnResult>): DockerSpawnResult {
+  return {
+    child: {} as DockerSpawnResult["child"],
+    sandboxRunDir: "/tmp/none",
+    sandboxMode: "copy",
+    keepSandboxWorkspace: false,
+    ...overrides,
+  } as DockerSpawnResult;
+}
+
+test("cleanupDocker: second invocation on same result is a no-op", () => {
+  const overlayDir = mkdtempSync(join(tmpdir(), "jaiph-cleanup-overlay-"));
+  const sandboxDir = mkdtempSync(join(tmpdir(), "jaiph-cleanup-sandbox-"));
+  let timerFired = 0;
+  const timer = setTimeout(() => { timerFired += 1; }, 60_000);
+  const result = makeStubDockerResult({
+    overlayScriptDir: overlayDir,
+    sandboxWorkspaceDir: sandboxDir,
+    timeoutTimer: timer,
+  });
+
+  cleanupDocker(result);
+  assert.equal(result.cleaned, true, "result is marked cleaned after first call");
+  assert.equal(existsSync(overlayDir), false, "overlay tempdir removed");
+  assert.equal(existsSync(sandboxDir), false, "sandbox tempdir removed");
+
+  // Recreate paths to detect a buggy second-pass rmSync; idempotent guard
+  // must prevent any further filesystem work.
+  mkdirSync(overlayDir, { recursive: true });
+  mkdirSync(sandboxDir, { recursive: true });
+  writeFileSync(join(overlayDir, "sentinel"), "keep", "utf8");
+  writeFileSync(join(sandboxDir, "sentinel"), "keep", "utf8");
+
+  assert.doesNotThrow(() => cleanupDocker(result), "second call is silent");
+  assert.equal(existsSync(join(overlayDir, "sentinel")), true, "second call did not re-delete overlay");
+  assert.equal(existsSync(join(sandboxDir, "sentinel")), true, "second call did not re-delete sandbox");
+  assert.equal(timerFired, 0, "timer never fires (cleared on first cleanup)");
+
+  rmSync(overlayDir, { recursive: true, force: true });
+  rmSync(sandboxDir, { recursive: true, force: true });
+});
+
+test("withDockerExitGuard: removes exit listener after successful body", async () => {
+  const result = makeStubDockerResult();
+  const before = process.listenerCount("exit");
+  const beforeListeners = process.listeners("exit").slice();
+  await withDockerExitGuard(result, async () => "ok");
+  const after = process.listeners("exit");
+  assert.equal(after.length, before, "exit listener count returns to pre-run value");
+  // The cleanup guard registered during the helper must not survive in the list.
+  for (const fn of after) {
+    assert.ok(beforeListeners.includes(fn), "no new exit listener remains after helper returns");
+  }
+  assert.equal(result.cleaned, true, "cleanupDocker ran exactly once in finally");
+});
+
+test("withDockerExitGuard: removes exit listener when body throws", async () => {
+  const result = makeStubDockerResult();
+  const before = process.listenerCount("exit");
+  const beforeListeners = process.listeners("exit").slice();
+  await assert.rejects(
+    () => withDockerExitGuard(result, async () => { throw new Error("E_TEST_BODY_FAILED"); }),
+    /E_TEST_BODY_FAILED/,
+  );
+  const after = process.listeners("exit");
+  assert.equal(after.length, before, "exit listener count returns to pre-run value after throw");
+  for (const fn of after) {
+    assert.ok(beforeListeners.includes(fn), "no new exit listener remains after throw");
+  }
+  assert.equal(result.cleaned, true, "cleanupDocker ran exactly once in finally even when body threw");
+});
+
+test("withDockerExitGuard: does not register any exit listener when dockerResult is undefined", async () => {
+  const before = process.listenerCount("exit");
+  const value = await withDockerExitGuard(undefined, async () => 42);
+  assert.equal(value, 42);
+  assert.equal(process.listenerCount("exit"), before, "no listener registered without a dockerResult");
+});
+
diff --git a/src/runtime/docker.ts b/src/runtime/docker.ts
index e8ec72f4..de91f7c8 100644
--- a/src/runtime/docker.ts
+++ b/src/runtime/docker.ts
@@ -4,6 +4,7 @@ import { randomBytes } from "node:crypto";
 import { tmpdir } from "node:os";
 import { join, resolve, dirname, relative } from "node:path";
 import type { RuntimeConfig } from "../types";
+import { OVERLAY_RUN_SH_BASE64, decodeEmbeddedAsset } from "./embedded-assets";
 
 /** Resolved Docker runtime config with defaults applied and env overrides merged. */
 export interface DockerRunConfig {
@@ -84,7 +85,7 @@ const DEFAULTS: DockerRunConfig = {
   image: `${GHCR_IMAGE_REPO}:${resolveDefaultDockerImageTag()}`,
   imageExplicit: false,
   network: "default",
-  timeoutSeconds: 3600,
+  timeoutSeconds: 14400,
 };
 
 /**
@@ -155,6 +156,13 @@ export const _dockerExec = {
   },
 };
 
+/** Test seam for the long-running `docker run` spawn — stubbed by spawn tests. */
+export const _dockerSpawn = {
+  run(args: string[], opts: object): ChildProcess {
+    return spawn("docker", args, opts as any);
+  },
+};
+
 /** Test seam for host UID/GID detection — allows tests to simulate detection failure. */
 export const _uidDetect = {
   getHostUidGid(): { uid: string; gid: string } | undefined {
@@ -281,15 +289,31 @@ export function resolveImage(config: DockerRunConfig): string {
 /**
  * Container-side fuse-overlayfs setup loaded from runtime/overlay-run.sh.
  *
- * Resolves the file relative to package root — works from both source and dist
- * layouts, mirroring `resolveDefaultDockerImageTag` (package.json hops).
+ * Resolves the script in this order, so the npm/disk install and the
+ * bun-compiled standalone binary both work:
+ *   1. Sibling `overlay-run.sh` next to this module (npm `dist/src/runtime/`).
+ *   2. Repo-root `runtime/overlay-run.sh` three hops up (dev `src/runtime/`).
+ *   3. Embedded base64 baked into the executable (bun --compile binary).
+ * Lazy so importing the docker module from non-Docker code paths never
+ * touches the asset.
  */
-const OVERLAY_SCRIPT = readFileSync(
-  existsSync(resolve(__dirname, "overlay-run.sh"))
-    ? resolve(__dirname, "overlay-run.sh")
-    : resolve(__dirname, "..", "..", "..", "runtime", "overlay-run.sh"),
-  "utf8",
-);
+let overlayScriptCache: string | undefined;
+
+export function loadOverlayScript(): string {
+  if (overlayScriptCache !== undefined) return overlayScriptCache;
+  const diskCandidates = [
+    resolve(__dirname, "overlay-run.sh"),
+    resolve(__dirname, "..", "..", "..", "runtime", "overlay-run.sh"),
+  ];
+  for (const scriptPath of diskCandidates) {
+    if (existsSync(scriptPath)) {
+      overlayScriptCache = readFileSync(scriptPath, "utf8");
+      return overlayScriptCache;
+    }
+  }
+  overlayScriptCache = decodeEmbeddedAsset(OVERLAY_RUN_SH_BASE64);
+  return overlayScriptCache;
+}
 
 /**
  * Write overlay-run.sh to a temp file and return its path.
@@ -298,7 +322,7 @@ const OVERLAY_SCRIPT = readFileSync(
 export function writeOverlayScript(): string {
   const dir = mkdtempSync(join(tmpdir(), "jaiph-overlay-"));
   const scriptPath = join(dir, "overlay-run.sh");
-  writeFileSync(scriptPath, OVERLAY_SCRIPT, { mode: 0o755 });
+  writeFileSync(scriptPath, loadOverlayScript(), { mode: 0o755 });
   return scriptPath;
 }
 
@@ -307,17 +331,23 @@ export function writeOverlayScript(): string {
 // ---------------------------------------------------------------------------
 
 /** Selected sandbox primitive for a Docker run. */
-export type SandboxMode = "overlay" | "copy";
+export type SandboxMode = "overlay" | "copy" | "inplace";
 
 /**
  * Choose the sandbox mode for the upcoming run.
  *
- * Heuristic: presence of `/dev/fuse` on the host is a strong proxy for
+ * `JAIPH_INPLACE` is the highest-priority opt-in: when truthy, the host
+ * workspace is bind-mounted rw directly so the run's edits land live on the
+ * host. The machine boundary (mount set, caps, env allowlist) is unchanged.
+ * Otherwise, presence of `/dev/fuse` on the host is a strong proxy for
  * fuse-overlayfs viability inside the container. Linux dev/CI hosts typically
  * have it; macOS Docker Desktop typically doesn't expose it. Override with
  * `JAIPH_DOCKER_NO_OVERLAY=1` to force the host-copy path.
  */
 export function selectSandboxMode(env: Record<string, string | undefined>): SandboxMode {
+  if (env.JAIPH_INPLACE === "1" || env.JAIPH_INPLACE === "true") {
+    return "inplace";
+  }
   if (env.JAIPH_DOCKER_NO_OVERLAY === "1" || env.JAIPH_DOCKER_NO_OVERLAY === "true") {
     return "copy";
   }
@@ -470,14 +500,25 @@ export const CONTAINER_RUN_DIR = "/jaiph/run";
  * Explicit allowlist of environment variable prefixes forwarded into the
  * container. Everything else is dropped — fail-closed by design.
  */
-const ENV_ALLOW_PREFIXES = ["JAIPH_", "ANTHROPIC_", "CURSOR_", "CLAUDE_"] as const;
+export const ENV_ALLOW_PREFIXES = ["JAIPH_", "ANTHROPIC_", "CURSOR_", "CLAUDE_"] as const;
 
 /** Prefix excluded from the allowlist even though it starts with JAIPH_. */
-const ENV_ALLOW_EXCLUDE_PREFIX = "JAIPH_DOCKER_";
+export const ENV_ALLOW_EXCLUDE_PREFIX = "JAIPH_DOCKER_";
+
+/**
+ * Explicit exclusions that would otherwise pass the JAIPH_ allowlist.
+ * Forwarding these would leak host control flags into the container (and let a
+ * nested run re-trigger the same mode).
+ */
+export const ENV_ALLOW_EXCLUDE_NAMES = new Set<string>([
+  "JAIPH_INPLACE",
+  "JAIPH_INPLACE_YES",
+]);
 
 /** Returns true if `key` is on the explicit allowlist for container forwarding. */
 export function isEnvAllowed(key: string): boolean {
   if (key.startsWith(ENV_ALLOW_EXCLUDE_PREFIX)) return false;
+  if (ENV_ALLOW_EXCLUDE_NAMES.has(key)) return false;
   return ENV_ALLOW_PREFIXES.some((prefix) => key.startsWith(prefix));
 }
 
@@ -553,17 +594,21 @@ export function overlayMountPath(containerPath: string): string {
 /**
  * Build the `docker run --rm` argument list.
  *
- * Two sandbox shapes:
+ * Three sandbox shapes:
  *  - "overlay": workspace bind-mounts ro at /jaiph/workspace-ro; entrypoint
  *    script sets up fuse-overlayfs at /jaiph/workspace. Requires SYS_ADMIN
  *    and /dev/fuse. Run artifacts mount at /jaiph/run (outside the overlay).
  *  - "copy": host pre-clones workspace to `opts.sandboxWorkspaceDir`; that
  *    dir bind-mounts rw at /jaiph/workspace. No overlay script, no fuse,
  *    no SYS_ADMIN. Run artifacts mount at /jaiph/run as before.
+ *  - "inplace": host workspace itself bind-mounts rw at /jaiph/workspace —
+ *    edits land live on the host. Same caps/network/env posture as "copy".
+ *    Concurrent runs on the same workspace are a known sharp edge — no
+ *    locking is performed.
  *
  * The container runs `jaiph run --raw <file>` using its own installed jaiph.
  *
- * `overlayScriptPath` is required for "overlay" mode and ignored for "copy".
+ * `overlayScriptPath` is required for "overlay" mode and ignored for the rest.
  */
 export function buildDockerArgs(opts: DockerSpawnOptions, overlayScriptPath?: string): string[] {
   const mode: SandboxMode = opts.sandboxMode ?? selectSandboxMode(opts.env);
@@ -640,6 +685,10 @@ export function buildDockerArgs(opts: DockerSpawnOptions, overlayScriptPath?: st
     const hostAbs = resolve(opts.workspaceRoot);
     validateMountHostPath(hostAbs);
     args.push("-v", `${hostAbs}:${overlayMountPath(CONTAINER_WORKSPACE)}:ro`);
+  } else if (mode === "inplace") {
+    const hostAbs = resolve(opts.workspaceRoot);
+    validateMountHostPath(hostAbs);
+    args.push("-v", `${hostAbs}:${CONTAINER_WORKSPACE}:rw`);
   } else {
     const hostAbs = resolve(opts.sandboxWorkspaceDir!);
     validateMountHostPath(hostAbs);
@@ -744,15 +793,17 @@ export function spawnDockerProcess(opts: DockerSpawnOptions): DockerSpawnResult
   if (mode === "overlay") {
     overlayScriptPath = writeOverlayScript();
     overlayScriptDir = dirname(overlayScriptPath);
-  } else {
+  } else if (mode === "copy") {
     sandboxWorkspaceDir = opts.sandboxWorkspaceDir ?? allocateSandboxWorkspaceDir(opts.sandboxRunDir);
     cloneWorkspaceForSandbox(opts.workspaceRoot, sandboxWorkspaceDir);
   }
+  // inplace: no overlay script, no workspace clone — the host workspace is
+  // bind-mounted rw directly. The runs mount is still created above.
 
   opts = { ...opts, sandboxMode: mode, sandboxWorkspaceDir };
   const dockerArgs = buildDockerArgs(opts, overlayScriptPath);
 
-  const child = spawn("docker", dockerArgs, {
+  const child = _dockerSpawn.run(dockerArgs, {
     stdio: ["ignore", "pipe", "pipe"],
     cwd: opts.workspaceRoot,
     env: opts.env,
@@ -790,6 +841,8 @@ export function spawnDockerProcess(opts: DockerSpawnOptions): DockerSpawnResult
 /**
  * Clean up Docker resources after execution.
  *
+ * Idempotent: subsequent calls on the same `result` short-circuit on
+ * `result.cleaned` — exit-guard + finally-path pairing relies on this.
  * Removes the overlay script tempdir (overlay mode) and the cloned workspace
  * (copy mode), unless `JAIPH_DOCKER_KEEP_SANDBOX=1` was set.
  */
@@ -815,4 +868,29 @@ export function cleanupDocker(result: DockerSpawnResult): void {
   }
 }
 
+/**
+ * Run `body` with an abnormal-exit cleanup guard registered on `process.on("exit")`.
+ *
+ * Registration and removal are paired via try/finally: on both normal return
+ * and on throw, the listener is removed and `cleanupDocker(dockerResult)` is
+ * called exactly once. The guard only fires when the process exits before the
+ * finally runs (e.g. crash, unhandled exception in the host) — that's its
+ * purpose. When `dockerResult` is undefined (non-Docker run), no listener is
+ * registered.
+ */
+export async function withDockerExitGuard<T>(
+  dockerResult: DockerSpawnResult | undefined,
+  body: () => Promise<T>,
+): Promise<T> {
+  if (!dockerResult) return body();
+  const guard = (): void => { cleanupDocker(dockerResult); };
+  process.on("exit", guard);
+  try {
+    return await body();
+  } finally {
+    cleanupDocker(dockerResult);
+    process.removeListener("exit", guard);
+  }
+}
+
 
diff --git a/src/runtime/embedded-assets.test.ts b/src/runtime/embedded-assets.test.ts
new file mode 100644
index 00000000..36b9e896
--- /dev/null
+++ b/src/runtime/embedded-assets.test.ts
@@ -0,0 +1,35 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { existsSync, readFileSync } from "node:fs";
+import { dirname, join } from "node:path";
+import {
+  OVERLAY_RUN_SH_BASE64,
+  JAIPH_SKILL_MD_BASE64,
+  decodeEmbeddedAsset,
+} from "./embedded-assets";
+
+// The standalone binary ships these files inside the executable. If they
+// drift from the on-disk sources, npm builds keep working but the bun-compiled
+// jaiph silently ships outdated text. Fail loudly so the next contributor
+// reruns `npm run embed-assets` (run automatically by `npm run build`).
+function findRepoRoot(): string {
+  let cur = __dirname;
+  while (cur !== dirname(cur)) {
+    if (existsSync(join(cur, "package.json")) && existsSync(join(cur, "runtime"))) {
+      return cur;
+    }
+    cur = dirname(cur);
+  }
+  throw new Error("could not locate repo root for embedded-assets test");
+}
+const REPO_ROOT = findRepoRoot();
+
+test("OVERLAY_RUN_SH_BASE64 matches runtime/overlay-run.sh on disk", () => {
+  const disk = readFileSync(join(REPO_ROOT, "runtime/overlay-run.sh"), "utf8");
+  assert.equal(decodeEmbeddedAsset(OVERLAY_RUN_SH_BASE64), disk);
+});
+
+test("JAIPH_SKILL_MD_BASE64 matches docs/jaiph-skill.md on disk", () => {
+  const disk = readFileSync(join(REPO_ROOT, "docs/jaiph-skill.md"), "utf8");
+  assert.equal(decodeEmbeddedAsset(JAIPH_SKILL_MD_BASE64), disk);
+});
diff --git a/src/runtime/embedded-assets.ts b/src/runtime/embedded-assets.ts
new file mode 100644
index 00000000..c19a814a
--- /dev/null
+++ b/src/runtime/embedded-assets.ts
@@ -0,0 +1,17 @@
+// AUTO-GENERATED by tools/embed-assets.js — do not edit by hand.
+// Regenerated by `npm run build`. Sources:
+//   - runtime/overlay-run.sh
+//   - docs/jaiph-skill.md
+//
+// Base64-encoded so a bun --compile binary carries the bytes inside the
+// executable; the embedded-assets test fails if these drift from disk.
+
+export const OVERLAY_RUN_SH_BASE64 =
+  "IyEvdXNyL2Jpbi9lbnYgYmFzaApzZXQgLWV1byBwaXBlZmFpbApMT1dFUj0vamFpcGgvd29ya3NwYWNlLXJvClVQUEVSPS90bXAvb3ZlcmxheS11cHBlcgpXT1JLPS90bXAvb3ZlcmxheS13b3JrCk1FUkdFRD0vamFpcGgvd29ya3NwYWNlClJVTl9ESVI9L2phaXBoL3J1bgpta2RpciAtcCAiJFVQUEVSIiAiJFdPUksiICIkTUVSR0VEIgoKaWYgISBjb21tYW5kIC12IGZ1c2Utb3ZlcmxheWZzID4vZGV2L251bGwgMj4mMTsgdGhlbgogIHByaW50ZiAnRV9ET0NLRVJfT1ZFUkxBWSBmdXNlLW92ZXJsYXlmcyBub3QgZm91bmQgaW4gaW1hZ2U7IGluc3RhbGwgaXQgb3Igc2V0IEpBSVBIX0RPQ0tFUl9OT19PVkVSTEFZPTEgb24gdGhlIGhvc3QgdG8gdXNlIHRoZSBjb3B5IHNhbmRib3ggcGF0aFxuJyA+JjIKICBleGl0IDc4CmZpCmlmIFsgISAtZSAvZGV2L2Z1c2UgXTsgdGhlbgogIHByaW50ZiAnRV9ET0NLRVJfT1ZFUkxBWSAvZGV2L2Z1c2Ugbm90IHByZXNlbnQgaW4gY29udGFpbmVyOyBwYXNzIC0tZGV2aWNlIC9kZXYvZnVzZSBvciBzZXQgSkFJUEhfRE9DS0VSX05PX09WRVJMQVk9MSB0byB1c2UgdGhlIGNvcHkgc2FuZGJveCBwYXRoXG4nID4mMgogIGV4aXQgNzgKZmkKaWYgISBmdXNlLW92ZXJsYXlmcyAtbyAibG93ZXJkaXI9JExPV0VSLHVwcGVyZGlyPSRVUFBFUix3b3JrZGlyPSRXT1JLLGFsbG93X290aGVyIiAiJE1FUkdFRCIgMj4vdG1wL2phaXBoLWZ1c2Utb3ZlcmxheS5lcnI7IHRoZW4KICByZWFzb249IiQodHIgJ1xuJyAnICcgPC90bXAvamFpcGgtZnVzZS1vdmVybGF5LmVyciB8IHNlZCAncy9bWzpzcGFjZTpdXVwrLyAvZzsgcy9eIC8vOyBzLyAkLy8nKSIKICBwcmludGYgJ0VfRE9DS0VSX09WRVJMQVkgZnVzZS1vdmVybGF5ZnMgbW91bnQgZmFpbGVkOiAlc1xuJyAiJHJlYXNvbiIgPiYyCiAgZXhpdCA3OApmaQoKY2QgIiRNRVJHRUQiCgojIERyb3AgdG8gaG9zdCBVSUQvR0lEIGFmdGVyIG1vdW50aW5nIG92ZXJsYXkgYXMgcm9vdC4KaWYgWyAtbiAiJHtKQUlQSF9IT1NUX1VJRDotfSIgXSAmJiBbIC1uICIke0pBSVBIX0hPU1RfR0lEOi19IiBdICYmIGNvbW1hbmQgLXYgc2V0cHJpdiA+L2Rldi9udWxsIDI+JjE7IHRoZW4KICBjaG93biAiJEpBSVBIX0hPU1RfVUlEOiRKQUlQSF9IT1NUX0dJRCIgIiRSVU5fRElSIiAyPi9kZXYvbnVsbCB8fCB0cnVlCiAgZXhlYyBzZXRwcml2IC0tcmV1aWQ9IiRKQUlQSF9IT1NUX1VJRCIgLS1yZWdpZD0iJEpBSVBIX0hPU1RfR0lEIiAtLWNsZWFyLWdyb3VwcyAtLSAiJEAiCmZpCmV4ZWMgIiRAIgo=";
+
+export const JAIPH_SKILL_MD_BASE64 =
+  "LS0tCnRpdGxlOiBBZ2VudCBTa2lsbApwZXJtYWxpbms6IC9qYWlwaC1za2lsbApkaWF0YXhpczogY29udHJpYnV0b3IKcmVkaXJlY3RfZnJvbToKICAtIC9qYWlwaC1za2lsbC5tZAotLS0KCiMgSmFpcGggU2tpbGwgKGZvciBBZ2VudHMpCgpZb3UgYXJlIGFuIGFnZW50LiBBIHVzZXIgaGFzIGFza2VkIHlvdSB0byBhdXRvbWF0ZSBhIHJlcGV0aXRpdmUgdGFzayDigJQgYSBkZWxpdmVyeSBwaXBlbGluZSwgYSByZXZpZXcgbG9vcCwgYSByZWN1cnJpbmcgY2hlY2ssIGEgcXVldWUgb2Ygd29yayBpdGVtcy4gVGhpcyBkb2N1bWVudCB0ZWFjaGVzIHlvdSB0byBhdXRob3IgKipKYWlwaCB3b3JrZmxvd3MqKiB0aGF0IGRvIHRoYXQuIFJlYWQgaXQgZnVsbHkgYmVmb3JlIHdyaXRpbmcgYW55IGAuamhgIGZpbGU7IEphaXBoIGxvb2tzIGxpa2Ugc2hlbGwgcGx1cyBZQU1MIGJ1dCBpcyBuZWl0aGVyLCBhbmQgbW9zdCBhdXRob3JpbmcgbWlzdGFrZXMgY29tZSBmcm9tIGd1ZXNzaW5nIHN5bnRheCBpbnN0ZWFkIG9mIGZvbGxvd2luZyB0aGUgcnVsZXMgYmVsb3cuCgojIyBXaGF0IEphaXBoIGlzCgpKYWlwaCBpcyBhIHNtYWxsIHdvcmtmbG93IGxhbmd1YWdlLiBBIGAuamhgIGZpbGUgZGVjbGFyZXM6Cgp8IENvbnN0cnVjdCB8IFdoYXQgaXQgaXMgfCBIb3cgaXQgcnVucyB8CnwtLS18LS0tfC0tLXwKfCBgd29ya2Zsb3dgIHwgQSBuYW1lZCBzZXF1ZW5jZSBvZiBzdGVwcyDigJQgdGhlIG9yY2hlc3RyYXRpb24gbGF5ZXIgfCBJbnRlcnByZXRlZCBpbi1wcm9jZXNzIGJ5IHRoZSBydW50aW1lIHwKfCBgcnVsZWAgfCBBIG5vbi1tdXRhdGluZyBjaGVjayAocHJlY29uZGl0aW9ucywgdmVyaWZpY2F0aW9ucykgfCBJbnRlcnByZXRlZCBpbi1wcm9jZXNzOyBjYWxsZWQgd2l0aCBgZW5zdXJlYCB8CnwgYHNjcmlwdGAgfCBSZWFsIHNoZWxsIChvciBQeXRob24sIE5vZGUsIOKApikg4oCUIHRoZSBvbmx5IHBsYWNlIGZvciBzaGVsbCBjb2RlIHwgU3Bhd25lZCBhcyBhIHN1YnByb2Nlc3M7IGNhbGxlZCB3aXRoIGBydW5gIHwKfCBgcHJvbXB0YCB8IEEgdGFzayBkZWxlZ2F0ZWQgdG8gYW4gQUkgYWdlbnQgKEN1cnNvciAvIENsYXVkZSAvIENvZGV4IGJhY2tlbmQpIHwgQmFja2VuZCBDTEkgb3IgQVBJIGNhbGw7IHlvdSBjYXB0dXJlIHRoZSBhbnN3ZXIgfAp8IGBjaGFubmVsYCB8IEEgbWVzc2FnZSBxdWV1ZSB3aXRoIGRlY2xhcmVkIHdvcmtmbG93IGxpc3RlbmVycyB8IERyYWluZWQgYWZ0ZXIgdGhlIHNlbmRpbmcgd29ya2Zsb3cgZmluaXNoZXMgfAoKRXZlcnl0aGluZyBpcyAqKnN0cmluZ3MqKi4gRXZlcnkgc3RlcCBpcyBsb2dnZWQuIEV2ZXJ5IHJ1biBsZWF2ZXMgZHVyYWJsZSBhcnRpZmFjdHMgdW5kZXIgYC5qYWlwaC9ydW5zL2AgKHBlci1zdGVwIGAub3V0YC9gLmVycmAgZmlsZXMgYW5kIGFuIGFwcGVuZC1vbmx5IGBydW5fc3VtbWFyeS5qc29ubGApLiBUaGF0IGlzIHRoZSBwYXlvZmYgb3ZlciBhZC1ob2Mgc2hlbGw6IHJlcGVhdGFibGUsIGluc3BlY3RhYmxlLCB0ZXN0YWJsZSBhdXRvbWF0aW9uLgoKKipTb3VyY2Ugb2YgdHJ1dGg6Kiogd2hlbiB0aGlzIGRvY3VtZW50IGFuZCB0aGUgY29tcGlsZXIgZGlzYWdyZWUsIHRoZSBjb21waWxlciB3aW5zLiBGdWxsIHJlZmVyZW5jZXM6IFtHcmFtbWFyXShncmFtbWFyLm1kKSwgW0NMSV0oY2xpLm1kKSwgW0NvbmZpZ3VyYXRpb25dKGNvbmZpZ3VyYXRpb24ubWQpLCBbV3JpdGUgJiBydW4gdGVzdHNdKHRlc3RpbmcubWQpLCBbSW5ib3ggJiBkaXNwYXRjaF0oaW5ib3gubWQpLCBbU2FuZGJveGluZ10oc2FuZGJveGluZy5tZCkuCgojIyBTbWFsbGVzdCB3b3JraW5nIGV4YW1wbGUKCmBgYGphaXBoCnNjcmlwdCBsaXN0X3RvZG9zID0gYGdyZXAgLXJuICJUT0RPIiBzcmMvIHx8IHRydWVgCnNjcmlwdCB3b3JrdHJlZV9jbGVhbiA9IGB0ZXN0IC16ICIkKGdpdCBzdGF0dXMgLS1wb3JjZWxhaW4pImAKCnJ1bGUgZ2l0X2NsZWFuKCkgewogIHJ1biB3b3JrdHJlZV9jbGVhbigpIGNhdGNoIChlcnIpIHsKICAgIGZhaWwgIndvcmtpbmcgdHJlZSBpcyBub3QgY2xlYW4iCiAgfQp9Cgp3b3JrZmxvdyBkZWZhdWx0KHRhc2spIHsKICBlbnN1cmUgZ2l0X2NsZWFuKCkKICBjb25zdCB0b2RvcyA9IHJ1biBsaXN0X3RvZG9zKCkKICBwcm9tcHQgIiIiCiAgQWRkcmVzcyB0aGUgZm9sbG93aW5nIHJlcXVlc3Q6ICR7dGFza30KICBLbm93biBUT0RPcyBpbiB0aGUgY29kZWJhc2U6CiAgJHt0b2Rvc30KICAiIiIKICBsb2cgImRvbmUiCn0KYGBgCgpSdW4gaXQ6IGBqYWlwaCBydW4gLi9mbG93LmpoICJjbGVhbiB1cCB0aGUgYXV0aCBtb2R1bGUiYC4gVGhlIENMSSBleGVjdXRlcyBgd29ya2Zsb3cgZGVmYXVsdGAgYW5kIGJpbmRzIGAiY2xlYW4gdXAgdGhlIGF1dGggbW9kdWxlImAgdG8gdGhlIGB0YXNrYCBwYXJhbWV0ZXIuICoqRXZlcnkgcnVubmFibGUgZmlsZSBtdXN0IGRlZmluZSBgd29ya2Zsb3cgZGVmYXVsdGAuKioKCiMjIFlvdXIgYXV0aG9yaW5nIGxvb3AKCkZvbGxvdyB0aGlzIHNlcXVlbmNlIGV2ZXJ5IHRpbWUgeW91IGNyZWF0ZSBvciBlZGl0IGAuamhgIGZpbGVzLiBEbyBub3Qgc2tpcCB0aGUgY29tcGlsZSBzdGVwIOKAlCBpdCBjYXRjaGVzIGFsbW9zdCBldmVyeSBtaXN0YWtlIGRlc2NyaWJlZCBpbiB0aGlzIGRvY3VtZW50LCB3aXRoIGZpbGU6bGluZTpjb2wgcG9zaXRpb25zLgoKMS4gKipXcml0ZSoqIHRoZSBgLmpoYCBmaWxlcyAoc3ludGF4IGJlbG93KS4KMi4gKipGb3JtYXQ6KiogYGphaXBoIGZvcm1hdCA8ZmlsZXPigKY+YCDigJQgY2Fub25pY2FsIHdoaXRlc3BhY2UgYW5kIHRvcC1sZXZlbCBvcmRlcmluZy4KMy4gKipDb21waWxlOioqIGBqYWlwaCBjb21waWxlIFstLWpzb25dIFstLXdvcmtzcGFjZSA8ZGlyPl0gPGZpbGUtb3ItZGlyPmAg4oCUIHBhcnNlcyBhbmQgdmFsaWRhdGVzIHRoZSB3aG9sZSBpbXBvcnQgY2xvc3VyZSB3aXRob3V0IHJ1bm5pbmcgYW55dGhpbmcuIFJlcG9ydHMgKiphbGwqKiBlcnJvcnMgYXQgb25jZSBhcyBgcGF0aDpsaW5lOmNvbCBDT0RFIG1lc3NhZ2VgLiBVc2UgYC0tanNvbmAgZm9yIG1hY2hpbmUtcmVhZGFibGUgb3V0cHV0LiBEaXJlY3RvcnkgYXJndW1lbnRzIHNraXAgYCoudGVzdC5qaGA7IHBhc3MgdGVzdCBmaWxlcyBleHBsaWNpdGx5LiBgLS13b3Jrc3BhY2VgIHNldHMgdGhlIGxpYnJhcnkgcm9vdCBmb3IgYGphaXBoIGluc3RhbGxgIHBhdGhzIHdoZW4gYXV0by1kZXRlY3QgaXMgd3JvbmcuCjQuICoqVGVzdDoqKiBgamFpcGggdGVzdGAg4oCUIHJ1bnMgZXZlcnkgYCoudGVzdC5qaGAgaXQgZmluZHM7IHplcm8gbWF0Y2hlcyBpbiBkaXNjb3ZlcnkgbW9kZSBleGl0IDAgd2l0aCBhIG5vdGljZSwgc28gdGhpcyBjYWxsIGlzIGFsd2F5cyBzYWZlIHRvIG1ha2UuCjUuICoqUnVuOioqIGBqYWlwaCBydW4gPGZpbGUuamg+IFthcmdz4oCmXWAgZm9yIHRoZSBlbmQtdG8tZW5kIGNoZWNrLgoKQ0xJIHF1aWNrIHJlZmVyZW5jZToKCnwgQ29tbWFuZCB8IFB1cnBvc2UgfAp8LS0tfC0tLXwKfCBgamFpcGggcnVuIFstLXRhcmdldCA8ZGlyPl0gWy0tcmF3XSA8ZmlsZS5qaD4gWy0tXSBbYXJnc+KApl1gIHwgRXhlY3V0ZSBgd29ya2Zsb3cgZGVmYXVsdGA7IGFyZ3MgYmluZCB0byBpdHMgbmFtZWQgcGFyYW1ldGVycyB8CnwgYGphaXBoIHRlc3QgW3BhdGhdYCB8IFJ1biBgKi50ZXN0LmpoYCBmaWxlcyAod29ya3NwYWNlLCBkaXIsIG9yIHNpbmdsZSBmaWxlKSB8CnwgYGphaXBoIGNvbXBpbGUgWy0tanNvbl0gWy0td29ya3NwYWNlIDxkaXI+XSA8cGF0aHPigKY+YCB8IFZhbGlkYXRlIG9ubHkg4oCUIG5vIGV4ZWN1dGlvbiwgbm8gc2lkZSBlZmZlY3RzIHwKfCBgamFpcGggZm9ybWF0IFstLWNoZWNrXSA8ZmlsZS5qaCDigKY+YCB8IFJlZm9ybWF0IChvciB2ZXJpZnkgZm9ybWF0dGluZyBpbiBDSSkgfAp8IGBqYWlwaCBpbml0IFt3b3Jrc3BhY2VdYCB8IFNjYWZmb2xkIGAuamFpcGgvYCAoYm9vdHN0cmFwIHdvcmtmbG93ICsgdGhpcyBza2lsbCBmaWxlKSB8CnwgYGphaXBoIGluc3RhbGwgWzxuYW1lW0B2ZXJzaW9uXT4gXHwgPHVybFtAdmVyc2lvbl0+4oCmXWAgfCBJbnN0YWxsIGxpYnJhcmllcyBpbnRvIGAuamFpcGgvbGlicy9gIChiYXJlIG5hbWVzIHJlc29sdmUgdmlhIGBKQUlQSF9SRUdJU1RSWWAsIGVsc2UgYGh0dHBzOi8vamFpcGgub3JnL3JlZ2lzdHJ5YDsgVVJMIGZvcm0gaXMgdW5jaGFuZ2VkKSB8CgpTaG9ydGhhbmQ6IGBqYWlwaCAuL2ZpbGUuamhgIHJvdXRlcyBieSBleHRlbnNpb24gKGAqLnRlc3QuamhgIOKGkiB0ZXN0LCBvdGhlciBgLmpoYCDihpIgcnVuKS4gQSBgIyEvdXNyL2Jpbi9lbnYgamFpcGhgIHNoZWJhbmcgbWFrZXMgYSBgLmpoYCBmaWxlIGRpcmVjdGx5IGV4ZWN1dGFibGUuCgoqKlNhbmRib3hpbmc6KiogYnkgZGVmYXVsdCwgaW50ZXJhY3RpdmUgYGphaXBoIHJ1bmAgZXhlY3V0ZXMgdGhlIHdvcmtmbG93IGluc2lkZSBhIERvY2tlciBjb250YWluZXIgKGBnaGNyLmlvL2phaXBobGFuZy9qYWlwaC1ydW50aW1lYCkuIFNldCBgSkFJUEhfVU5TQUZFPXRydWVgIG9yIHBhc3MgYC0tdW5zYWZlYCB0byBydW4gZGlyZWN0bHkgb24gdGhlIGhvc3QsIG9yIHNldCBgSkFJUEhfRE9DS0VSX0VOQUJMRUQ9dHJ1ZS9mYWxzZWAgdG8gZm9yY2UgZWl0aGVyIG1vZGUuIGBqYWlwaCB0ZXN0YCBhbHdheXMgcnVucyBvbiB0aGUgaG9zdCAobm8gRG9ja2VyKS4KCiMjIENvcmUgcnVsZXMgeW91IG11c3QgaW50ZXJuYWxpemUKClRoZXNlIHNpeCBydWxlcyBwcmV2ZW50IDkwJSBvZiBjb21waWxlIGVycm9yczoKCjEuICoqUGFyZW50aGVzZXMgZXZlcnl3aGVyZS4qKiBEZWZpbml0aW9ucyBhbmQgY2FsbCBzaXRlcyBib3RoIHJlcXVpcmUgYCgpYCwgZXZlbiB3aXRoIHplcm8gYXJndW1lbnRzOiBgd29ya2Zsb3cgZGVmYXVsdCgpIHsg4oCmIH1gLCBgcnVuIHNldHVwKClgLCBgZW5zdXJlIGNoZWNrKClgLiBCYXJlIGBydW4gc2V0dXBgIGlzIGEgcGFyc2UgZXJyb3IuCjIuICoqQWxsIGNhcHR1cmVzIHVzZSBgY29uc3RgLCBhbmQgYWxsIGJpbmRpbmdzIGFyZSBpbW11dGFibGUuKiogYGNvbnN0IHggPSBydW4gZm9vKClgIOKAlCBuZXZlciBgeCA9IHJ1biBmb28oKWAsIG5ldmVyIHJlYmluZCBgeGAgbGF0ZXIsIG5ldmVyIHNoYWRvdyBhIHBhcmFtZXRlciB3aXRoIGEgYGNvbnN0YCBvZiB0aGUgc2FtZSBuYW1lLgozLiAqKkNhbGwga2V5d29yZCBtdXN0IG1hdGNoIGNhbGxlZSB0eXBlLioqIGBlbnN1cmVgIOKGkiBydWxlcyBvbmx5LiBgcnVuYCDihpIgd29ya2Zsb3dzIGFuZCBzY3JpcHRzIChpbnNpZGUgYSB3b3JrZmxvdyk7IHNjcmlwdHMgKipvbmx5KiogKGluc2lkZSBhIHJ1bGUpLiBNaXhpbmcgdGhlbSBpcyBgRV9WQUxJREFURWAuCjQuICoqU2hlbGwgbGl2ZXMgaW4gc2NyaXB0cy4qKiBSdWxlcyByZWplY3QgcmF3IHNoZWxsIGxpbmVzIGVudGlyZWx5LiBXb3JrZmxvd3MgdGVjaG5pY2FsbHkgYWxsb3cgaW5saW5lIHNoZWxsIGxpbmVzLCBidXQgeW91IHNob3VsZCBub3Qgd3JpdGUgdGhlbSDigJQgdXNlIGEgbmFtZWQgYHNjcmlwdGAgb3IgYW4gaW5saW5lIHNjcmlwdCAoYGAgcnVuIGBjbWRgKCkgYGApLiBTaGVsbCBvcGVyYXRvcnMgbmV4dCB0byBtYW5hZ2VkIGNhbGxzIChgcnVuIGZvbygpIHwgZ3JlcCB4YCwgYHJ1biBmb28oKSA+IGZpbGVgLCBgcnVuIGZvbygpICZgKSBhcmUgcGFyc2UgZXJyb3JzLgo1LiAqKkludGVycG9sYXRpb24gaXMgYCR7bmFtZX1gIG9ubHkuKiogTm8gYCRuYW1lYCBpbiBvcmNoZXN0cmF0aW9uIHN0cmluZ3MsIG5vIGAkKOKApilgLCBubyBgJHt2YXI6LWRlZmF1bHR9YCwgbm8gYCR7dmFyLy94L3l9YC4gVGhvc2Ugc2hlbGwgZm9ybXMgYXJlIHZhbGlkICppbnNpZGUgc2NyaXB0IGJvZGllcyogb25seS4KNi4gKipBcmd1bWVudHMgYXJlIG5vdCBmb3J3YXJkZWQgaW1wbGljaXRseS4qKiBJZiBgd29ya2Zsb3cgZGVmYXVsdCh0YXNrKWAgY2FsbHMgYHJ1biBpbXBsZW1lbnQoKWAsIHRoZSBpbXBsZW1lbnQgd29ya2Zsb3cgZG9lcyBub3Qgc2VlIGB0YXNrYC4gUGFzcyBpdDogYHJ1biBpbXBsZW1lbnQodGFzaylgLgoKIyMgU3ludGF4IHJlZmVyZW5jZQoKIyMjIEZpbGUgbGF5b3V0CgpUb3AtbGV2ZWwgZm9ybXMsIGluIGNvbnZlbnRpb25hbCBvcmRlciAoYGphaXBoIGZvcm1hdGAgaG9pc3RzIGBpbXBvcnRgLCBgY29uZmlnYCwgYW5kIGBjaGFubmVsYCB0byB0aGUgdG9wKToKCmBgYGphaXBoCmltcG9ydCAiaGVscGVycy5qaCIgYXMgaGVscGVycyAgICAgICAgICAjIG1vZHVsZSBpbXBvcnQgKHJlbGF0aXZlOyAuamggYXBwZW5kZWQgaWYgb21pdHRlZCkKaW1wb3J0IHNjcmlwdCAiLi90b29sLnB5IiBhcyB0b29sICAgICAgICMgZXh0ZXJuYWwgc2NyaXB0IGZpbGUsIGNhbGxhYmxlIHdpdGggcnVuIHRvb2woYXJncykKY29uZmlnIHsgYWdlbnQuYmFja2VuZCA9ICJjbGF1ZGUiIH0gICAgICMgb3B0aW9uYWwsIGF0IG1vc3Qgb25lIHBlciBmaWxlCmNoYW5uZWwgZmluZGluZ3MgLT4gYW5hbHlzdCAgICAgICAgICAgICAjIGNoYW5uZWxzICsgb3B0aW9uYWwgcm91dGVzLCB0b3AgbGV2ZWwgb25seQpjb25zdCBWRVJTSU9OID0gIjEuMCIgICAgICAgICAgICAgICAgICAgIyBtb2R1bGUtc2NvcGVkIGltbXV0YWJsZSBzdHJpbmcKc2NyaXB0IGJ1aWxkID0gYG5wbSBydW4gYnVpbGRgICAgICAgICAgICMgc2hlbGwgZGVmaW5pdGlvbnMKcnVsZSB0ZXN0c19wYXNzKCkgeyBydW4gcnVuX3Rlc3RzKCkgfSAgICMgY2hlY2tzCndvcmtmbG93IGRlZmF1bHQoKSB7IOKApiB9ICAgICAgICAgICAgICAgICMgb3JjaGVzdHJhdGlvbjsgZGVmYXVsdCA9IHRoZSBlbnRyeXBvaW50CmBgYAoKQ2hhbm5lbHMsIHJ1bGVzLCB3b3JrZmxvd3MsIHNjcmlwdHMsIHNjcmlwdC1pbXBvcnQgYWxpYXNlcywgYW5kIG1vZHVsZSBgY29uc3RgIHNoYXJlICoqb25lIG5hbWVzcGFjZSBwZXIgbW9kdWxlKiog4oCUIGR1cGxpY2F0ZSB0b3AtbGV2ZWwgbmFtZXMgYXJlIGBFX1BBUlNFYDsgZHVwbGljYXRlIGltcG9ydCBhbGlhc2VzIGFyZSBgRV9WQUxJREFURWAuIENvbW1lbnRzIGFyZSBmdWxsLWxpbmUgYCNgIG9ubHkuCgoqKkltcG9ydHM6KiogcGF0aHMgcmVzb2x2ZSByZWxhdGl2ZSB0byB0aGUgaW1wb3J0aW5nIGZpbGU7IGlmIG5vdCBmb3VuZCBhbmQgdGhlIHBhdGggY29udGFpbnMgYC9gLCBpdCBmYWxscyBiYWNrIHRvIGA8d29ya3NwYWNlPi8uamFpcGgvbGlicy88bGliPi88cGF0aD4uamhgIChpbnN0YWxsZWQgdmlhIGBqYWlwaCBpbnN0YWxsYCkuIFJlZmVyZW5jZSBpbXBvcnRlZCBzeW1ib2xzIGFzIGBhbGlhcy5uYW1lYC4gSWYgYSBtb2R1bGUgdXNlcyBgZXhwb3J0YCBvbiBhbnkgZGVjbGFyYXRpb24sIG9ubHkgZXhwb3J0ZWQgbmFtZXMgYXJlIHZpc2libGUgdG8gaW1wb3J0ZXJzOyB3aXRoIHplcm8gYGV4cG9ydGBzLCBldmVyeXRoaW5nIGlzIHB1YmxpYy4KCiMjIyBTdHJpbmdzIGFuZCBpbnRlcnBvbGF0aW9uCgotIGAic2luZ2xlIGxpbmUiYCDigJQgZG91YmxlIHF1b3RlcyBvbmx5OyBzaW5nbGUgcXVvdGVzIGFyZSBwYXJzZSBlcnJvcnMuIEVzY2FwZXM6IGBcImAsIGBcXGAsIGBcbmAsIGBcdGAuCi0gYCIiIuKApiIiImAg4oCUIG11bHRpbGluZS4gT3BlbmluZyBgIiIiYCBlbmRzIGl0cyBsaW5lOyBjbG9zaW5nIGAiIiJgIGlzIG9uIGl0cyBvd24gbGluZS4KLSBBIGRvdWJsZS1xdW90ZWQgc3RyaW5nIHNwYW5uaW5nIG11bHRpcGxlIGxpbmVzIGlzIHJlamVjdGVkIOKAlCB1c2UgYCIiImAuCgpJbnNpZGUgYW55IG9yY2hlc3RyYXRpb24gc3RyaW5nOgoKfCBGb3JtIHwgTWVhbmluZyB8CnwtLS18LS0tfAp8IGAke25hbWV9YCB8IFZhbHVlIG9mIGEgYGNvbnN0YCwgY2FwdHVyZSwgb3IgcGFyYW1ldGVyIGluIHNjb3BlICh1bmtub3duIG5hbWVzIGFyZSBjb21waWxlIGVycm9ycykgfAp8IGAke25hbWUuZmllbGR9YCB8IEZpZWxkIG9mIGEgdHlwZWQtcHJvbXB0IGNhcHR1cmUgKGNvbXBpbGUtY2hlY2tlZCBhZ2FpbnN0IHRoZSBzY2hlbWEpIHwKfCBgJHtydW4gcmVmKGFyZ3MpfWAgLyBgJHtlbnN1cmUgcmVmKGFyZ3MpfWAgfCBJbmxpbmUgbWFuYWdlZCBjYWxsOyBpdHMgb3V0cHV0IGlzIHNwbGljZWQgaW4uIE5vIG5lc3RpbmcuIHwKfCBgJHtKQUlQSF9XT1JLU1BBQ0V9YCBldGMuIHwgRmFsbHMgYmFjayB0byBwcm9jZXNzIGVudmlyb25tZW50IHdoZW4gbm8gd29ya2Zsb3cgdmFyaWFibGUgbWF0Y2hlcyB8CgojIyMgU2NyaXB0cyDigJQgdGhlIHNoZWxsIGxheWVyCgpgYGBgamFpcGgKIyBzaW5nbGUtbGluZTogYmFja3RpY2tzLiBOTyBKYWlwaCAke25hbWV9IGhlcmUg4oCUIHBhc3MgZGF0YSBhcyAkMSwgJDIgYXJndW1lbnRzLgpzY3JpcHQgY291bnRfbGluZXMgPSBgd2MgLWwgPCAiJDEiYAoKIyBtdWx0aS1saW5lOiBmZW5jZWQgYmxvY2suIEJhc2ggJHvigKZ9IHBhc3NlcyB0aHJvdWdoIHRvIHRoZSBzaGVsbCB1bnRvdWNoZWQuCnNjcmlwdCBkZXBsb3kgPSBgYGAKc2V0IC1ldW8gcGlwZWZhaWwKZWNobyAiZGVwbG95aW5nICR7VEFSR0VUX0VOVjotc3RhZ2luZ30iCi4vZGVwbG95LnNoICIkMSIKYGBgCgojIHBvbHlnbG90OiBmZW5jZSB0YWcg4oaSICMhL3Vzci9iaW4vZW52IDx0YWc+LiBBbnkgdGFnIHdvcmtzLgpzY3JpcHQgcGFyc2VfanNvbiA9IGBgYHB5dGhvbjMKaW1wb3J0IGpzb24sIHN5cwpwcmludChqc29uLmxvYWQob3BlbihzeXMuYXJndlsxXSkpWyJ2ZXJzaW9uIl0pCmBgYApgYGBgCgpTY3JpcHQgc2VtYW50aWNzOgoKLSBCb2RpZXMgYXJlICoqb3BhcXVlKiogdG8gdGhlIGNvbXBpbGVyIOKAlCBmdWxsIHNoZWxsL1B5dGhvbi93aGF0ZXZlciwgaGVyZWRvY3MgaW5jbHVkZWQuIFRoZSBvbmUgY2hlY2s6IGRvIG5vdCBjYWxsIEphaXBoIHN5bWJvbHMgKGBydW5gLCBgZW5zdXJlYCwgd29ya2Zsb3cgbmFtZXMpIGZyb20gaW5zaWRlIGEgc2NyaXB0IGJvZHkgb3IgYCQo4oCmKWAuCi0gKipDYXB0dXJlID0gc3Rkb3V0LioqIGBjb25zdCB2ID0gcnVuIHBhcnNlX2pzb24oInBrZy5qc29uIilgIGJpbmRzIHRoZSBzY3JpcHQncyBzdGRvdXQuIFVzZSBgZWNob2AvYHByaW50ZmAgdG8gcmV0dXJuIGRhdGE7IHVzZSBleGl0IGNvZGVzIChgcmV0dXJuIE5gIC8gYGV4aXQgTmApIGZvciBwYXNzL2ZhaWwuCi0gKipBcmd1bWVudHMgYXJyaXZlIGFzIGAkMWAsIGAkMmAsIOKApioqIE1vZHVsZSBgY29uc3RgIHZhbHVlcyBhbmQgd29ya2Zsb3cgYmluZGluZ3MgYXJlICpub3QqIGV4cG9ydGVkIGludG8gdGhlIHN1YnByb2Nlc3MgZW52aXJvbm1lbnQg4oCUIHBhc3MgdGhlbSBleHBsaWNpdGx5IGFzIGFyZ3VtZW50cy4KLSBBbHRlcm5hdGl2ZWx5IGEgbWFudWFsIGAjIWAgc2hlYmFuZyBhcyB0aGUgZmlyc3QgYm9keSBsaW5lIHNlbGVjdHMgdGhlIGludGVycHJldGVyIChtdXR1YWxseSBleGNsdXNpdmUgd2l0aCBhIGZlbmNlIHRhZykuCi0gQSBuZXdsaW5lIGluc2lkZSBhIHNpbmdsZS1iYWNrdGljayBib2R5IGlzIGEgcGFyc2UgZXJyb3Ig4oCUIHVzZSBhIGZlbmNlZCBibG9jay4KCioqSW5saW5lIHNjcmlwdHMqKiBmb3Igb25lLW9mZiBjb21tYW5kcyDigJQgYm9keSBiZWZvcmUgdGhlIHBhcmVucywgYXJncyBpbnNpZGU6CgpgYGBgamFpcGgKcnVuIGBta2RpciAtcCAiJDEiYCgib3V0L3JlcG9ydHMiKQpjb25zdCBub3cgPSBydW4gYGRhdGUgKyVzYCgpCmNvbnN0IHN0YXRzID0gcnVuIGBgYHB5dGhvbjMKaW1wb3J0IHN5czsgcHJpbnQobGVuKHN5cy5hcmd2WzFdKSkKYGBgKGlucHV0X3RleHQpCmBgYGAKCklubGluZSBzY3JpcHRzIHdvcmsgaW4gYHJ1bmAsIGBjb25zdCDigKYgPSBydW5gLCBgcmV0dXJuIHJ1bmAsIGFuZCBgbG9nIHJ1bmAgcG9zaXRpb25zLiBUaGV5IGNhbm5vdCBiZSB1c2VkIHdpdGggYHJ1biBhc3luY2AuIEEgYHJ1bmAgc3RlcCB3aG9zZSBib2R5IGlzIGFuIGlubGluZSBzY3JpcHQgYWNjZXB0cyB0aGUgc2FtZSBvcHRpb25hbCBgY2F0Y2ggKG5hbWUpIDxib2R5PmAgLyBgcmVjb3ZlciAobmFtZSkgPGJvZHk+YCBzdWZmaXggYXMgYSBuYW1lZC1yZWYgYHJ1bmAgc3RlcCAoc2FtZSBzZW1hbnRpY3Mg4oCUIGBjYXRjaGAgcnVucyBvbmNlLCBgcmVjb3ZlcmAgcmV0cmllcyB1cCB0byBgcnVuLnJlY292ZXJfbGltaXRgLCBtdXR1YWxseSBleGNsdXNpdmUpLiBUaGUgb3RoZXIgaW5saW5lLXNjcmlwdCBwb3NpdGlvbnMgKGBjb25zdCDigKYgPSBydW5gLCBgcmV0dXJuIHJ1bmAsIGBsb2cgcnVuYCkgZG8gbm90IHRha2UgdGhvc2Ugc3VmZml4ZXMg4oCUIHdyYXAgaW4gYSBzdGFuZGFsb25lIGBydW5gIHN0ZXAuCgojIyMgV29ya2Zsb3cgc3RlcHMKCmBgYGphaXBoCndvcmtmbG93IHJlbGVhc2UodmVyc2lvbikgewogIGVuc3VyZSBnaXRfY2xlYW4oKSAgICAgICAgICAgICAgICAgICAgICAgICMgcnVuIGEgcnVsZQogIGNvbnN0IG5vdGVzID0gcnVuIGdlbl9ub3Rlcyh2ZXJzaW9uKSAgICAgICMgcnVuIGEgc2NyaXB0L3dvcmtmbG93LCBjYXB0dXJlCiAgcnVuIHB1Ymxpc2godmVyc2lvbiwgbm90ZXMpICAgICAgICAgICAgICAgIyBhcmdzOiBiYXJlIGlkZW50aWZpZXJzIGZvciB2YXJpYWJsZXMKICBsb2cgInB1Ymxpc2hlZCAke3ZlcnNpb259IiAgICAgICAgICAgICAgICAjIGluZm8gbGluZSBpbiB0aGUgcHJvZ3Jlc3MgdHJlZSAoc3Rkb3V0KQogIGxvZ2VyciAid2FybmluZzogc2xvdyByZWdpc3RyeSIgICAgICAgICAgICMgcmVkICEgbGluZSAoc3RkZXJyKQogIGFsZXJ0cyA8LSAicmVsZWFzZWQgJHt2ZXJzaW9ufSIgICAgICAgICAgICMgc2VuZCB0byBhIGNoYW5uZWwKICByZXR1cm4gbm90ZXMgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAjIHNldCB0aGlzIHdvcmtmbG93J3MgcmV0dXJuIHZhbHVlCn0KYGBgCgotICoqQ2FsbCBhcmd1bWVudHM6KiogcXVvdGVkIGxpdGVyYWxzIChgIm1haW4iYCksIGJhcmUgaWRlbnRpZmllcnMgZm9yIGluLXNjb3BlIHZhcmlhYmxlcyAoYHZlcnNpb25gIOKAlCBwcmVmZXJyZWQgc3R5bGUpLCBxdW90ZWQgaW50ZXJwb2xhdGlvbiB3aGVuIHRoZSB3aG9sZSBhcmd1bWVudCBpcyBvbmUgdmFyaWFibGUgKGAiJHt2ZXJzaW9ufSJgIOKAlCBhbHNvIGFjY2VwdGVkIHdoZW4gYHZlcnNpb25gIGlzIGluIHNjb3BlKSwgb3IgZXhwbGljaXQgbmVzdGVkIGNhbGxzIChgcnVuIG91dGVyKHJ1biBpbm5lcigpKWAsIGBydW4gb3V0ZXIoZW5zdXJlIGNoZWNrKCkpYCkuIEJhcmUgY2FsbCBzaGFwZXMgbGlrZSBgcnVuIG91dGVyKGlubmVyKCkpYCBhcmUgcmVqZWN0ZWQuIFN0cmluZ3MgbWl4aW5nIHRleHQgYW5kIGludGVycG9sYXRpb24gKGAidiR7dmVyc2lvbn0iYCkgYXJlIGZpbmUuCi0gKipBcml0eSBpcyBjaGVja2VkKiogd2hlbiB0aGUgY2FsbGVlIGRlY2xhcmVzIHBhcmFtZXRlcnM6IGBydW4gZ3JlZXQoImEiLCJiIilgIGFnYWluc3QgYHdvcmtmbG93IGdyZWV0KG5hbWUpYCBpcyBgRV9WQUxJREFURWAuCi0gKipgZmFpbCAicmVhc29uImAqKiBhYm9ydHMgd2l0aCBhIG5vbi16ZXJvIGV4aXQuICoqYHJldHVybmAqKiBhY2NlcHRzIGAic3RyaW5nImAsIGAiIiLigKYiIiJgLCBhIGJhcmUgaWRlbnRpZmllciwgYHJ1biByZWYoKWAgLyBgZW5zdXJlIHJlZigpYCwgYW4gaW5saW5lIHNjcmlwdCwgb3IgYSBgbWF0Y2hgIGV4cHJlc3Npb24uCi0gKipgbG9nYCAvIGBsb2dlcnJgKiogYWNjZXB0IGAic3RyaW5nImAsIGAiIiLigKYiIiJgLCBhIGJhcmUgaWRlbnRpZmllciAoYGxvZyBzdGF0dXNgIOKJoSBgbG9nICIke3N0YXR1c30iYCksIG9yIGBsb2cgcnVuIFxgY21kXGAoKWAuCgojIyMgUnVsZXMg4oCUIGNoZWNrcyBvbmx5CgpgYGBqYWlwaApydWxlIGJyYW5jaF9pcyhleHBlY3RlZCkgewogIHJ1biBgdGVzdCAiJChnaXQgYnJhbmNoIC0tc2hvdy1jdXJyZW50KSIgPSAiJDEiYChleHBlY3RlZCkKfQoKcnVsZSBwcmVjb25kaXRpb25zKCkgewogIGVuc3VyZSBicmFuY2hfaXMoIm1haW4iKQogIGVuc3VyZSBnaXRfY2xlYW4oKQp9CmBgYAoKQWxsb3dlZCBpbiBydWxlIGJvZGllczogYGVuc3VyZWAsIGBydW5gICgqKnNjcmlwdHMgb25seSoqKSwgYGNvbnN0YCwgYGlmYCwgYG1hdGNoYCwgYGZvcmAsIGBsb2dgL2Bsb2dlcnJgLCBgZmFpbGAsIGByZXR1cm5gLCBgY2F0Y2hgL2ByZWNvdmVyYCBzdWZmaXhlcy4gKipOb3QgYWxsb3dlZDoqKiBgcHJvbXB0YCwgY2hhbm5lbCBzZW5kcywgYHJ1biBhc3luY2AsIGBydW5gIHRvIGEgd29ya2Zsb3csIHJhdyBzaGVsbCBsaW5lcy4gQSBydWxlIHBhc3NlcyB3aGVuIGl0IGV4aXRzIDAuIFRyZWF0IHJ1bGVzIGFzIHJlYWQtb25seTogZG8gbXV0YXRpb25zIGluIHdvcmtmbG93cyBhbmQgc2NyaXB0cy4KCiMjIyBQcm9tcHRzIOKAlCBkZWxlZ2F0aW5nIHRvIGFuIGFnZW50CgpgYGBqYWlwaApwcm9tcHQgIlN1bW1hcml6ZSB0aGUgZGlmZiBpbiBvbmUgcGFyYWdyYXBoIiAgICAgICAgICAjIGZpcmUgYW5kIGZvcmdldApjb25zdCBhbnN3ZXIgPSBwcm9tcHQgIlN1bW1hcml6ZSB0aGUgZGlmZiIgICAgICAgICAgICAjIGNhcHR1cmUgdGhlIGFnZW50J3MgYW5zd2VyCgpjb25zdCBib2R5ID0gIlJldmlldyB0aGlzIHBsYW46ICR7cGxhbn0iCnByb21wdCBib2R5ICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICMgaWRlbnRpZmllciBmb3JtCgpjb25zdCByZXZpZXcgPSBwcm9tcHQgIiIiCllvdSBhcmUgcmV2aWV3aW5nIGEgcmVsZWFzZSBwbGFuLgpBcHByb3ZlIG9ubHkgaWYgYWxsIGNoZWNrcyBiZWxvdyBhcmUgYWRkcmVzc2VkLgpQbGFuOgoke3BsYW59CiIiIgpgYGAKCioqVHlwZWQgcHJvbXB0cyoqIGZvcmNlIHN0cnVjdHVyZWQgSlNPTiBvdXRwdXQgYW5kIGdpdmUgeW91IGZpZWxkIGFjY2VzczoKCmBgYGphaXBoCmNvbnN0IHIgPSBwcm9tcHQgIkFzc2VzcyB0aGlzIGNoYW5nZSIgcmV0dXJucyAieyB2ZXJkaWN0OiBzdHJpbmcsIHJpc2s6IHN0cmluZyB9Igpsb2cgInZlcmRpY3Q9JHtyLnZlcmRpY3R9IHJpc2s9JHtyLnJpc2t9IgojIGlmL21hdGNoIGFjY2VwdCBkb3Qgc3ViamVjdHMgb24gdHlwZWQgcHJvbXB0IGNhcHR1cmVzIOKAlCBubyByZWJpbmQgbmVlZGVkCmlmIHIudmVyZGljdCA9PSAicmVqZWN0IiB7CiAgZmFpbCAicmVqZWN0ZWQ6ICR7ci5yaXNrfSIKfQpgYGAKCi0gU2NoZW1hIGlzICoqZmxhdCoqLCB0eXBlcyBgc3RyaW5nYCB8IGBudW1iZXJgIHwgYGJvb2xlYW5gIG9ubHkuIENhcHR1cmUgKGBjb25zdCByID1gKSBpcyAqKnJlcXVpcmVkKiogd2l0aCBgcmV0dXJuc2AuCi0gVGhlIHJ1bnRpbWUgZXh0cmFjdHMgYW5kIHZhbGlkYXRlcyBKU09OIGZyb20gdGhlIGFnZW50J3MgcmVwbHk7IG9uIHNjaGVtYSBtaXNtYXRjaCB0aGUgc3RlcCBmYWlscy4gQWxsIGZpZWxkcyBhcmUgc3RvcmVkIGFzICoqc3RyaW5ncyoqIChhIGBudW1iZXJgIGZpZWxkIGhvbGRzIHRoZSB0ZXh0IGAiNDIiYCkuCi0gRm9yIGEgYCIiImAgcHJvbXB0LCBgcmV0dXJucyAi4oCmImAgZ29lcyBvbiB0aGUgY2xvc2luZy1gIiIiYCBsaW5lIG9yIHRoZSBsaW5lIGltbWVkaWF0ZWx5IGFmdGVyLgotIFRyaXBsZSAqKmJhY2t0aWNrcyoqIGluc2lkZSBwcm9tcHQgY29udGV4dCBhcmUgcmVqZWN0ZWQg4oCUIHRoZXkgYXJlIHNjcmlwdCBkZWxpbWl0ZXJzLiBVc2UgaW5kZW50YXRpb24gb3IgcXVvdGVzIGZvciBjb2RlIGluIHByb21wdCB0ZXh0LgoKQmFja2VuZCBpcyBjb25maWd1cmVkLCBub3QgcGVyLXByb21wdDogYGFnZW50LmJhY2tlbmRgID0gYGN1cnNvcmAgKGRlZmF1bHQpIHwgYGNsYXVkZWAgfCBgY29kZXhgLCBwbHVzIGBhZ2VudC5kZWZhdWx0X21vZGVsYCwgdmlhIGBjb25maWcgeyDigKYgfWAgb3IgYEpBSVBIX0FHRU5UXypgIGVudiB2YXJzIChlbnYgd2lucykuIE9uIHRoZSAqKmN1cnNvcioqIGJhY2tlbmQgb25seSwgYGFnZW50LmNvbW1hbmRgIGNhbiBwb2ludCBhdCBhIGN1c3RvbSBleGVjdXRhYmxlIChwcm9tcHQgb24gc3RkaW4sIGFuc3dlciBvbiBzdGRvdXQpOyBgY2xhdWRlYCBhbmQgYGNvZGV4YCBpZ25vcmUgYGFnZW50LmNvbW1hbmRgLgoKKipXcml0ZSBwcm9tcHRzIGxpa2UgdGFzayBicmllZnM6Kiogc3RhdGUgdGhlIGdvYWwsIHRoZSBjb25zdHJhaW50cywgdGhlIGFjY2VwdGFuY2UgY3JpdGVyaWEsIGFuZCB3aGF0IHRvIG91dHB1dC4gSW50ZXJwb2xhdGUgY29uY3JldGUgY29udGV4dCAoYCR7dGFza31gLCBgJHtkaWZmfWAsIGNhcHR1cmVkIGZpbGUgY29udGVudHMpIHJhdGhlciB0aGFuIGFza2luZyB0aGUgYWdlbnQgdG8gZ28gZmluZCBpdC4KCiMjIyBGYWlsdXJlIGhhbmRsaW5nOiBgY2F0Y2hgIGFuZCBgcmVjb3ZlcmAKCmBgYGphaXBoCiMgY2F0Y2gg4oCUIHJ1bnMgT05DRSBvbiBmYWlsdXJlLCB0aGVuIGNvbnRpbnVlcwpydW4gZGVwbG95KGVudikgY2F0Y2ggKGVycikgewogIGxvZ2VyciAiZGVwbG95IGZhaWxlZDogJHtlcnJ9IgogIHJ1biByb2xsYmFjayhlbnYpCn0KCiMgcmVjb3ZlciDigJQgcmVwYWlyLWFuZC1SRVRSWSBsb29wOiBydW4gdGFyZ2V0IOKGkiBvbiBmYWlsdXJlIHJ1biBib2R5IOKGkiByZXRyeSB0YXJnZXQKcnVuIHRlc3RzKCkgcmVjb3ZlciAoZXJyKSB7CiAgcHJvbXB0ICJUZXN0cyBmYWlsZWQuIEZpeCB0aGUgY29kZS4gRmFpbHVyZSBvdXRwdXQ6ICR7ZXJyfSIKfQpgYGAKCi0gVGhlIGJpbmRpbmcgKGBlcnJgKSByZWNlaXZlcyB0aGUgbWVyZ2VkIHN0ZG91dCtzdGRlcnIgb2YgdGhlIGZhaWxlZCBleGVjdXRpb24uIEV4YWN0bHkgb25lIGJpbmRpbmcsIGFsd2F5cyBpbiBwYXJlbnRoZXNlcyDigJQgYmFyZSBgY2F0Y2gge2AgaXMgYSBwYXJzZSBlcnJvci4KLSBgY2F0Y2hgIHdvcmtzIG9uIGBlbnN1cmVgIGFuZCBgcnVuYDsgYHJlY292ZXJgIHdvcmtzIG9uIGBydW5gIChhbmQgYHJ1biBhc3luY2ApIG9ubHkuIFRoZXkgYXJlIG11dHVhbGx5IGV4Y2x1c2l2ZSBvbiBvbmUgc3RlcC4KLSBgcmVjb3ZlcmAgcmV0cmllcyB1bnRpbCBzdWNjZXNzIG9yIGBydW4ucmVjb3Zlcl9saW1pdGAgKGRlZmF1bHQgKioxMCoqOyB3b3JrZmxvdy1sZXZlbCBjb25maWcgb3ZlcnJpZGVzIG1vZHVsZS1sZXZlbCkuCi0gQSBjb21tb24gcGF0dGVybjogYSBgY2F0Y2hgIHdob3NlIGJvZHkgaXMgdGhlICJlbHNlIGJyYW5jaCIg4oCUIG5vdGUgYHJldHVybmAgaW5zaWRlIGEgY2F0Y2ggYm9keSByZXR1cm5zIGZyb20gdGhlICoqZW5jbG9zaW5nIHdvcmtmbG93KiouCgpgcmVjb3ZlcmAgKyBgcHJvbXB0YCBpcyBKYWlwaCdzIHNpZ25hdHVyZSBsb29wIGZvciByZXBldGl0aXZlIGFnZW50IHdvcms6ICpjaGVjayDihpIgaWYgYnJva2VuLCBhc2sgYWdlbnQgdG8gZml4IOKGkiByZS1jaGVjayosIGZ1bGx5IHVuYXR0ZW5kZWQuCgojIyMgQ29udHJvbCBmbG93OiBgaWZgLCBgbWF0Y2hgLCBgZm9yYAoKYGBgamFpcGgKaWYgc3RhdHVzID09ICJvayIgeyBsb2cgImhlYWx0aHkiIH0gICAgICAgIyBvcGVyYXRvcnM6ID09ICE9ID1+ICF+CmlmIG1zZyA9fiAvRVJST1J8RkFUQUwvIHsgZmFpbCAiYmFkIiB9ICAgICMgPX4gLyAhfiB0YWtlIC9yZWdleC8KCmNvbnN0IGxhYmVsID0gbWF0Y2ggc3RhdHVzIHsgICAgICAgICAgICAgICMgc3RhdGVtZW50LCBleHByZXNzaW9uLCBvciByZXR1cm4gZm9ybQogICJvayIgPT4gInN1Y2Nlc3MiCiAgL153YXJuLyA9PiAid2FybmluZyIKICBfID0+ICJ1bmtub3duIgp9Cgpmb3IgcGF0aCBpbiBwYXRocyB7ICAgICAgICAgICAgICAgICAgICAgICAjIGl0ZXJhdGVzIExJTkVTIG9mIHRoZSBzdHJpbmcgYHBhdGhzYAogIHJ1biBwcm9jZXNzKHBhdGgpCn0KYGBgCgotIFN1YmplY3RzIGZvciBgaWZgIGFuZCBgbWF0Y2hgIGFyZSBiYXJlIGlkZW50aWZpZXJzIChgaWYgc3RhdHVzID09IOKApmAsIGBtYXRjaCBzdGF0dXMge2ApIG9yIGBJREVOVC5JREVOVGAgcmVhZGluZyBhIGZpZWxkIGZyb20gYSB0eXBlZCBwcm9tcHQgY2FwdHVyZSAoYGlmIHIudmVyZGljdCA9PSAib2siYCwgYG1hdGNoIHIudmVyZGljdCB7IOKApiB9YCkuIGAkc3RhdHVzYCAvIGAke3N0YXR1c31gIGFzIHN1YmplY3QgaXMgc3RpbGwgYSBwYXJzZSBlcnJvci4gRG90IHN1YmplY3RzIG9uIGEgbm9uLXR5cGVkLWNhcHR1cmUgdmFyaWFibGUsIG9yIGEgZmllbGQgbm90IGluIHRoZSBwcm9tcHQncyBgcmV0dXJuc2Agc2NoZW1hLCBnZXQgdGhlIHNhbWUgYEVfVkFMSURBVEVgIGVycm9ycyBhcyBgJHt2YXIuZmllbGR9YCBpbnRlcnBvbGF0aW9uLiBgZm9yYCBpdGVyYXRvcnMgc3RheSBiYXJlIGlkZW50aWZpZXJzIChgZm9yIHggaW4gbGluZXNgKS4KLSBgaWZgIHN1cHBvcnRzIGFuIG9wdGlvbmFsIGBlbHNlYCBicmFuY2gg4oCUIGB9IGVsc2Uge2AgbXVzdCBiZSBvbiAqKnRoZSBzYW1lIGxpbmUqKiBhcyB0aGUgY2xvc2luZyBgfWAgb2YgdGhlIGBpZmAgYm9keS4gKipObyBgZWxzZSBpZmAgY2hhaW5pbmcqKjogbmVzdCBhbiBgaWZgIGluc2lkZSB0aGUgYGVsc2VgIGJsb2NrLCBvciB1c2UgYG1hdGNoYCBmb3IgbXVsdGktd2F5IGJyYW5jaGluZy4KLSBgbWF0Y2hgOiBhcm1zIGFyZSBuZXdsaW5lLXNlcGFyYXRlZCAobm8gY29tbWFzKSwgZmlyc3QgbWF0Y2ggd2lucywgZXhhY3RseSBvbmUgYF9gIGFybSByZXF1aXJlZC4gQXJtIGJvZGllczogc3RyaW5nLCBgIiIi4oCmIiIiYCwgaW4tc2NvcGUgaWRlbnRpZmllciwgYCR7dmFyfWAsIGBmYWlsICLigKYiYCwgYHJ1biByZWYoKWAsIGBlbnN1cmUgcmVmKClgLiAqKk5vdCoqIGFsbG93ZWQgaW4gYXJtczogYHJldHVybmAgKHdyaXRlIGByZXR1cm4gbWF0Y2ggeCB7IOKApiB9YCksIGBsb2dgL2Bsb2dlcnJgLCBpbmxpbmUgc2NyaXB0cyDigJQgY2FwdHVyZSB0aGUgbWF0Y2ggcmVzdWx0IGludG8gYSBgY29uc3RgIGFuZCBhY3Qgb24gaXQgYWZ0ZXIuCi0gYGZvcmAgc3BsaXRzIHRoZSBzb3VyY2Ugc3RyaW5nIG9uIG5ld2xpbmVzIChhIHRyYWlsaW5nIGZpbmFsIG5ld2xpbmUgZG9lcyBub3QgcHJvZHVjZSBhbiBlbXB0eSBpdGVyYXRpb24pLiBUaGVyZSBpcyBubyBudW1lcmljL3doaWxlIGxvb3Ag4oCUIGl0ZXJhdGUgbGluZXMsIHVzZSBgcmVjb3ZlcmAsIG9yIHVzZSByZWN1cnNpdmUgd29ya2Zsb3dzIChkZXB0aCBsaW1pdCAyNTYpLgoKIyMjIENoYW5uZWxzIOKAlCBmYW4tb3V0IGJldHdlZW4gd29ya2Zsb3dzCgpgYGBqYWlwaApjaGFubmVsIGZpbmRpbmdzIC0+IGFuYWx5c3QsIHJldmlld2VyICAgICAjIHJvdXRlcyBkZWNsYXJlZCBhdCBUT1AgTEVWRUwgb25seQoKd29ya2Zsb3cgc2Nhbm5lcigpIHsKICBmaW5kaW5ncyA8LSAiRm91bmQgMyBpc3N1ZXMgaW4gYXV0aCIgICAgIyBSSFM6ICJsaXRlcmFsIiwgIiIiYmxvY2siIiIsICR7dmFyfSwgb3IgcnVuIHJlZigpCn0KCndvcmtmbG93IGFuYWx5c3QobWVzc2FnZSwgY2hhbiwgc2VuZGVyKSB7ICMgcm91dGUgdGFyZ2V0cyBkZWNsYXJlIEVYQUNUTFkgMyBwYXJhbXMKICBsb2cgImZyb20gJHtzZW5kZXJ9OiAke21lc3NhZ2V9Igp9Cgp3b3JrZmxvdyBkZWZhdWx0KCkgewogIHJ1biBzY2FubmVyKCkgICAgICAgICAgICAgICAgICAgICAgICAgICAjIGRpc3BhdGNoIGhhcHBlbnMgQUZURVIgc3RlcHMgZmluaXNoCn0KYGBgCgpTZW5kcyBlbnF1ZXVlIGluIG1lbW9yeTsgdGhlIHF1ZXVlIGRyYWlucyBhZnRlciB0aGUgb3duaW5nIHdvcmtmbG93J3Mgc3RlcHMgY29tcGxldGUsIGNhbGxpbmcgZWFjaCB0YXJnZXQgc2VxdWVudGlhbGx5LiBBIGAtPmAgaW5zaWRlIGEgd29ya2Zsb3cgYm9keSBpcyBhIHBhcnNlIGVycm9yLiBTZW5kcyBvbiBhIGNoYW5uZWwgd2l0aCBubyByb3V0ZSBhcmUgc2lsZW50bHkgZHJvcHBlZC4gRWFjaCB3b3JrZmxvdyBmcmFtZSBtYXkgZHJhaW4gYXQgbW9zdCAqKjEwMDAqKiBtZXNzYWdlcyBiZWZvcmUgdGhlIHJ1bnRpbWUgYWJvcnRzIHRoZSBvd25pbmcgd29ya2Zsb3cgd2l0aCBgRV9JTkJPWF9ESVNQQVRDSF9MSU1JVGAgKG5hbWluZyB0aGUgY2hhbm5lbCB0aGF0IGhpdCB0aGUgY2FwKTsgb3ZlcnJpZGUgdmlhIGBKQUlQSF9JTkJPWF9NQVhfRElTUEFUQ0g9PHBvc2l0aXZlIGludD5gIG9ubHkgaWYgdGhlIGhpZ2ggdm9sdW1lIGlzIGludGVudGlvbmFsLiBSb3V0ZWQgcGF5bG9hZHMgYXJlIHBlcnNpc3RlZCB1bmRlciB0aGUgcnVuIGRpciBhcyBgaW5ib3gvTk5OLTxjaGFubmVsPi50eHRgLgoKIyMjIENvbmN1cnJlbmN5OiBgcnVuIGFzeW5jYAoKYGBgamFpcGgKd29ya2Zsb3cgZGVmYXVsdCgpIHsKICBjb25zdCBhID0gcnVuIGFzeW5jIGxpbnQoKSAgICAgICAgICAgICAjIHJldHVybnMgYSBoYW5kbGUgaW1tZWRpYXRlbHkKICBjb25zdCBiID0gcnVuIGFzeW5jIHVuaXRfdGVzdHMoKQogIGxvZyAibGludDogJHthfSIgICAgICAgICAgICAgICAgICAgICAgICMgZmlyc3QgcmVhbCByZWFkIGJsb2NrcyArIHJlc29sdmVzCiAgbG9nICJ0ZXN0czogJHtifSIKfSAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAjIHVucmVhZCBoYW5kbGVzIGFyZSBqb2luZWQgd2hlbiB0aGlzIHN0ZXAgbGlzdCBmaW5pc2hlcwpgYGAKCldvcmtmbG93cyBvbmx5IChyZWplY3RlZCBpbiBydWxlcyk7IG5vdCBjb21iaW5hYmxlIHdpdGggaW5saW5lIHNjcmlwdHMuIGBjYXRjaGAvYHJlY292ZXJgIGNvbXBvc2Ugd2l0aCBgcnVuIGFzeW5jYC4gVW5yZWFkIGhhbmRsZXMgYXJlIGpvaW5lZCBhdCB0aGUgZW5kIG9mIHRoZSAqKmN1cnJlbnQgc3RlcCBsaXN0KiogKHRoZSB3b3JrZmxvdyBib2R5LCBhbiBgaWZgL2BlbHNlYCBicmFuY2gsIG9yIGEgYGNhdGNoYC9gcmVjb3ZlcmAgYm9keSkgYmVmb3JlIGNvbnRyb2wgY29udGludWVzIOKAlCBjaGFubmVsIGRyYWlucyBydW4gb25seSBhZnRlciB0aGUgZW50cnkgd29ya2Zsb3cncyB0b3AtbGV2ZWwgbGlzdCBmaW5pc2hlcy4gRm9yIGNvbmN1cnJlbnQgKnNoZWxsKiwgdXNlIGAmYCArIGB3YWl0YCBpbnNpZGUgb25lIHNjcmlwdCBib2R5IGluc3RlYWQuCgojIyMgQ29uZmlnCgpgYGBqYWlwaApjb25maWcgewogIGFnZW50LmJhY2tlbmQgPSAiY2xhdWRlIiAgICAgICAgICAgICAgICMgY3Vyc29yIHwgY2xhdWRlIHwgY29kZXgKICBhZ2VudC5kZWZhdWx0X21vZGVsID0gImNsYXVkZS1zb25uZXQtNC02IgogIHJ1bi5yZWNvdmVyX2xpbWl0ID0gNSAgICAgICAgICAgICAgICAgICMgd29ya2Zsb3ctbGV2ZWwgY29uZmlnIGFsc28gaG9ub3JlZAogIHJ1bi5sb2dzX2RpciA9ICIuamFpcGgvcnVucyIKfQpgYGAKClByZWNlZGVuY2U6ICoqZW52aXJvbm1lbnQgPiB3b3JrZmxvdy1sZXZlbCBjb25maWcgPiBtb2R1bGUtbGV2ZWwgY29uZmlnID4gZGVmYXVsdHMqKi4gQSB3b3JrZmxvdyBib2R5IG1heSBvcGVuIHdpdGggaXRzIG93biBgY29uZmlnIHsg4oCmIH1gIChiZWZvcmUgYW55IHN0ZXBzOyBgYWdlbnQuKmAvYHJ1bi4qYCBrZXlzIG9ubHkpIHRvIG92ZXJyaWRlIHRoZSBtb2RlbCBvciBiYWNrZW5kIGZvciBqdXN0IHRoYXQgd29ya2Zsb3cuIERvY2tlciBvbi9vZmYgaXMgZW52LW9ubHkgKGBKQUlQSF9VTlNBRkVgLCBgSkFJUEhfRE9DS0VSX0VOQUJMRURgKTsgaW1hZ2UvbmV0d29yay90aW1lb3V0IGNvbWUgZnJvbSBgcnVudGltZS4qYCBrZXlzIG9yIGBKQUlQSF9ET0NLRVJfKmAuCgojIyBDb21waWxlIGVycm9ycyB5b3Ugd2lsbCBzZWUsIGFuZCB0aGUgZml4Cgp8IEVycm9yIChhYnJpZGdlZCkgfCBGaXggfAp8LS0tfC0tLXwKfCBgRV9QQVJTRWAgbWlzc2luZyBgKClgIG9uIGRlZmluaXRpb24vY2FsbCB8IEFkZCBwYXJlbnRoZXNlczogYHdvcmtmbG93IGRlZmF1bHQoKWAsIGBydW4gc2V0dXAoKWAgfAp8IGBFX1BBUlNFYCBhc3NpZ25tZW50IHdpdGhvdXQgYGNvbnN0YCB8IGBjb25zdCB4ID0gcnVuIGZvbygpYCB8CnwgYEVfVkFMSURBVEVgIGNhbm5vdCByZWJpbmQgaW1tdXRhYmxlIG5hbWUgfCBSZW5hbWUgdGhlIG5ldyBiaW5kaW5nIOKAlCBub3RoaW5nIGlzIHJlYXNzaWduYWJsZSB8CnwgYEVfVkFMSURBVEVgIGBlbnN1cmVgIG9uIG5vbi1ydWxlIC8gYHJ1bmAgb24gcnVsZSB8IE1hdGNoIGtleXdvcmQgdG8gY2FsbGVlOiBydWxlc+KGkmBlbnN1cmVgLCBzY3JpcHRzL3dvcmtmbG93c+KGkmBydW5gIHwKfCBgRV9WQUxJREFURWAgYHJ1bmAgdG8gd29ya2Zsb3cgaW5zaWRlIHJ1bGUgfCBSdWxlcyBtYXkgYHJ1bmAgc2NyaXB0cyBvbmx5OyByZXN0cnVjdHVyZSBvciBtb3ZlIHRvIGEgd29ya2Zsb3cgfAp8IGBFX1ZBTElEQVRFYCBpbmxpbmUgc2hlbGwgZm9yYmlkZGVuIGluIHJ1bGVzIHwgV3JhcCB0aGUgc2hlbGwgaW4gYSBgc2NyaXB0YCAobmFtZWQgb3IgaW5saW5lKSBhbmQgYHJ1bmAgaXQgfAp8IGBFX1BBUlNFYCBgJHvigKZ9YCBpbiBzaW5nbGUtYmFja3RpY2sgc2NyaXB0IHwgVXNlIGAkMWAvYCQyYCBhcmdzLCBvciBzd2l0Y2ggdG8gYSBmZW5jZWQgYGBgIGJsb2NrIHwKfCBgRV9WQUxJREFURWAgdW5rbm93biBpZGVudGlmaWVyIC8gdW5rbm93biBgJHtuYW1lfWAgfCBEZWNsYXJlIGl0IChgY29uc3RgL3BhcmFtKSBiZWZvcmUgdXNlOyBjaGVjayBzcGVsbGluZyB8CnwgYEVfVkFMSURBVEVgIG5lc3RlZCBjYWxsIG11c3QgYmUgZXhwbGljaXQgfCBgcnVuIGYocnVuIGcoKSlgLCBub3QgYHJ1biBmKGcoKSlgIHwKfCBgRV9WQUxJREFURWAgZHVwbGljYXRlIGltcG9ydCBhbGlhcyB8IFVzZSBhIHVuaXF1ZSBgYXNgIG5hbWUgZm9yIGVhY2ggYGltcG9ydGAgfAp8IGBFX1ZBTElEQVRFYCBhcml0eSBtaXNtYXRjaCB8IE1hdGNoIHRoZSBjYWxsZWUncyBkZWNsYXJlZCBwYXJhbWV0ZXIgY291bnQgfAp8IGBFX1BBUlNFYCByZWRpcmVjdGlvbiBhZnRlciBtYW5hZ2VkIGNhbGwgfCBNb3ZlIHBpcGVzL3JlZGlyZWN0cyBpbnRvIGEgc2NyaXB0IGJvZHkgfAp8IGBFX1ZBTElEQVRFYCBzY3JpcHRzIGFyZSBub3QgdmFsdWVzL3Byb21wdGFibGUgfCBTY3JpcHRzIGFyZW4ndCBzdHJpbmdzOiBkb24ndCBgY29uc3QgeCA9IHNjcmlwdE5hbWVgLCBgJHtzY3JpcHROYW1lfWAsIG9yIGBwcm9tcHQgc2NyaXB0TmFtZWAgfAp8IGBFX1BBUlNFYCBgLT5gIGluc2lkZSB3b3JrZmxvdyBib2R5IHwgTW92ZSB0aGUgcm91dGUgdG8gdGhlIHRvcC1sZXZlbCBgY2hhbm5lbGAgbGluZSB8CnwgYEVfUEFSU0VgIGBwcm9tcHQg4oCmIHJldHVybnNgIHdpdGhvdXQgY2FwdHVyZSB8IGBjb25zdCB4ID0gcHJvbXB0IOKApiByZXR1cm5zICLigKYiYCB8CnwgYEVfU0NIRU1BYCBpbnZhbGlkIHJldHVybnMgc2NoZW1hIHwgRmxhdCBgeyBmaWVsZDogc3RyaW5nfG51bWJlcnxib29sZWFuIH1gIG9ubHkgfAp8IGBFX0lNUE9SVF9OT1RfRk9VTkRgIHwgRml4IHRoZSBwYXRoIChyZWxhdGl2ZSB0byB0aGUgaW1wb3J0aW5nIGZpbGUpIG9yIGBqYWlwaCBpbnN0YWxsYCB0aGUgbGlicmFyeSB8CgojIyBSdW50aW1lIG1vZGVsICh3aGF0IGhhcHBlbnMgd2hlbiBpdCBydW5zKQoKLSBgamFpcGggcnVuIGZpbGUuamggYXJnc+KApmAgdmFsaWRhdGVzIHRoZSBpbXBvcnQgY2xvc3VyZSwgZW1pdHMgc2NyaXB0IGJvZGllcyBhcyBleGVjdXRhYmxlIGZpbGVzLCB0aGVuIGludGVycHJldHMgYHdvcmtmbG93IGRlZmF1bHRgIHdpdGggdGhlIGFyZ3MgYm91bmQgdG8gaXRzIG5hbWVkIHBhcmFtZXRlcnMuIFNjcmlwdHMgYWRkaXRpb25hbGx5IHNlZSBwb3NpdGlvbmFsIGFyZ3MgYXMgYCQxYCwgYCQyYC4KLSAqKlJ1biBkaXJlY3Rvcnk6KiogYC5qYWlwaC9ydW5zLzxVVEMtZGF0ZT4vPFVUQy10aW1lPi08ZmlsZT4vYCB3aXRoIG51bWJlcmVkIGBOTk5OTk4tPHN0ZXA+Lm91dGAvYC5lcnJgIHBlciBzdGVwICh3cml0dGVuIGluY3JlbWVudGFsbHkg4oCUIGB0YWlsIC1mYCB3b3JrcykgYW5kIGBydW5fc3VtbWFyeS5qc29ubGAsIG9uZSBKU09OIGV2ZW50IHBlciBsaW5lIChgV09SS0ZMT1dfU1RBUlQvRU5EYCwgYFNURVBfU1RBUlQvRU5EYCwgYExPR2AsIGBJTkJPWF8qYCwgYFBST01QVF8qYCkuIFdoZW4gZGVidWdnaW5nIGEgZmFpbGVkIHJ1biwgcmVhZCB0aGUgZmFpbHVyZSBmb290ZXIgdGhlIENMSSBwcmludHMsIHRoZW4gdGhlIHJlZmVyZW5jZWQgYC5lcnJgL2Aub3V0YCBmaWxlcy4KLSAqKlJldHVybiB2YWx1ZToqKiBpZiBgZGVmYXVsdGAgcmV0dXJucyBhIHN0cmluZywgdGhlIENMSSBwcmludHMgaXQgdG8gc3Rkb3V0IGFmdGVyIHRoZSBQQVNTIGxpbmUuCi0gKipDYXB0dXJlIHNvdXJjZXM6Kiogd29ya2Zsb3cvcnVsZSDihpIgaXRzIGV4cGxpY2l0IGByZXR1cm5gIHZhbHVlOyBzY3JpcHQg4oaSIHN0ZG91dDsgcHJvbXB0IOKGkiB0aGUgYWdlbnQncyBhbnN3ZXIuCi0gU3RlcCBlbnZpcm9ubWVudDogc2NyaXB0cyBpbmhlcml0IHRoZSBydW5uZXIncyBlbnZpcm9ubWVudCBwbHVzIGBKQUlQSF9XT1JLU1BBQ0VgLCBgSkFJUEhfU0NSSVBUU2AsIGBKQUlQSF9SVU5fRElSYCwgYEpBSVBIX0FSVElGQUNUU19ESVJgLCBldGMuIFdvcmtmbG93IHZhcmlhYmxlcyBhcmUgKipub3QqKiBhdXRvLWV4cG9ydGVkIOKAlCBwYXNzIHRoZW0gYXMgYXJndW1lbnRzLgoKIyMgVGVzdGluZyB5b3VyIHdvcmtmbG93cwoKVGVzdCBmaWxlcyBhcmUgYCoudGVzdC5qaGAgbmV4dCB0byB5b3VyIG1vZHVsZXMsIHJ1biB3aXRoIGBqYWlwaCB0ZXN0YC4gVGhleSBleGVjdXRlIHRoZSBzYW1lIGludGVycHJldGVyIHdpdGggcHJvbXB0cyBhbmQgYm9kaWVzIG1vY2tlZCDigJQgbm8gbGl2ZSBMTE0gY2FsbHMuCgpgYGBqYWlwaAppbXBvcnQgIm1haW4uamgiIGFzIGFwcAoKdGVzdCAiaGFwcHkgcGF0aCIgewogIG1vY2sgcHJvbXB0ICJMR1RNIOKAlCBpbXBsZW1lbnRlZCIKICBjb25zdCBvdXQgPSBydW4gYXBwLmRlZmF1bHQoImFkZCBsb2dnaW5nIikKICBleHBlY3RfY29udGFpbiBvdXQgIkxHVE0iCn0KCnRlc3QgImZhaWx1cmUgcGF0aCBpcyBoYW5kbGVkIiB7CiAgbW9jayBwcm9tcHQgeyAvZml4LyA9PiAiZml4ZWQiLCBfID0+ICJub29wIiB9ICAgIyBjb250ZW50LWJhc2VkIGRpc3BhdGNoCiAgbW9jayBzY3JpcHQgYXBwLnJ1bl90ZXN0cygpIHsKICAgIGV4aXQgMQogIH0KICBjb25zdCBvdXQgPSBydW4gYXBwLmRlZmF1bHQoIngiKSBhbGxvd19mYWlsdXJlICAgIyBub24temVybyBleGl0IGRvZXNuJ3QgZmFpbCB0aGUgdGVzdAogIGV4cGVjdF9jb250YWluIG91dCAicm9sbGJhY2siCn0KYGBgCgotIE1vY2tzOiBgbW9jayBwcm9tcHQgIuKApiJgIChxdWV1ZWQsIG9uZSBwZXIgcHJvbXB0IGNhbGwpLCBgbW9jayBwcm9tcHQgeyAvcmUvID0+ICLigKYiLCBfID0+ICLigKYiIH1gLCBgbW9jayB3b3JrZmxvdyByZWYoKSB7IOKApiB9YCwgYG1vY2sgcnVsZSByZWYoKSB7IOKApiB9YCwgYG1vY2sgc2NyaXB0IHJlZigpIHsgc2hlbGwgbGluZXMgfWAuIEFsbCBtb2NrIHJlZnMgbmVlZCBgKClgLgotIEFzc2VydGlvbnM6IGBleHBlY3RfY29udGFpbmAsIGBleHBlY3Rfbm90X2NvbnRhaW5gLCBgZXhwZWN0X2VxdWFsYCDigJQgYGV4cGVjdF8qIDxjYXB0dXJlVmFyPiAibGl0ZXJhbCJgIG9yIGEgdGVzdC1ibG9jayBgY29uc3RgIG5hbWUuCi0gRm9yIHR5cGVkIHByb21wdHMsIHRoZSBtb2NrIHRleHQgbXVzdCBiZSBvbmUgbGluZSBvZiB2YWxpZCBKU09OIG1hdGNoaW5nIHRoZSBzY2hlbWEuCi0gTWl4aW5nIHF1ZXVlZCBgbW9jayBwcm9tcHQgIuKApiJgIC8gYG1vY2sgcHJvbXB0IDxjb25zdD5gIGFuZCBhIGBtb2NrIHByb21wdCB7IOKApiB9YCBibG9jayBpbiBvbmUgdGVzdCBpcyByZWplY3RlZCBhdCBjb21waWxlIHRpbWUgKGBFX1ZBTElEQVRFYDogYGNhbm5vdCBtaXggIm1vY2sgcHJvbXB0IHsg4oCmIH0iIHdpdGggcXVldWVkICJtb2NrIHByb21wdCDigKYiIGluIG9uZSB0ZXN0IGJsb2NrOyBjaG9vc2Ugb25lIHN0eWxlYCkuIFVzZSBvbmUgc3R5bGUgcGVyIGJsb2NrOyBzZXBhcmF0ZSB0ZXN0cyBpbiB0aGUgc2FtZSBmaWxlIG1heSB1c2UgZGlmZmVyZW50IHN0eWxlcy4KCldyaXRlIGF0IGxlYXN0IG9uZSB0ZXN0IHBlciB3b3JrZmxvdyB5b3UgYXV0aG9yIHdoZW4gdGhlIHJlcG8gdXNlcyB0ZXN0czsgbW9jayBldmVyeSBwcm9tcHQgc28gdGhlIHN1aXRlIGlzIGRldGVybWluaXN0aWMuCgojIyBQYXR0ZXJucyBmb3IgcmVwZXRpdGl2ZSB0YXNrcwoKKipHYXRlIOKGkiBkbyDihpIgdmVyaWZ5KiogKHRoZSBzdGFuZGFyZCBkZWxpdmVyeSBzaGFwZSk6CgpgYGBqYWlwaAp3b3JrZmxvdyBkZWZhdWx0KHRhc2spIHsKICBlbnN1cmUgcHJlY29uZGl0aW9ucygpICAgICAgICAgICMgZmFzdCBjaGVja3MgZmlyc3QKICBydW4gaW1wbGVtZW50KHRhc2spICAgICAgICAgICAgICMgcHJvbXB0LWRyaXZlbiB3b3JrCiAgcnVuIHZlcmlmeSgpIHJlY292ZXIgKGVycikgeyAgICAjIHZlcmlmaWNhdGlvbiB3aXRoIHNlbGYtcmVwYWlyCiAgICBwcm9tcHQgIlZlcmlmaWNhdGlvbiBmYWlsZWQg4oCUIGZpeCBpdC4gT3V0cHV0OiAke2Vycn0iCiAgfQp9CmBgYAoKKipQcm9jZXNzIGEgcXVldWUgb2YgaXRlbXMqKiAobGluZS1vcmllbnRlZCBgZm9yYCk6CgpgYGBqYWlwaAp3b3JrZmxvdyBkZWZhdWx0KCkgewogIGNvbnN0IGl0ZW1zID0gcnVuIGBscyBpbmJveC8qLm1kIDI+L2Rldi9udWxsIHx8IHRydWVgKCkKICBmb3IgaXRlbSBpbiBpdGVtcyB7CiAgICBydW4gaGFuZGxlKGl0ZW0pCiAgfQp9CmBgYAoKKipSZXZpZXctdGhlbi1hY3Qgd2l0aCBhIHR5cGVkIHZlcmRpY3Q6KioKCmBgYGphaXBoCndvcmtmbG93IHRyaWFnZShpdGVtKSB7CiAgY29uc3QgciA9IHByb21wdCAiSXMgdGhpcyByZWFkeSB0byBpbXBsZW1lbnQ/IEl0ZW06ICR7aXRlbX0iIHJldHVybnMgInsgdmVyZGljdDogc3RyaW5nLCByZWFzb246IHN0cmluZyB9IgogIGNvbnN0IG91dGNvbWUgPSBtYXRjaCByLnZlcmRpY3QgewogICAgInJlYWR5IiA9PiBydW4gaW1wbGVtZW50KGl0ZW0pCiAgICBfID0+ICJza2lwcGVkOiAke3IucmVhc29ufSIKICB9CiAgbG9nIG91dGNvbWUKfQpgYGAKCioqUGlwZWxpbmUgc3RhZ2VzIHZpYSBjaGFubmVscyoqIHdoZW4gbGF0ZXIgc3RhZ2VzIHNob3VsZCByZWFjdCB0byBlYXJsaWVyIG9uZXMgd2l0aG91dCBkaXJlY3QgY2FsbHMgKHNlZSB0aGUgY2hhbm5lbCBzZWN0aW9uIGFib3ZlKS4KCiMjIFdoYXQgdG8gcHJvZHVjZSBpbiBhIHJlcG9zaXRvcnkKCldoZW4gYXNrZWQgdG8gc2NhZmZvbGQgSmFpcGggYXV0b21hdGlvbiAoZS5nLiBhZnRlciBgamFpcGggaW5pdGApLCBidWlsZCBhIHNtYWxsIGNvbXBvc2FibGUgc2V0IHVuZGVyIGAuamFpcGgvYDoKCi0gYC5qYWlwaC9yZWFkaW5lc3MuamhgIOKAlCBwcmVmbGlnaHQgcnVsZXMgKHJlcXVpcmVkIHRvb2xzLCBjbGVhbiBnaXQpICsgYHdvcmtmbG93IGRlZmF1bHRgIHJ1bm5pbmcgdGhlbS4KLSBgLmphaXBoL3ZlcmlmaWNhdGlvbi5qaGAg4oCUIGxpbnQvdGVzdC9idWlsZCBydWxlcyArIGB3b3JrZmxvdyBkZWZhdWx0YC4KLSBgLmphaXBoL21haW4uamhgIOKAlCBpbXBvcnRzIGJvdGgsIGRlZmluZXMgdGhlIHByb21wdC1kcml2ZW4gYGltcGxlbWVudGAgd29ya2Zsb3csIGFuZCBhIGB3b3JrZmxvdyBkZWZhdWx0KHRhc2spYCB3aXJpbmcgKipwcmVmbGlnaHQg4oaSIGltcGxlbWVudCDihpIgdmVyaWZpY2F0aW9uKiouCi0gT3B0aW9uYWw6IGEgcmV2aWV3IHdvcmtmbG93IGdhdGluZyBhIHRhc2sgcXVldWUsIGAqLnRlc3QuamhgIHRlc3RzIGZvciB0aGUgd29ya2Zsb3dzLgoKS2VlcCB3b3JrZmxvd3Mgc2hvcnQ7IHB1dCBleHBlbnNpdmUgY2hlY2tzIGFmdGVyIGNoZWFwIG9uZXM7IHBhc3MgZGF0YSBleHBsaWNpdGx5LiBBbHdheXMgZmluaXNoIHdpdGggZm9ybWF0ICsgY29tcGlsZToKCmBgYGJhc2gKamFpcGggZm9ybWF0IC5qYWlwaC8qLmpoCmphaXBoIGNvbXBpbGUgLmphaXBoCmphaXBoIHRlc3QgICAgICAgICAgICAgICAgICAgICAgICMgc2FmZSBldmVuIHdoZW4gbm8gKi50ZXN0LmpoIGV4aXN0cyB5ZXQKamFpcGggcnVuIC5qYWlwaC9tYWluLmpoICJpbXBsZW1lbnQgZmVhdHVyZSBYIgpgYGAKCkVuZCB5b3VyIHNjYWZmb2xkaW5nIHJlc3BvbnNlIGJ5IHByaW50aW5nIHRob3NlIGV4YWN0IGNvbW1hbmRzIGZvciB0aGUgdXNlciwgcGx1cyBhIHNob3J0ICoqV0hBVCBDSEFOR0VEKiogLyAqKldIWSoqIHN1bW1hcnkuIENhbm9uaWNhbCBhZ2VudC1yZWFkYWJsZSBjb3B5IG9mIHRoaXMgc2tpbGw6IDxodHRwczovL3Jhdy5naXRodWJ1c2VyY29udGVudC5jb20vamFpcGhsYW5nL2phaXBoL3JlZnMvaGVhZHMvbWFpbi9kb2NzL2phaXBoLXNraWxsLm1kPi4K";
+
+export function decodeEmbeddedAsset(base64: string): string {
+  return Buffer.from(base64, "base64").toString("utf8");
+}
diff --git a/src/runtime/kernel/graph.ts b/src/runtime/kernel/graph.ts
index c2839db1..73022f0f 100644
--- a/src/runtime/kernel/graph.ts
+++ b/src/runtime/kernel/graph.ts
@@ -1,19 +1,9 @@
-import { readFileSync } from "node:fs";
 import { resolve } from "node:path";
-import { parsejaiph } from "../../parser";
+import { loadModuleGraph, type ModuleGraph, type ModuleNode } from "../../transpile/module-graph";
 import type { RuleDef, ScriptDef, WorkflowDef, WorkflowRefDef, RuleRefDef, jaiphModule } from "../../types";
-import { resolveImportPath } from "../../transpile/resolve";
 
-export interface RuntimeModuleNode {
-  filePath: string;
-  ast: jaiphModule;
-  imports: Map<string, string>;
-}
-
-export interface RuntimeGraph {
-  entryFile: string;
-  modules: Map<string, RuntimeModuleNode>;
-}
+export type RuntimeModuleNode = ModuleNode;
+export type RuntimeGraph = ModuleGraph;
 
 export interface ResolvedWorkflow {
   filePath: string;
@@ -30,41 +20,37 @@ export interface ResolvedScript {
   script: ScriptDef;
 }
 
-function buildNode(filePath: string, workspaceRoot?: string): RuntimeModuleNode {
-  const ast = parsejaiph(readFileSync(filePath, "utf8"), filePath);
-  const imports = new Map<string, string>();
-  for (const imp of ast.imports) {
-    imports.set(imp.alias, resolveImportPath(filePath, imp.path, workspaceRoot));
-  }
-  // Synthesise ScriptDef stubs for script imports so resolveScriptRef finds them.
-  if (ast.scriptImports) {
-    for (const si of ast.scriptImports) {
-      ast.scripts.push({
-        name: si.alias,
-        comments: [],
-        body: "",
-        bodyKind: "fenced",
-        loc: si.loc,
-      });
-    }
+/** Inject `ScriptDef` stubs for `import script` declarations so `resolveScriptRef` finds them. Idempotent. */
+function attachScriptImportStubs(ast: jaiphModule): void {
+  if (!ast.scriptImports) return;
+  for (const si of ast.scriptImports) {
+    if (ast.scripts.some((s) => s.name === si.alias)) continue;
+    ast.scripts.push({
+      name: si.alias,
+      comments: [],
+      body: "",
+      loc: si.loc,
+    });
   }
-  return { filePath, ast, imports };
 }
 
-export function buildRuntimeGraph(entryFile: string, workspaceRoot?: string): RuntimeGraph {
-  const entry = resolve(entryFile);
-  const modules = new Map<string, RuntimeModuleNode>();
-  const queue: string[] = [entry];
-  while (queue.length > 0) {
-    const current = queue.shift()!;
-    if (modules.has(current)) continue;
-    const node = buildNode(current, workspaceRoot);
-    modules.set(current, node);
-    for (const imported of node.imports.values()) {
-      if (!modules.has(imported)) queue.push(imported);
-    }
+/**
+ * Adapt a {@link ModuleGraph} for runtime dispatch by injecting `ScriptDef`
+ * stubs for `import script` declarations so `resolveScriptRef` lookups
+ * succeed for cross-module script imports. The injection mutates the AST
+ * in-place; the helper is idempotent so repeated calls are safe.
+ */
+export function buildRuntimeGraph(
+  source: string | ModuleGraph,
+  workspaceRoot?: string,
+): RuntimeGraph {
+  const graph = typeof source === "string"
+    ? loadModuleGraph(source, workspaceRoot)
+    : source;
+  for (const node of graph.modules.values()) {
+    attachScriptImportStubs(node.ast);
   }
-  return { entryFile: entry, modules };
+  return graph;
 }
 
 export function lookupWorkflow(graph: RuntimeGraph, fromFile: string, ref: WorkflowRefDef): WorkflowDef | null {
diff --git a/src/runtime/kernel/node-test-runner.test.ts b/src/runtime/kernel/node-test-runner.test.ts
index 8f276006..cc36d5bf 100644
--- a/src/runtime/kernel/node-test-runner.test.ts
+++ b/src/runtime/kernel/node-test-runner.test.ts
@@ -4,6 +4,7 @@ import { join } from "node:path";
 import { test } from "node:test";
 import assert from "node:assert/strict";
 import { runTestFile } from "./node-test-runner";
+import { loadModuleGraph } from "../../transpile/module-graph";
 import type { SourceLoc } from "../../types";
 
 const loc: SourceLoc = { line: 1, col: 1 };
@@ -35,7 +36,7 @@ test "block B" {
     // Before this change, buildRuntimeGraph would be called once per
     // test_run_workflow step (2 calls). After caching, it is called once.
     // We verify behavioral correctness: both blocks pass with the shared graph.
-    const exitCode = await runTestFile(testFile, dir, scriptsDir, [
+    const exitCode = await runTestFile(loadModuleGraph(testFile, dir), dir, scriptsDir, [
       {
         description: "block A", loc,
         steps: [{ type: "test_run_workflow" as const, workflowRef: "greet", args: [], loc }],
@@ -75,7 +76,7 @@ test "const drives mock and expect" {
 `,
     );
 
-    const exitCode = await runTestFile(testFile, dir, scriptsDir, [
+    const exitCode = await runTestFile(loadModuleGraph(testFile, dir), dir, scriptsDir, [
       {
         description: "const drives mock and expect", loc,
         steps: [
@@ -119,7 +120,7 @@ test "undefined const ref" {
 `,
     );
 
-    const exitCode = await runTestFile(testFile, dir, scriptsDir, [
+    const exitCode = await runTestFile(loadModuleGraph(testFile, dir), dir, scriptsDir, [
       {
         description: "undefined const ref", loc,
         steps: [
@@ -161,7 +162,7 @@ test "no implicit response" {
 `,
     );
 
-    const exitCode = await runTestFile(testFile, dir, scriptsDir, [
+    const exitCode = await runTestFile(loadModuleGraph(testFile, dir), dir, scriptsDir, [
       {
         description: "no implicit response", loc,
         steps: [
diff --git a/src/runtime/kernel/node-test-runner.ts b/src/runtime/kernel/node-test-runner.ts
index 4e7fd597..d6a52692 100644
--- a/src/runtime/kernel/node-test-runner.ts
+++ b/src/runtime/kernel/node-test-runner.ts
@@ -2,6 +2,7 @@ import { mkdtempSync, rmSync, readdirSync, readFileSync } from "node:fs";
 import { tmpdir } from "node:os";
 import { basename, join } from "node:path";
 import { buildRuntimeGraph, resolveWorkflowRef, resolveRuleRef, resolveScriptRef, type RuntimeGraph } from "./graph";
+import type { ModuleGraph } from "../../transpile/module-graph";
 import { NodeWorkflowRuntime, type MockBodyDef } from "./node-workflow-runtime";
 import type { MockPromptArm } from "./mock";
 import type { TestBlockDef, TestStepDef } from "../../types";
@@ -151,6 +152,14 @@ async function runTestBlock(
           JAIPH_RUNS_DIR: join(tmpDir, ".jaiph", "runs"),
           JAIPH_SCRIPTS: scriptsDir,
         };
+        // `jaiph test` is meant to be deterministic and fast: a prompt that
+        // returns non-zero (e.g. no matching mock arm) should fail the test
+        // immediately rather than wait through the production retry schedule
+        // (~2h41m). Tests that intentionally exercise the retry behaviour can
+        // override this by setting JAIPH_PROMPT_RETRY explicitly.
+        if (env.JAIPH_PROMPT_RETRY === undefined) {
+          env.JAIPH_PROMPT_RETRY = "0";
+        }
         if (mockArmsJson) {
           env.JAIPH_MOCK_PROMPT_ARMS_JSON = mockArmsJson;
           delete env.JAIPH_MOCK_RESPONSES_JSON;
@@ -256,11 +265,12 @@ async function runTestBlock(
 }
 
 export async function runTestFile(
-  testFileAbs: string,
+  moduleGraph: ModuleGraph,
   workspaceRoot: string,
   scriptsDir: string,
   blocks: TestBlockDef[],
 ): Promise<number> {
+  const testFileAbs = moduleGraph.entryFile;
   const bold = "\x1b[1m";
   const reset = "\x1b[0m";
   const red = "\x1b[31m";
@@ -291,12 +301,13 @@ export async function runTestFile(
 
   process.stdout.write(`${bold}testing${reset} ${displayName}\n`);
 
-  // Build the runtime graph once for the entire test file.
-  // The graph depends only on testFileAbs and its import closure, which are
-  // constant across all blocks and steps within a single runTestFile call.
-  // If a future test step mutates imported files on disk mid-run, a manual
-  // rebuild would be needed — but that is not a supported pattern today.
-  const graph = buildRuntimeGraph(testFileAbs, workspaceRoot);
+  // Build the runtime view of the already-loaded module graph once for the
+  // entire test file. The graph depends only on testFileAbs and its import
+  // closure, which are constant across all blocks and steps within a single
+  // runTestFile call. If a future test step mutates imported files on disk
+  // mid-run, a manual rebuild would be needed — but that is not a supported
+  // pattern today.
+  const graph = buildRuntimeGraph(moduleGraph, workspaceRoot);
 
   let total = 0;
   let failed = 0;
diff --git a/src/runtime/kernel/node-workflow-runner.ts b/src/runtime/kernel/node-workflow-runner.ts
index a3432c4a..025f7633 100644
--- a/src/runtime/kernel/node-workflow-runner.ts
+++ b/src/runtime/kernel/node-workflow-runner.ts
@@ -1,34 +1,54 @@
 import { basename, dirname, join } from "node:path";
 import { writeFileSync } from "node:fs";
+import { loadModuleGraph, readModuleGraph } from "../../transpile/module-graph";
 import { buildRuntimeGraph } from "./graph";
 import { NodeWorkflowRuntime } from "./node-workflow-runtime";
 
-function parseArgs(argv: string[]): {
+/**
+ * Internal argv marker dispatched from `main` (src/cli/index.ts) to route the
+ * remaining args here. Defined once so the CLI dispatcher and the spawn site
+ * in `workflow-launch.ts` cannot drift.
+ */
+export const WORKFLOW_RUNNER_ARG = "__workflow-runner";
+
+interface RunnerArgs {
   metaFile: string;
   sourceFile: string;
   builtScript: string;
   workflowName: string;
   runArgs: string[];
-} {
-  const metaFile = argv[2] ?? "";
-  const sourceFile = argv[3] ?? process.env.JAIPH_SOURCE_ABS ?? "";
-  const builtScript = argv[4] ?? "";
-  const workflowName = argv[5] ?? "default";
-  const runArgs = argv.slice(6);
+}
+
+function parseRunnerArgs(positional: string[]): RunnerArgs {
+  const metaFile = positional[0] ?? "";
+  const sourceFile = positional[1] ?? process.env.JAIPH_SOURCE_ABS ?? "";
+  const builtScript = positional[2] ?? "";
+  const workflowName = positional[3] ?? "default";
+  const runArgs = positional.slice(4);
   if (!metaFile || !sourceFile) {
     throw new Error("node-workflow-runner requires meta file and source file");
   }
   return { metaFile, sourceFile, builtScript, workflowName, runArgs };
 }
 
-async function main(): Promise<number> {
-  const { metaFile, sourceFile, builtScript, workflowName, runArgs } = parseArgs(process.argv);
+/**
+ * Run the workflow leader with the post-dispatch positional args
+ * `[metaFile, sourceFile, builtScript, workflowName, ...runArgs]`.
+ *
+ * Callable from `src/cli/index.ts` when the reserved `__workflow-runner` argv
+ * arrives, so the bun-compiled binary self-spawns into the runner without
+ * needing a separate `node-workflow-runner.js` script on disk.
+ */
+export async function runWorkflowRunner(positional: string[]): Promise<number> {
+  const { metaFile, sourceFile, builtScript, workflowName, runArgs } = parseRunnerArgs(positional);
   process.env.JAIPH_SOURCE_FILE = basename(sourceFile);
   if (!process.env.JAIPH_SCRIPTS && builtScript) {
     process.env.JAIPH_SCRIPTS = join(dirname(builtScript), "scripts");
   }
   const workspaceRoot = process.env.JAIPH_WORKSPACE || undefined;
-  const graph = buildRuntimeGraph(sourceFile, workspaceRoot);
+  const graphFile = process.env.JAIPH_MODULE_GRAPH_FILE;
+  const moduleGraph = graphFile ? readModuleGraph(graphFile) : loadModuleGraph(sourceFile, workspaceRoot);
+  const graph = buildRuntimeGraph(moduleGraph);
   const runtime = new NodeWorkflowRuntime(graph, { env: process.env, cwd: process.cwd() });
   const status = workflowName === "default" ? await runtime.runDefault(runArgs) : 1;
   writeFileSync(
@@ -40,7 +60,7 @@ async function main(): Promise<number> {
 }
 
 if (require.main === module) {
-  main()
+  runWorkflowRunner(process.argv.slice(2))
     .then((status) => process.exit(status))
     .catch((err) => {
       process.stderr.write(`jaiph node runner: ${err instanceof Error ? err.message : String(err)}\n`);
diff --git a/src/runtime/kernel/node-workflow-runtime.artifacts.test.ts b/src/runtime/kernel/node-workflow-runtime.artifacts.test.ts
index e0b83340..5d4c589f 100644
--- a/src/runtime/kernel/node-workflow-runtime.artifacts.test.ts
+++ b/src/runtime/kernel/node-workflow-runtime.artifacts.test.ts
@@ -194,6 +194,10 @@ test("NodeWorkflowRuntime: failed prompt preserves backend stderr in artifacts a
       JAIPH_AGENT_COMMAND: fakeAgent,
       JAIPH_AGENT_MODEL: "gpt-5.4",
       JAIPH_WORKSPACE: root,
+      // This test exercises single-attempt stderr capture; the prompt-retry
+      // backoff schedule (default 15s → 1m → 10m → 30m → 2h) is orthogonal
+      // and is covered by node-workflow-runtime.prompt-retry.test.ts.
+      JAIPH_PROMPT_RETRY: "0",
     };
     const runtime = new NodeWorkflowRuntime(graph, { env, cwd: root, suppressLiveEvents: true });
     const prevSummaryEnv = process.env.JAIPH_RUN_SUMMARY_FILE;
@@ -294,7 +298,7 @@ test("NodeWorkflowRuntime: ensure catch receives failure payload in catch scope
   }
 });
 
-test("NodeWorkflowRuntime: nested workflow inherits caller metadata scope (callee module config does not override)", async () => {
+test("NodeWorkflowRuntime: nested cross-module run applies callee module config and restores caller scope after", async () => {
   const root = mkdtempSync(join(tmpdir(), "jaiph-node-meta-nested-"));
   try {
     const childJh = join(root, "child.jh");
@@ -304,11 +308,11 @@ test("NodeWorkflowRuntime: nested workflow inherits caller metadata scope (calle
       childJh,
       [
         'config {',
-        '  agent.backend = "claude"',
+        '  agent.default_model = "model-b"',
         "}",
-        'script log_backend = `printf \'%s:%s\\n\' "$1" "$JAIPH_AGENT_BACKEND" >> "$JAIPH_META_SCOPE_FILE"`',
-        "workflow default() {",
-        '  run log_backend("child")',
+        'script log_model = `printf \'%s:%s\\n\' "$1" "$JAIPH_AGENT_MODEL" >> "$JAIPH_META_SCOPE_FILE"`',
+        "workflow show() {",
+        '  run log_model("child")',
         "}",
         "",
       ].join("\n"),
@@ -319,13 +323,13 @@ test("NodeWorkflowRuntime: nested workflow inherits caller metadata scope (calle
         'import "child.jh" as child',
         "",
         'config {',
-        '  agent.backend = "cursor"',
+        '  agent.default_model = "model-a"',
         "}",
-        'script log_backend = `printf \'%s:%s\\n\' "$1" "$JAIPH_AGENT_BACKEND" >> "$JAIPH_META_SCOPE_FILE"`',
+        'script log_model = `printf \'%s:%s\\n\' "$1" "$JAIPH_AGENT_MODEL" >> "$JAIPH_META_SCOPE_FILE"`',
         "workflow default() {",
-        '  run log_backend("parent_before")',
-        "  run child.default()",
-        '  run log_backend("parent_after")',
+        '  run log_model("parent_before")',
+        "  run child.show()",
+        '  run log_model("parent_after")',
         "}",
         "",
       ].join("\n"),
@@ -333,10 +337,10 @@ test("NodeWorkflowRuntime: nested workflow inherits caller metadata scope (calle
     const scriptsDir = join(root, "scripts");
     mkdirSync(scriptsDir, { recursive: true });
     writeFileSync(
-      join(scriptsDir, "log_backend"),
+      join(scriptsDir, "log_model"),
       [
         "#!/usr/bin/env bash",
-        'printf \'%s:%s\n\' "$1" "$JAIPH_AGENT_BACKEND" >> "$JAIPH_META_SCOPE_FILE"',
+        'printf \'%s:%s\n\' "$1" "$JAIPH_AGENT_MODEL" >> "$JAIPH_META_SCOPE_FILE"',
         "",
       ].join("\n"),
       { mode: 0o755 },
@@ -350,21 +354,161 @@ test("NodeWorkflowRuntime: nested workflow inherits caller metadata scope (calle
       JAIPH_SCRIPTS: scriptsDir,
       JAIPH_META_SCOPE_FILE: metaFile,
     };
-    delete env.JAIPH_AGENT_BACKEND;
-    delete env.JAIPH_AGENT_BACKEND_LOCKED;
+    delete env.JAIPH_AGENT_MODEL;
+    delete env.JAIPH_AGENT_MODEL_LOCKED;
 
     const runtime = new NodeWorkflowRuntime(graph, { env, cwd: root, suppressLiveEvents: true });
     const status = await runtime.runDefault([]);
     assert.equal(status, 0);
 
     const actual = readFileSync(metaFile, "utf8");
-    const expected = "parent_before:cursor\nchild:cursor\nparent_after:cursor\n";
+    const expected = "parent_before:model-a\nchild:model-b\nparent_after:model-a\n";
     assert.equal(actual, expected);
   } finally {
     rmSync(root, { recursive: true, force: true });
   }
 });
 
+test("NodeWorkflowRuntime: nested cross-module run applies callee workflow-level config over callee module-level config", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-node-meta-nested-wf-"));
+  try {
+    const childJh = join(root, "child.jh");
+    const parentJh = join(root, "parent.jh");
+    const metaFile = join(root, "config_scope.log");
+    writeFileSync(
+      childJh,
+      [
+        'config {',
+        '  agent.default_model = "child-module-model"',
+        "}",
+        'script log_model = `printf \'%s:%s\\n\' "$1" "$JAIPH_AGENT_MODEL" >> "$JAIPH_META_SCOPE_FILE"`',
+        "workflow show() {",
+        '  config {',
+        '    agent.default_model = "child-workflow-model"',
+        "  }",
+        '  run log_model("child")',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    writeFileSync(
+      parentJh,
+      [
+        'import "child.jh" as child',
+        "",
+        'config {',
+        '  agent.default_model = "model-a"',
+        "}",
+        "workflow default() {",
+        "  run child.show()",
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const scriptsDir = join(root, "scripts");
+    mkdirSync(scriptsDir, { recursive: true });
+    writeFileSync(
+      join(scriptsDir, "log_model"),
+      [
+        "#!/usr/bin/env bash",
+        'printf \'%s:%s\n\' "$1" "$JAIPH_AGENT_MODEL" >> "$JAIPH_META_SCOPE_FILE"',
+        "",
+      ].join("\n"),
+      { mode: 0o755 },
+    );
+
+    const graph = buildRuntimeGraph(parentJh);
+    const env: NodeJS.ProcessEnv = {
+      ...process.env,
+      JAIPH_TEST_MODE: "1",
+      JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+      JAIPH_SCRIPTS: scriptsDir,
+      JAIPH_META_SCOPE_FILE: metaFile,
+    };
+    delete env.JAIPH_AGENT_MODEL;
+    delete env.JAIPH_AGENT_MODEL_LOCKED;
+
+    const runtime = new NodeWorkflowRuntime(graph, { env, cwd: root, suppressLiveEvents: true });
+    const status = await runtime.runDefault([]);
+    assert.equal(status, 0);
+
+    const actual = readFileSync(metaFile, "utf8");
+    assert.equal(actual, "child:child-workflow-model\n");
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("NodeWorkflowRuntime: nested cross-module run honors locked JAIPH_AGENT_MODEL over callee config", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-node-meta-nested-locked-"));
+  try {
+    const childJh = join(root, "child.jh");
+    const parentJh = join(root, "parent.jh");
+    const metaFile = join(root, "config_scope.log");
+    writeFileSync(
+      childJh,
+      [
+        'config {',
+        '  agent.default_model = "model-b"',
+        "}",
+        'script log_model = `printf \'%s:%s\\n\' "$1" "$JAIPH_AGENT_MODEL" >> "$JAIPH_META_SCOPE_FILE"`',
+        "workflow show() {",
+        '  config {',
+        '    agent.default_model = "child-workflow-model"',
+        "  }",
+        '  run log_model("child")',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    writeFileSync(
+      parentJh,
+      [
+        'import "child.jh" as child',
+        "",
+        'config {',
+        '  agent.default_model = "model-a"',
+        "}",
+        "workflow default() {",
+        "  run child.show()",
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const scriptsDir = join(root, "scripts");
+    mkdirSync(scriptsDir, { recursive: true });
+    writeFileSync(
+      join(scriptsDir, "log_model"),
+      [
+        "#!/usr/bin/env bash",
+        'printf \'%s:%s\n\' "$1" "$JAIPH_AGENT_MODEL" >> "$JAIPH_META_SCOPE_FILE"',
+        "",
+      ].join("\n"),
+      { mode: 0o755 },
+    );
+
+    const graph = buildRuntimeGraph(parentJh);
+    const env: NodeJS.ProcessEnv = {
+      ...process.env,
+      JAIPH_TEST_MODE: "1",
+      JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+      JAIPH_SCRIPTS: scriptsDir,
+      JAIPH_META_SCOPE_FILE: metaFile,
+      JAIPH_AGENT_MODEL: "env-model",
+      JAIPH_AGENT_MODEL_LOCKED: "1",
+    };
+
+    const runtime = new NodeWorkflowRuntime(graph, { env, cwd: root, suppressLiveEvents: true });
+    const status = await runtime.runDefault([]);
+    assert.equal(status, 0);
+
+    const actual = readFileSync(metaFile, "utf8");
+    assert.equal(actual, "child:env-model\n");
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
 test("NodeWorkflowRuntime: nested cross-module preserves locked JAIPH_AGENT_BACKEND (callee config ignored)", async () => {
   const root = mkdtempSync(join(tmpdir(), "jaiph-node-meta-nested-lock-"));
   try {
@@ -724,3 +868,139 @@ test("NodeWorkflowRuntime: JAIPH_INBOX_PARALLEL has no effect on inbox dispatch
   assert.deepEqual(without, withTrue);
   assert.deepEqual(without, ["consumer_a", "consumer_b"]);
 });
+
+async function runInboxCapScenario(opts: {
+  rootPrefix: string;
+  fileName: string;
+  source: string;
+  inboxMaxDispatch?: string;
+}): Promise<{ status: number; summary: string }> {
+  const root = mkdtempSync(join(tmpdir(), opts.rootPrefix));
+  try {
+    const jh = join(root, opts.fileName);
+    writeFileSync(jh, opts.source);
+    const graph = buildRuntimeGraph(jh);
+    const env: NodeJS.ProcessEnv = {
+      ...process.env,
+      JAIPH_TEST_MODE: "1",
+      JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+    };
+    delete env.JAIPH_INBOX_MAX_DISPATCH;
+    if (opts.inboxMaxDispatch !== undefined) {
+      env.JAIPH_INBOX_MAX_DISPATCH = opts.inboxMaxDispatch;
+    }
+    const runtime = new NodeWorkflowRuntime(graph, { env, cwd: root, suppressLiveEvents: true });
+    const prevSummary = process.env.JAIPH_RUN_SUMMARY_FILE;
+    process.env.JAIPH_RUN_SUMMARY_FILE = runtime.getSummaryFile();
+    let status: number;
+    try {
+      status = await runtime.runDefault([]);
+    } finally {
+      if (prevSummary === undefined) delete process.env.JAIPH_RUN_SUMMARY_FILE;
+      else process.env.JAIPH_RUN_SUMMARY_FILE = prevSummary;
+    }
+    runtime.stopHeartbeat();
+    const summary = readFileSync(runtime.getSummaryFile(), "utf8");
+    return { status, summary };
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+}
+
+test("NodeWorkflowRuntime: circular inbox sends fail with E_INBOX_DISPATCH_LIMIT instead of hanging", async () => {
+  const { status, summary } = await runInboxCapScenario({
+    rootPrefix: "jaiph-inbox-cap-circular-",
+    fileName: "circular.jh",
+    inboxMaxDispatch: "10",
+    source: [
+      "channel ping -> on_ping",
+      "channel pong -> on_pong",
+      "",
+      "workflow on_ping(message, chan, sender) {",
+      '  pong <- "p"',
+      "}",
+      "",
+      "workflow on_pong(message, chan, sender) {",
+      '  ping <- "p"',
+      "}",
+      "",
+      "workflow default() {",
+      '  ping <- "start"',
+      "}",
+      "",
+    ].join("\n"),
+  });
+  assert.notEqual(status, 0, "circular sends must fail the workflow");
+  const failLine = summary.split("\n").find((line) => line.includes("E_INBOX_DISPATCH_LIMIT"));
+  assert.ok(failLine, `expected an E_INBOX_DISPATCH_LIMIT entry in run_summary.jsonl; got:\n${summary}`);
+  assert.match(failLine!, /drained 10 messages without quiescing/);
+  assert.match(failLine!, /channel \\"(ping|pong)\\"/);
+  assert.match(failLine!, /raise JAIPH_INBOX_MAX_DISPATCH if intentional/);
+});
+
+test("NodeWorkflowRuntime: JAIPH_INBOX_MAX_DISPATCH=5 triggers the cap after 5 messages", async () => {
+  const { status, summary } = await runInboxCapScenario({
+    rootPrefix: "jaiph-inbox-cap-five-",
+    fileName: "self_loop.jh",
+    inboxMaxDispatch: "5",
+    source: [
+      "channel loop -> on_loop",
+      "",
+      "workflow on_loop(message, chan, sender) {",
+      '  loop <- "again"',
+      "}",
+      "",
+      "workflow default() {",
+      '  loop <- "start"',
+      "}",
+      "",
+    ].join("\n"),
+  });
+  assert.notEqual(status, 0, "self-loop must fail the workflow");
+  const lines = summary.split("\n").filter((line) => line.trim().length > 0);
+  const dispatchStarts = lines.filter((line) => {
+    const evt = JSON.parse(line) as { type?: string };
+    return evt.type === "INBOX_DISPATCH_START";
+  });
+  assert.equal(dispatchStarts.length, 5, "exactly 5 dispatches should occur before the cap");
+  const failLine = lines.find((line) => line.includes("E_INBOX_DISPATCH_LIMIT"));
+  assert.ok(failLine, `expected E_INBOX_DISPATCH_LIMIT in summary; got:\n${summary}`);
+  assert.match(failLine!, /drained 5 messages without quiescing/);
+  assert.match(failLine!, /channel \\"loop\\"/);
+});
+
+test("NodeWorkflowRuntime: multi-message fan-out below the cap is unaffected", async () => {
+  const { status, summary } = await runInboxCapScenario({
+    rootPrefix: "jaiph-inbox-cap-fanout-",
+    fileName: "fanout.jh",
+    inboxMaxDispatch: "5",
+    source: [
+      "channel ch -> sink_a, sink_b, sink_c",
+      "",
+      "workflow producer() {",
+      '  ch <- "m1"',
+      '  ch <- "m2"',
+      '  ch <- "m3"',
+      "}",
+      "",
+      "workflow sink_a(message, chan, sender) {",
+      '  log "a"',
+      "}",
+      "",
+      "workflow sink_b(message, chan, sender) {",
+      '  log "b"',
+      "}",
+      "",
+      "workflow sink_c(message, chan, sender) {",
+      '  log "c"',
+      "}",
+      "",
+      "workflow default() {",
+      "  run producer()",
+      "}",
+      "",
+    ].join("\n"),
+  });
+  assert.equal(status, 0, "fan-out below the cap must succeed");
+  assert.ok(!summary.includes("E_INBOX_DISPATCH_LIMIT"), "must not flag the cap below the limit");
+});
diff --git a/src/runtime/kernel/node-workflow-runtime.handle.test.ts b/src/runtime/kernel/node-workflow-runtime.handle.test.ts
new file mode 100644
index 00000000..9fca5fc7
--- /dev/null
+++ b/src/runtime/kernel/node-workflow-runtime.handle.test.ts
@@ -0,0 +1,9 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { formatInvalidAsyncHandleError } from "./node-workflow-runtime";
+
+test("formatInvalidAsyncHandleError: includes the handle id and consumption hint", () => {
+  const msg = formatInvalidAsyncHandleError("__JAIPH_HANDLE__7");
+  assert.match(msg, /invalid async handle "__JAIPH_HANDLE__7"/);
+  assert.match(msg, /was never created or was already consumed/);
+});
diff --git a/src/runtime/kernel/node-workflow-runtime.prompt-retry.test.ts b/src/runtime/kernel/node-workflow-runtime.prompt-retry.test.ts
new file mode 100644
index 00000000..1660f14a
--- /dev/null
+++ b/src/runtime/kernel/node-workflow-runtime.prompt-retry.test.ts
@@ -0,0 +1,680 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import {
+  existsSync,
+  mkdtempSync,
+  readFileSync,
+  rmSync,
+  writeFileSync,
+} from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { buildRuntimeGraph } from "./graph";
+import { NodeWorkflowRuntime } from "./node-workflow-runtime";
+
+/**
+ * Build a fake agent script (executed via JAIPH_AGENT_COMMAND, custom-command
+ * path — name != "cursor-agent" so stdout is captured raw, not parsed as
+ * stream-json) that fails the first `failTimes` calls (exit 1) and succeeds
+ * on the (failTimes+1)-th call (exit 0, writing `successPayload` to stdout).
+ * Each call appends one line to `callsLog` so tests count invocations.
+ */
+function writeFakeAgent(opts: {
+  agentPath: string;
+  counterFile: string;
+  callsLog: string;
+  failTimes: number;
+  successPayload: string;
+}): void {
+  const lines = [
+    "#!/usr/bin/env bash",
+    "set -u",
+    // Drain stdin (the prompt is piped via stdin for custom commands).
+    "cat >/dev/null 2>&1 || true",
+    `echo call >> "${opts.callsLog}"`,
+    `current=$(cat "${opts.counterFile}" 2>/dev/null || echo 0)`,
+    `if [ "$current" -lt ${opts.failTimes} ]; then`,
+    `  echo $((current + 1)) > "${opts.counterFile}"`,
+    `  echo "fake-agent: simulated transport failure (attempt $((current + 1)))" >&2`,
+    "  exit 1",
+    "fi",
+    `printf '%s' "${opts.successPayload}"`,
+    "",
+  ];
+  writeFileSync(opts.agentPath, lines.join("\n"), { mode: 0o755 });
+}
+
+function readSummaryEvents(summaryFile: string): Array<Record<string, unknown>> {
+  return readFileSync(summaryFile, "utf8")
+    .split("\n")
+    .filter(Boolean)
+    .map((line) => JSON.parse(line) as Record<string, unknown>);
+}
+
+/**
+ * Run a callback with `process.env.JAIPH_RUN_SUMMARY_FILE` bound to the
+ * runtime's summary file. Required because `appendRunSummaryLine` reads
+ * the path from process.env, not the runtime's local env copy.
+ */
+async function withSummaryEnv<T>(summaryFile: string, fn: () => Promise<T>): Promise<T> {
+  const prev = process.env.JAIPH_RUN_SUMMARY_FILE;
+  process.env.JAIPH_RUN_SUMMARY_FILE = summaryFile;
+  try {
+    return await fn();
+  } finally {
+    if (prev === undefined) delete process.env.JAIPH_RUN_SUMMARY_FILE;
+    else process.env.JAIPH_RUN_SUMMARY_FILE = prev;
+  }
+}
+
+test("prompt retry: success on attempt N+1 returns { ok: true } with successful attempt's value", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-retry-success-"));
+  try {
+    const jh = join(root, "succeeds.jh");
+    writeFileSync(
+      jh,
+      [
+        "workflow default() {",
+        '  const r = prompt "x"',
+        "  return r",
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const counterFile = join(root, "counter");
+    const callsLog = join(root, "calls.log");
+    const agent = join(root, "fake-agent");
+    writeFakeAgent({
+      agentPath: agent,
+      counterFile,
+      callsLog,
+      failTimes: 2,
+      successPayload: "all-good-output",
+    });
+
+    const graph = buildRuntimeGraph(jh);
+    const sleepCalls: number[] = [];
+    const runtime = new NodeWorkflowRuntime(graph, {
+      env: {
+        ...process.env,
+        JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+        JAIPH_AGENT_BACKEND: "cursor",
+        JAIPH_AGENT_COMMAND: agent,
+        JAIPH_WORKSPACE: root,
+      },
+      cwd: root,
+      suppressLiveEvents: true,
+      promptRetryDelays: [10, 20, 30, 40, 50],
+      sleep: async (ms) => {
+        sleepCalls.push(ms);
+      },
+    });
+    const status = await runtime.runDefault([]);
+    assert.equal(status, 0, "workflow should succeed once prompt succeeds on retry");
+
+    const returnFile = join(runtime.getRunDir(), "return_value.txt");
+    assert.ok(existsSync(returnFile), "return_value.txt should be written on success");
+    assert.equal(readFileSync(returnFile, "utf8"), "all-good-output");
+
+    const calls = readFileSync(callsLog, "utf8").split("\n").filter(Boolean);
+    assert.equal(calls.length, 3, "agent should be invoked 3 times (2 failures + 1 success)");
+    assert.deepEqual(sleepCalls, [10, 20], "two delays before the successful third attempt");
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("prompt retry: exhausting retries on default-length schedule makes exactly 6 executePrompt calls", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-retry-exhaust-"));
+  try {
+    const jh = join(root, "always_fail.jh");
+    writeFileSync(
+      jh,
+      [
+        "workflow default() {",
+        '  prompt "x"',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const counterFile = join(root, "counter");
+    const callsLog = join(root, "calls.log");
+    const agent = join(root, "fake-agent");
+    writeFakeAgent({
+      agentPath: agent,
+      counterFile,
+      callsLog,
+      failTimes: 999,
+      successPayload: "never-reached",
+    });
+
+    const graph = buildRuntimeGraph(jh);
+    const sleepCalls: number[] = [];
+    const runtime = new NodeWorkflowRuntime(graph, {
+      env: {
+        ...process.env,
+        JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+        JAIPH_AGENT_BACKEND: "cursor",
+        JAIPH_AGENT_COMMAND: agent,
+        JAIPH_WORKSPACE: root,
+      },
+      cwd: root,
+      suppressLiveEvents: true,
+      // 5 delays + 1 initial = 6 attempts total, mirroring the default schedule shape.
+      promptRetryDelays: [1, 2, 3, 4, 5],
+      sleep: async (ms) => {
+        sleepCalls.push(ms);
+      },
+    });
+    const status = await runtime.runDefault([]);
+    assert.equal(status, 1, "workflow should fail after retries exhausted");
+
+    const calls = readFileSync(callsLog, "utf8").split("\n").filter(Boolean);
+    assert.equal(calls.length, 6, "exactly 6 total executePrompt calls (1 + 5 retries)");
+    assert.deepEqual(sleepCalls, [1, 2, 3, 4, 5], "delays requested between attempts equal the schedule");
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("prompt retry: default schedule values are passed to sleep in order", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-retry-default-schedule-"));
+  try {
+    const jh = join(root, "always_fail.jh");
+    writeFileSync(
+      jh,
+      [
+        "workflow default() {",
+        '  prompt "x"',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const counterFile = join(root, "counter");
+    const callsLog = join(root, "calls.log");
+    const agent = join(root, "fake-agent");
+    writeFakeAgent({
+      agentPath: agent,
+      counterFile,
+      callsLog,
+      failTimes: 999,
+      successPayload: "n/a",
+    });
+
+    const graph = buildRuntimeGraph(jh);
+    const sleepCalls: number[] = [];
+    const runtime = new NodeWorkflowRuntime(graph, {
+      env: {
+        ...process.env,
+        JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+        JAIPH_AGENT_BACKEND: "cursor",
+        JAIPH_AGENT_COMMAND: agent,
+        JAIPH_WORKSPACE: root,
+      },
+      cwd: root,
+      suppressLiveEvents: true,
+      // No promptRetryDelays override → default schedule applies.
+      sleep: async (ms) => {
+        sleepCalls.push(ms);
+      },
+    });
+    const status = await runtime.runDefault([]);
+    assert.equal(status, 1);
+    assert.deepEqual(
+      sleepCalls,
+      [15_000, 60_000, 600_000, 1_800_000, 7_200_000],
+      "sleep called with the exact default schedule in order",
+    );
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("prompt retry: enclosing run+catch fires after retries are exhausted (compose-below-recover)", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-retry-catch-"));
+  try {
+    const jh = join(root, "with_catch.jh");
+    // Nest the prompt inside a callee workflow so we can attach `catch` at
+    // the calling `run` site (the parser rejects `prompt` inside rules).
+    writeFileSync(
+      jh,
+      [
+        "workflow inner() {",
+        '  prompt "x"',
+        "}",
+        "",
+        "workflow default() {",
+        "  run inner() catch (failure) {",
+        '    return "recovered"',
+        "  }",
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const counterFile = join(root, "counter");
+    const callsLog = join(root, "calls.log");
+    const agent = join(root, "fake-agent");
+    writeFakeAgent({
+      agentPath: agent,
+      counterFile,
+      callsLog,
+      failTimes: 999,
+      successPayload: "n/a",
+    });
+
+    const graph = buildRuntimeGraph(jh);
+    const sleepCalls: number[] = [];
+    const runtime = new NodeWorkflowRuntime(graph, {
+      env: {
+        ...process.env,
+        JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+        JAIPH_AGENT_BACKEND: "cursor",
+        JAIPH_AGENT_COMMAND: agent,
+        JAIPH_WORKSPACE: root,
+      },
+      cwd: root,
+      suppressLiveEvents: true,
+      promptRetryDelays: [1, 2],
+      sleep: async (ms) => {
+        sleepCalls.push(ms);
+      },
+    });
+    const status = await runtime.runDefault([]);
+    assert.equal(status, 0, "catch branch should recover and the workflow should succeed");
+
+    const calls = readFileSync(callsLog, "utf8").split("\n").filter(Boolean);
+    assert.equal(calls.length, 3, "retries are exhausted (3 attempts) before catch fires");
+    assert.deepEqual(sleepCalls, [1, 2]);
+
+    const returnFile = join(runtime.getRunDir(), "return_value.txt");
+    assert.ok(existsSync(returnFile));
+    assert.equal(readFileSync(returnFile, "utf8"), "recovered");
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("prompt retry: invalid JSON from prompt with returns schema is NOT retried", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-retry-bad-json-"));
+  try {
+    const jh = join(root, "schema.jh");
+    writeFileSync(
+      jh,
+      [
+        "workflow default() {",
+        '  const r = prompt "x" returns "{ verdict: string }"',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const counterFile = join(root, "counter");
+    const callsLog = join(root, "calls.log");
+    const agent = join(root, "fake-agent");
+    // Agent succeeds (exit 0) but emits non-JSON output, so post-processing fails.
+    writeFakeAgent({
+      agentPath: agent,
+      counterFile,
+      callsLog,
+      failTimes: 0,
+      successPayload: "this is not JSON",
+    });
+
+    const graph = buildRuntimeGraph(jh);
+    const sleepCalls: number[] = [];
+    const runtime = new NodeWorkflowRuntime(graph, {
+      env: {
+        ...process.env,
+        JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+        JAIPH_AGENT_BACKEND: "cursor",
+        JAIPH_AGENT_COMMAND: agent,
+        JAIPH_WORKSPACE: root,
+      },
+      cwd: root,
+      suppressLiveEvents: true,
+      promptRetryDelays: [10, 20, 30],
+      sleep: async (ms) => {
+        sleepCalls.push(ms);
+      },
+    });
+    const status = await runtime.runDefault([]);
+    assert.equal(status, 1, "invalid JSON should fail the step");
+
+    const calls = readFileSync(callsLog, "utf8").split("\n").filter(Boolean);
+    assert.equal(calls.length, 1, "schema/JSON failures must not trigger retry");
+    assert.deepEqual(sleepCalls, [], "sleep must not be called for deterministic post-processing failures");
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("prompt retry: every failed attempt and the final termination emit LOGERR with attempt info", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-retry-logerr-"));
+  try {
+    const jh = join(root, "always_fail.jh");
+    writeFileSync(
+      jh,
+      [
+        "workflow default() {",
+        '  prompt "x"',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const counterFile = join(root, "counter");
+    const callsLog = join(root, "calls.log");
+    const agent = join(root, "fake-agent");
+    writeFakeAgent({
+      agentPath: agent,
+      counterFile,
+      callsLog,
+      failTimes: 999,
+      successPayload: "n/a",
+    });
+
+    const graph = buildRuntimeGraph(jh);
+    const runtime = new NodeWorkflowRuntime(graph, {
+      env: {
+        ...process.env,
+        JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+        JAIPH_AGENT_BACKEND: "cursor",
+        JAIPH_AGENT_COMMAND: agent,
+        JAIPH_WORKSPACE: root,
+      },
+      cwd: root,
+      suppressLiveEvents: true,
+      promptRetryDelays: [10, 20],
+      sleep: async () => {},
+    });
+    const status = await withSummaryEnv(runtime.getSummaryFile(), () => runtime.runDefault([]));
+    assert.equal(status, 1);
+
+    const events = readSummaryEvents(runtime.getSummaryFile());
+    const logerrs = events.filter((e) => e.type === "LOGERR").map((e) => String(e.message));
+    // Three failed attempts: attempt 1 with retry-in-10ms, attempt 2 with retry-in-20ms,
+    // attempt 3 with retries-exhausted termination.
+    assert.equal(logerrs.length, 3, `expected 3 LOGERR entries, got ${logerrs.length}: ${logerrs.join(" | ")}`);
+    assert.match(logerrs[0]!, /prompt attempt 1\/3 failed/);
+    assert.match(logerrs[0]!, /retrying in 10ms/);
+    assert.match(logerrs[1]!, /prompt attempt 2\/3 failed/);
+    assert.match(logerrs[1]!, /retrying in 20ms/);
+    assert.match(logerrs[2]!, /prompt attempt 3\/3 failed/);
+    assert.match(logerrs[2]!, /retries exhausted/);
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("prompt retry: LOGERR is emitted even when no recover/catch is present", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-retry-logerr-no-catch-"));
+  try {
+    const jh = join(root, "always_fail.jh");
+    writeFileSync(
+      jh,
+      [
+        "workflow default() {",
+        '  prompt "x"',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const counterFile = join(root, "counter");
+    const callsLog = join(root, "calls.log");
+    const agent = join(root, "fake-agent");
+    writeFakeAgent({
+      agentPath: agent,
+      counterFile,
+      callsLog,
+      failTimes: 999,
+      successPayload: "n/a",
+    });
+
+    const graph = buildRuntimeGraph(jh);
+    const runtime = new NodeWorkflowRuntime(graph, {
+      env: {
+        ...process.env,
+        JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+        JAIPH_AGENT_BACKEND: "cursor",
+        JAIPH_AGENT_COMMAND: agent,
+        JAIPH_WORKSPACE: root,
+      },
+      cwd: root,
+      suppressLiveEvents: true,
+      promptRetryDelays: [1],
+      sleep: async () => {},
+    });
+    await withSummaryEnv(runtime.getSummaryFile(), () => runtime.runDefault([]));
+    const events = readSummaryEvents(runtime.getSummaryFile());
+    const logerrs = events.filter((e) => e.type === "LOGERR");
+    assert.ok(logerrs.length >= 1, "at least one LOGERR even without recover/catch");
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("prompt retry: JAIPH_PROMPT_RETRY=0 disables retry — 1 attempt, sleep never called", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-retry-disabled-"));
+  try {
+    const jh = join(root, "always_fail.jh");
+    writeFileSync(
+      jh,
+      [
+        "workflow default() {",
+        '  prompt "x"',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const counterFile = join(root, "counter");
+    const callsLog = join(root, "calls.log");
+    const agent = join(root, "fake-agent");
+    writeFakeAgent({
+      agentPath: agent,
+      counterFile,
+      callsLog,
+      failTimes: 999,
+      successPayload: "n/a",
+    });
+
+    const graph = buildRuntimeGraph(jh);
+    const sleepCalls: number[] = [];
+    const runtime = new NodeWorkflowRuntime(graph, {
+      env: {
+        ...process.env,
+        JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+        JAIPH_AGENT_BACKEND: "cursor",
+        JAIPH_AGENT_COMMAND: agent,
+        JAIPH_WORKSPACE: root,
+        JAIPH_PROMPT_RETRY: "0",
+      },
+      cwd: root,
+      suppressLiveEvents: true,
+      // No constructor override → env is consulted.
+      sleep: async (ms) => {
+        sleepCalls.push(ms);
+      },
+    });
+    const status = await runtime.runDefault([]);
+    assert.equal(status, 1);
+    const calls = readFileSync(callsLog, "utf8").split("\n").filter(Boolean);
+    assert.equal(calls.length, 1, "exactly 1 attempt with retries disabled");
+    assert.deepEqual(sleepCalls, [], "sleep must not be called with retries disabled");
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("prompt retry: JAIPH_PROMPT_RETRY_DELAYS overrides the default schedule", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-retry-env-override-"));
+  try {
+    const jh = join(root, "always_fail.jh");
+    writeFileSync(
+      jh,
+      [
+        "workflow default() {",
+        '  prompt "x"',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const counterFile = join(root, "counter");
+    const callsLog = join(root, "calls.log");
+    const agent = join(root, "fake-agent");
+    writeFakeAgent({
+      agentPath: agent,
+      counterFile,
+      callsLog,
+      failTimes: 999,
+      successPayload: "n/a",
+    });
+
+    const graph = buildRuntimeGraph(jh);
+    const sleepCalls: number[] = [];
+    const runtime = new NodeWorkflowRuntime(graph, {
+      env: {
+        ...process.env,
+        JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+        JAIPH_AGENT_BACKEND: "cursor",
+        JAIPH_AGENT_COMMAND: agent,
+        JAIPH_WORKSPACE: root,
+        JAIPH_PROMPT_RETRY_DELAYS: "7,8,9",
+      },
+      cwd: root,
+      suppressLiveEvents: true,
+      sleep: async (ms) => {
+        sleepCalls.push(ms);
+      },
+    });
+    const status = await runtime.runDefault([]);
+    assert.equal(status, 1);
+    const calls = readFileSync(callsLog, "utf8").split("\n").filter(Boolean);
+    assert.equal(calls.length, 4, "1 initial + 3 retries");
+    assert.deepEqual(sleepCalls, [7, 8, 9]);
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("prompt retry: invalid JAIPH_PROMPT_RETRY_DELAYS errors clearly without silent fallback", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-retry-bad-env-"));
+  try {
+    const jh = join(root, "always_fail.jh");
+    writeFileSync(
+      jh,
+      [
+        "workflow default() {",
+        '  prompt "x"',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const counterFile = join(root, "counter");
+    const callsLog = join(root, "calls.log");
+    const agent = join(root, "fake-agent");
+    writeFakeAgent({
+      agentPath: agent,
+      counterFile,
+      callsLog,
+      failTimes: 999,
+      successPayload: "n/a",
+    });
+
+    const graph = buildRuntimeGraph(jh);
+    const sleepCalls: number[] = [];
+    const runtime = new NodeWorkflowRuntime(graph, {
+      env: {
+        ...process.env,
+        JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+        JAIPH_AGENT_BACKEND: "cursor",
+        JAIPH_AGENT_COMMAND: agent,
+        JAIPH_WORKSPACE: root,
+        JAIPH_PROMPT_RETRY_DELAYS: "10,oops,30",
+      },
+      cwd: root,
+      suppressLiveEvents: true,
+      sleep: async (ms) => {
+        sleepCalls.push(ms);
+      },
+    });
+    const status = await withSummaryEnv(runtime.getSummaryFile(), () => runtime.runDefault([]));
+    assert.equal(status, 1, "workflow should fail with invalid config");
+    // Step fails before executePrompt is called.
+    const calls = existsSync(callsLog) ? readFileSync(callsLog, "utf8").split("\n").filter(Boolean) : [];
+    assert.equal(calls.length, 0, "executePrompt should not run when retry config is invalid");
+    assert.deepEqual(sleepCalls, []);
+    const summary = readFileSync(runtime.getSummaryFile(), "utf8");
+    assert.match(summary, /prompt retry config invalid/);
+    assert.match(summary, /JAIPH_PROMPT_RETRY_DELAYS contains invalid entry [^a-z]*oops/);
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+test("prompt retry: abort during backoff sleep halts further executePrompt calls", async () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-retry-abort-"));
+  try {
+    const jh = join(root, "always_fail.jh");
+    writeFileSync(
+      jh,
+      [
+        "workflow default() {",
+        '  prompt "x"',
+        "}",
+        "",
+      ].join("\n"),
+    );
+    const counterFile = join(root, "counter");
+    const callsLog = join(root, "calls.log");
+    const agent = join(root, "fake-agent");
+    writeFakeAgent({
+      agentPath: agent,
+      counterFile,
+      callsLog,
+      failTimes: 999,
+      successPayload: "n/a",
+    });
+
+    const graph = buildRuntimeGraph(jh);
+    const sleepCalls: number[] = [];
+    let runtime: NodeWorkflowRuntime;
+    const sleep = (ms: number, signal: AbortSignal): Promise<void> => {
+      sleepCalls.push(ms);
+      // Simulate an in-progress wait that observes the runtime's AbortSignal.
+      // The retry loop should reject this promise the moment abort() fires.
+      return new Promise<void>((resolve, reject) => {
+        if (signal.aborted) {
+          reject(new Error("aborted-by-test"));
+          return;
+        }
+        const onAbort = (): void => {
+          signal.removeEventListener("abort", onAbort);
+          reject(new Error("aborted-by-test"));
+        };
+        signal.addEventListener("abort", onAbort, { once: true });
+        // Trigger the actual abort from inside the sleep so the loop is
+        // genuinely awaiting when it fires.
+        setImmediate(() => runtime.abort());
+      });
+    };
+    runtime = new NodeWorkflowRuntime(graph, {
+      env: {
+        ...process.env,
+        JAIPH_RUNS_DIR: join(root, ".jaiph", "runs"),
+        JAIPH_AGENT_BACKEND: "cursor",
+        JAIPH_AGENT_COMMAND: agent,
+        JAIPH_WORKSPACE: root,
+      },
+      cwd: root,
+      suppressLiveEvents: true,
+      promptRetryDelays: [10, 20, 30, 40, 50],
+      sleep,
+    });
+    const status = await runtime.runDefault([]);
+    assert.equal(status, 1);
+    const calls = readFileSync(callsLog, "utf8").split("\n").filter(Boolean);
+    assert.equal(calls.length, 1, "after abort fires during the first backoff, no second attempt should run");
+    assert.equal(sleepCalls.length, 1, "only the first sleep is requested before abort kicks in");
+    assert.ok(runtime.isAborted(), "runtime.isAborted() should be true after abort()");
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
diff --git a/src/runtime/kernel/node-workflow-runtime.ts b/src/runtime/kernel/node-workflow-runtime.ts
index d6c91545..c2012aa6 100644
--- a/src/runtime/kernel/node-workflow-runtime.ts
+++ b/src/runtime/kernel/node-workflow-runtime.ts
@@ -5,17 +5,15 @@ import { PassThrough } from "node:stream";
 import { randomUUID } from "node:crypto";
 import { AsyncLocalStorage } from "node:async_hooks";
 import { inlineScriptName } from "../../inline-script-name";
-import type { MatchExprDef, WorkflowStepDef } from "../../types";
+import { argsToRuntimeString } from "../../parse/core";
+import type { CatchBody, Expr, MatchExprDef, WorkflowStepDef } from "../../types";
 import { executePrompt, resolveConfig, resolveModel, resolvePromptStepName } from "./prompt";
 import { appendRunSummaryLine } from "./emit";
 import { buildStepDisplayParamPairs } from "../../cli/commands/format-params.js";
 import { resolveRuleRef, resolveScriptRef, resolveWorkflowRef, type RuntimeGraph } from "./graph";
 import type { WorkflowMetadata } from "../../types";
 import { extractJson, validateFields } from "./schema";
-import {
-  plainMultilineOrchestrationForRuntime,
-  tripleQuotedRawForRuntime,
-} from "../orchestration-text";
+import { canonicalizeTripleQuotedString } from "../../parse/triple-quote";
 import {
   commaArgsToInterpolated,
   interpolate,
@@ -32,13 +30,33 @@ import {
 import { RuntimeEventEmitter, type Frame } from "./runtime-event-emitter";
 import { executeMockBodyDef, type MockBodyDef, type StepResult } from "./runtime-mock";
 import { linesOfDelimitedString } from "../string-lines";
+import {
+  defaultPromptSleep,
+  formatRetryDelay,
+  isPromptRetryAbortError,
+  resolvePromptRetryDelays,
+  summarizeError,
+} from "./prompt-retry";
 
 export type { MockBodyDef } from "./runtime-mock";
 
-type EnsureRecover = Extract<WorkflowStepDef, { type: "ensure" }>["catch"];
-
 const HANDLE_PREFIX = "__JAIPH_HANDLE__";
 
+export function formatInvalidAsyncHandleError(handleId: string): string {
+  return `invalid async handle "${handleId}" — the handle was never created or was already consumed`;
+}
+
+const DEFAULT_INBOX_DISPATCH_LIMIT = 1000;
+
+function resolveInboxDispatchLimit(env: NodeJS.ProcessEnv): number {
+  const raw = env.JAIPH_INBOX_MAX_DISPATCH;
+  if (raw === undefined || raw === "") return DEFAULT_INBOX_DISPATCH_LIMIT;
+  if (!/^[0-9]+$/.test(raw)) return DEFAULT_INBOX_DISPATCH_LIMIT;
+  const n = Number.parseInt(raw, 10);
+  if (!Number.isFinite(n) || n <= 0) return DEFAULT_INBOX_DISPATCH_LIMIT;
+  return n;
+}
+
 type AsyncHandle = {
   ref: string;
   promise: Promise<StepResult>;
@@ -69,6 +87,7 @@ type WorkflowContext = {
   workflowName: string;
   routes: Map<string, string[]>;
   queue: InboxMsg[];
+  workflowMeta?: WorkflowMetadata;
 };
 
 export class NodeWorkflowRuntime {
@@ -88,6 +107,17 @@ export class NodeWorkflowRuntime {
   private readonly mockBodies: Map<string, MockBodyDef>;
   private handleRegistry = new Map<string, AsyncHandle>();
   private handleIdCounter = 0;
+  private readonly abortController = new AbortController();
+  private readonly sleep: (ms: number, signal: AbortSignal) => Promise<void>;
+  /**
+   * Retry schedule for transport-failure backoff in `runPromptStep`. Resolved
+   * lazily from constructor opt or env on first prompt; cached thereafter so
+   * the same workflow run uses a single (validated) schedule and a parse
+   * failure does not get re-thrown per attempt.
+   */
+  private cachedPromptRetryDelays: number[] | undefined;
+  private cachedPromptRetryError: Error | undefined;
+  private readonly promptRetryDelaysOverride: readonly number[] | undefined;
 
   private getFrameStack(): Frame[] {
     return this.asyncFrameStack.getStore() ?? this.stack;
@@ -111,7 +141,9 @@ export class NodeWorkflowRuntime {
   /** Resolve a handle to its StepResult. Caches the result for subsequent reads. */
   private async resolveHandleResult(handleId: string): Promise<StepResult> {
     const handle = this.handleRegistry.get(handleId);
-    if (!handle) return { status: 1, output: "", error: "invalid handle" };
+    if (!handle) {
+      return { status: 1, output: "", error: formatInvalidAsyncHandleError(handleId) };
+    }
     if (handle.resolved) return handle.resolved;
     const result = await handle.promise;
     handle.resolved = result;
@@ -131,6 +163,37 @@ export class NodeWorkflowRuntime {
     return result;
   }
 
+  /**
+   * Resolve an `if` / `match` subject to its value. Accepts plain identifiers
+   * (`status`) and `IDENT.IDENT` dot subjects (`r.verdict`) — the latter
+   * parses JSON from the base variable and extracts the field, mirroring
+   * `${var.field}` interpolation semantics.
+   */
+  private async resolveSubjectValue(
+    scope: Scope,
+    subject: string,
+  ): Promise<{ ok: true; value: string } | { ok: false; result: StepResult }> {
+    const dotIdx = subject.indexOf(".");
+    const base = dotIdx === -1 ? subject : subject.slice(0, dotIdx);
+    const rawBase = scope.vars.get(base);
+    if (rawBase && this.isHandle(rawBase)) {
+      const hr = await this.resolveHandleVar(scope, base);
+      if (hr.status !== 0) return { ok: false, result: hr };
+    }
+    const baseVal = scope.vars.get(base) ?? scope.env?.[base] ?? "";
+    if (dotIdx === -1) return { ok: true, value: baseVal };
+    const field = subject.slice(dotIdx + 1);
+    try {
+      const obj = JSON.parse(baseVal);
+      if (obj != null && typeof obj === "object" && field in obj) {
+        return { ok: true, value: String((obj as Record<string, unknown>)[field]) };
+      }
+    } catch {
+      // fall through to empty
+    }
+    return { ok: true, value: "" };
+  }
+
   /** Scan input for ${var} references and resolve any that are handles. */
   private async resolveHandlesInInput(scope: Scope, input: string): Promise<StepResult | null> {
     const re = /\$\{([a-zA-Z_][a-zA-Z0-9_]*)/g;
@@ -159,12 +222,27 @@ export class NodeWorkflowRuntime {
        * with `node --test` reporter output.
        */
       suppressLiveEvents?: boolean;
+      /**
+       * Injectable backoff sleep. Tests pass a stub to record requested delays
+       * and resolve immediately; production uses `defaultPromptSleep` which
+       * races setTimeout against the runtime's AbortSignal.
+       */
+      sleep?: (ms: number, signal: AbortSignal) => Promise<void>;
+      /**
+       * Override the prompt-retry delay schedule. When set, takes precedence
+       * over `JAIPH_PROMPT_RETRY` / `JAIPH_PROMPT_RETRY_DELAYS`. Empty array
+       * disables retries (1 attempt total). Used by tests to assert the full
+       * sequence with zero real wall-clock wait.
+       */
+      promptRetryDelays?: readonly number[];
     },
   ) {
     this.graph = graph;
     this.env = opts.env ?? process.env;
     this.cwd = opts.cwd ?? process.cwd();
     this.mockBodies = opts.mockBodies ?? new Map();
+    this.sleep = opts.sleep ?? defaultPromptSleep;
+    this.promptRetryDelaysOverride = opts.promptRetryDelays;
     this.runId = this.env.JAIPH_RUN_ID || randomUUID();
     const source = this.env.JAIPH_SOURCE_FILE ?? basename(graph.entryFile);
     const date = new Date();
@@ -192,6 +270,45 @@ export class NodeWorkflowRuntime {
     this.startHeartbeat();
   }
 
+  /**
+   * Signal cooperative cancellation. Aborts any in-flight prompt-retry sleep
+   * so the retry loop exits without further `executePrompt` calls. Exposed
+   * for in-process hosts and tests; the runner process itself terminates on
+   * SIGINT/SIGTERM by Node default, which is sufficient for the CLI path.
+   */
+  abort(): void {
+    this.abortController.abort();
+  }
+
+  isAborted(): boolean {
+    return this.abortController.signal.aborted;
+  }
+
+  /**
+   * Resolve and cache the prompt-retry delay schedule (constructor override
+   * wins over env). On invalid env parse the error is cached and re-returned
+   * so every prompt in the same run surfaces the same misconfiguration.
+   */
+  private getPromptRetryDelays(): { ok: true; delays: number[] } | { ok: false; error: string } {
+    if (this.cachedPromptRetryError) {
+      return { ok: false, error: this.cachedPromptRetryError.message };
+    }
+    if (this.cachedPromptRetryDelays !== undefined) {
+      return { ok: true, delays: this.cachedPromptRetryDelays };
+    }
+    if (this.promptRetryDelaysOverride !== undefined) {
+      this.cachedPromptRetryDelays = [...this.promptRetryDelaysOverride];
+      return { ok: true, delays: this.cachedPromptRetryDelays };
+    }
+    try {
+      this.cachedPromptRetryDelays = resolvePromptRetryDelays(this.env);
+      return { ok: true, delays: this.cachedPromptRetryDelays };
+    } catch (err) {
+      this.cachedPromptRetryError = err instanceof Error ? err : new Error(String(err));
+      return { ok: false, error: this.cachedPromptRetryError.message };
+    }
+  }
+
   getRunDir(): string {
     return this.runDir;
   }
@@ -309,13 +426,19 @@ export class NodeWorkflowRuntime {
     const crossModuleNested = callerModulePath !== calleeModulePath;
     return this.executeManagedStep("workflow", `${workflowName}`, args, async (io) => {
       // Root entry (`runDefault`, inheritCallerMetadataScope=false): apply entry module + workflow metadata.
-      // Nested cross-module (`run` / inbox to another module): caller env (locks + effective scope)
-      // is authoritative — do not layer callee module or callee workflow metadata.
-      // Same-module nested `run` (inheritCallerMetadataScope=true, !crossModuleNested): apply callee
-      // workflow-level config on top of caller env (workflow boundaries still apply within one module).
+      // Nested cross-module `run`: layer callee module + workflow metadata on top of the caller's
+      // effective env (same mechanics as root entry, respecting `${NAME}_LOCKED`).  A module's
+      // config describes how that module's workflows run, regardless of who called them; this
+      // also matches cross-module `ensure` (see `executeRule`).
+      // Same-module nested `run`: apply only the callee workflow-level metadata (workflow boundaries
+      // still apply within one module; module config is already in the caller's effective env).
       let workflowEnv: NodeJS.ProcessEnv;
       if (inheritCallerMetadataScope && crossModuleNested) {
-        workflowEnv = { ...scope.env };
+        workflowEnv = this.applyMetadataScope(
+          scope.env,
+          this.graph.modules.get(resolved.filePath)?.ast.metadata,
+          resolved.workflow.metadata,
+        );
       } else if (inheritCallerMetadataScope) {
         workflowEnv = this.applyMetadataScope(scope.env, undefined, resolved.workflow.metadata);
       } else {
@@ -338,6 +461,7 @@ export class NodeWorkflowRuntime {
         workflowName,
         routes: new Map(),
         queue: [],
+        workflowMeta: resolved.workflow.metadata,
       };
       // Build route map from channel-level route declarations in the module.
       // Only register on the entry workflow (not nested calls) so that sends from
@@ -447,14 +571,9 @@ export class NodeWorkflowRuntime {
     scope: Scope,
     expr: MatchExprDef,
   ): Promise<{ ok: true; value: string } | { ok: false; result: StepResult }> {
-    // Resolve handle if the subject variable is a handle.
-    const rawSubject = scope.vars.get(expr.subject);
-    if (rawSubject && this.isHandle(rawSubject)) {
-      const hr = await this.resolveHandleVar(scope, expr.subject);
-      if (hr.status !== 0) return { ok: false, result: hr };
-    }
-    // Subject is a bare identifier — resolve against scope variables
-    const subject = scope.vars.get(expr.subject) ?? scope.env?.[expr.subject] ?? "";
+    const resolved = await this.resolveSubjectValue(scope, expr.subject);
+    if (!resolved.ok) return { ok: false, result: resolved.result };
+    const subject = resolved.value;
     for (const arm of expr.arms) {
       let matched = false;
       if (arm.pattern.kind === "wildcard") {
@@ -467,7 +586,7 @@ export class NodeWorkflowRuntime {
       if (matched) {
         let body = arm.body.trimStart();
         if (arm.tripleQuotedBody) {
-          body = tripleQuotedRawForRuntime(arm.body).trimStart();
+          body = canonicalizeTripleQuotedString(arm.body).trimStart();
         }
 
         // fail "message" — abort with failure
@@ -511,6 +630,72 @@ export class NodeWorkflowRuntime {
     return { ok: false, result: { status: 1, output: "", error: "match: no arm matched" } };
   }
 
+  /**
+   * Evaluate an `Expr` to its string value, executing any managed call
+   * (call/ensure_call/inline_script/match/prompt) and returning its captured
+   * result. Used by `const` / `return` / `send` / `say` step handlers so they
+   * don't each duplicate the dispatch table.
+   *
+   * `promptCaptureName` lets callers route prompt-side effects (e.g. schema
+   * field exports) into a scope binding; pass `undefined` for non-capture
+   * positions.
+   */
+  private async evaluateExpr(
+    scope: Scope,
+    expr: Expr,
+    promptCaptureName: string | undefined,
+    io: StepIO | undefined,
+  ): Promise<{ ok: true; value: string; output: string } | { ok: false; result: StepResult; output: string }> {
+    if (expr.kind === "literal") {
+      const ir = await this.interpolateWithCaptures(expr.raw, scope);
+      if (!ir.ok) return { ok: false, result: ir.result, output: "" };
+      return { ok: true, value: ir.value, output: "" };
+    }
+    if (expr.kind === "call") {
+      const r = await this.executeRunRef(scope, expr.callee.value, argsToRuntimeString(expr.args));
+      if (r.status !== 0) return { ok: false, result: r, output: "" };
+      return { ok: true, value: r.returnValue ?? r.output.trim(), output: "" };
+    }
+    if (expr.kind === "ensure_call") {
+      const r = await this.executeEnsureRef(scope, expr.callee.value, argsToRuntimeString(expr.args), undefined);
+      if (r.status !== 0) return { ok: false, result: r, output: "" };
+      return { ok: true, value: r.returnValue ?? r.output.trim(), output: "" };
+    }
+    if (expr.kind === "inline_script") {
+      const shebang = expr.lang ? `#!/usr/bin/env ${expr.lang}` : undefined;
+      const r = await this.executeInlineScript(scope, expr.body, shebang, argsToRuntimeString(expr.args));
+      if (r.status !== 0) return { ok: false, result: r, output: "" };
+      return { ok: true, value: r.returnValue ?? r.output.trim(), output: "" };
+    }
+    if (expr.kind === "match") {
+      const mr = await this.evaluateMatch(scope, expr.match);
+      if (!mr.ok) return { ok: false, result: mr.result, output: "" };
+      return { ok: true, value: mr.value, output: "" };
+    }
+    if (expr.kind === "prompt") {
+      if (expr.returns !== undefined && !promptCaptureName) {
+        return {
+          ok: false,
+          result: { status: 1, output: "", error: 'prompt with "returns" schema must capture to a variable' },
+          output: "",
+        };
+      }
+      const r = await this.runPromptStep(scope, expr.raw, expr.returns, promptCaptureName, io);
+      if (!r.ok) return { ok: false, result: r.result, output: r.output };
+      // For captured prompts `runPromptStep` writes the value into scope and we
+      // return that here; non-capture prompts (no binding) yield empty string.
+      const value = promptCaptureName ? (scope.vars.get(promptCaptureName) ?? "") : "";
+      return { ok: true, value, output: r.output };
+    }
+    // shell / bare_ref should never reach the runtime — validator rejects them
+    // outside their narrow send-RHS lane (and shell-as-send is rejected too).
+    return {
+      ok: false,
+      result: { status: 1, output: "", error: `unsupported expression kind in runtime: ${expr.kind}` },
+      output: "",
+    };
+  }
+
   private async executeSteps(scope: Scope, steps: WorkflowStepDef[], io?: StepIO): Promise<StepResult> {
     let accOut = "";
     let accErr = "";
@@ -519,24 +704,34 @@ export class NodeWorkflowRuntime {
     const localHandleIds: string[] = [];
     let asyncCounter = 0;
     for (const step of steps) {
-      if (step.type === "comment" || step.type === "blank_line") continue;
-      if (step.type === "log" || step.type === "logerr") {
-        const level = step.type === "log" ? "LOG" : "LOGERR";
+      if (step.type === "trivia") continue;
+      if (step.type === "say") {
         let message: string;
-        if (step.managed?.kind === "run_inline_script") {
-          const shebang = step.managed.lang ? `#!/usr/bin/env ${step.managed.lang}` : undefined;
-          const result = await this.executeInlineScript(scope, step.managed.body, shebang, step.managed.args ?? "");
+        if (step.message.kind === "inline_script") {
+          const shebang = step.message.lang ? `#!/usr/bin/env ${step.message.lang}` : undefined;
+          const result = await this.executeInlineScript(scope, step.message.body, shebang, argsToRuntimeString(step.message.args));
           if (result.status !== 0) return this.mergeStepResult(accOut, accErr, result);
           message = result.returnValue ?? result.output.trim();
-        } else {
-          const raw = step.tripleQuoted ? plainMultilineOrchestrationForRuntime(step.message) : step.message;
-          const ir = await this.interpolateWithCaptures(raw, scope);
+        } else if (step.message.kind === "literal") {
+          const ir = await this.interpolateWithCaptures(step.message.raw, scope);
           if (!ir.ok) return this.mergeStepResult(accOut, accErr, ir.result);
-          message = ir.value;
+          message = step.level === "fail" || step.level === "logerr"
+            ? stripOuterQuotes(ir.value)
+            : ir.value;
+        } else {
+          return this.mergeStepResult(accOut, accErr, {
+            status: 1,
+            output: "",
+            error: `unsupported ${step.level} message kind: ${step.message.kind}`,
+          });
+        }
+        if (step.level === "fail") {
+          return this.mergeStepResult(accOut, accErr, { status: 1, output: "", error: message });
         }
-        this.emitter.emitLog(level, message);
+        const eventLevel = step.level === "log" ? "LOG" : "LOGERR";
+        this.emitter.emitLog(eventLevel, message);
         const chunk = `${message}\n`;
-        if (level === "LOG") {
+        if (step.level === "log") {
           accOut += chunk;
           io?.appendOut(chunk);
         } else {
@@ -545,53 +740,18 @@ export class NodeWorkflowRuntime {
         }
         continue;
       }
-      if (step.type === "fail") {
-        const failMsg = step.tripleQuoted ? tripleQuotedRawForRuntime(step.message) : step.message;
-        const failIr = await this.interpolateWithCaptures(failMsg, scope);
-        if (!failIr.ok) return this.mergeStepResult(accOut, accErr, failIr.result);
-        const message = failIr.value;
-        return this.mergeStepResult(accOut, accErr, { status: 1, output: "", error: message });
-      }
-      if (step.type === "shell") {
-        const cmdIr = await this.interpolateWithCaptures(step.command, scope);
-        if (!cmdIr.ok) return this.mergeStepResult(accOut, accErr, cmdIr.result);
-        const stepName = `sh_line_${step.loc.line}`;
-        const result = await this.executeManagedStep(
-          "script",
-          stepName,
-          [],
-          (io) => this.executeShLine(scope, cmdIr.value, io),
-        );
-        if (result.status !== 0) return this.mergeStepResult(accOut, accErr, result);
-        continue;
-      }
       if (step.type === "return") {
-        if (step.managed) {
-          if (step.managed.kind === "match") {
-            const matchResult = await this.evaluateMatch(scope, step.managed.match);
-            if (!matchResult.ok) return this.mergeStepResult(accOut, accErr, matchResult.result);
-            returnValue = matchResult.value;
-            return this.mergeStepResult(accOut, accErr, { status: 0, output: "", error: "", returnValue });
-          }
-          if (step.managed.kind === "run_inline_script") {
-            const shebang = step.managed.lang ? `#!/usr/bin/env ${step.managed.lang}` : undefined;
-            const result = await this.executeInlineScript(scope, step.managed.body, shebang, step.managed.args ?? "");
-            if (result.status !== 0) return this.mergeStepResult(accOut, accErr, result);
-            returnValue = result.returnValue ?? result.output.trim();
-            return this.mergeStepResult(accOut, accErr, { status: 0, output: "", error: "", returnValue });
-          }
-          const result = step.managed.kind === "run"
-            ? await this.executeRunRef(scope, step.managed.ref.value, step.managed.args ?? "")
-            : await this.executeEnsureRef(scope, step.managed.ref.value, step.managed.args ?? "", undefined);
-          if (result.status !== 0) return this.mergeStepResult(accOut, accErr, result);
-          returnValue = result.returnValue ?? result.output.trim();
+        const value = step.value;
+        if (value.kind === "literal") {
+          const retIr = await this.interpolateWithCaptures(value.raw, scope);
+          if (!retIr.ok) return this.mergeStepResult(accOut, accErr, retIr.result);
+          returnValue = stripOuterQuotes(retIr.value);
           return this.mergeStepResult(accOut, accErr, { status: 0, output: "", error: "", returnValue });
         }
-        // Match Bash semantics: return "$var" should return var value, not literal quotes.
-        const retRaw = step.tripleQuoted ? tripleQuotedRawForRuntime(step.value) : step.value;
-        const retIr = await this.interpolateWithCaptures(retRaw, scope);
-        if (!retIr.ok) return this.mergeStepResult(accOut, accErr, retIr.result);
-        returnValue = stripOuterQuotes(retIr.value);
+        const r = await this.evaluateExpr(scope, value, undefined, io);
+        accOut += r.output;
+        if (!r.ok) return this.mergeStepResult(accOut, accErr, r.result);
+        returnValue = r.value;
         return this.mergeStepResult(accOut, accErr, { status: 0, output: "", error: "", returnValue });
       }
       if (step.type === "send") {
@@ -604,53 +764,51 @@ export class NodeWorkflowRuntime {
           });
         }
         let payload = "";
-        if (step.rhs.kind === "literal") {
-          const sendTok =
-            step.rhs.tripleQuoted ? tripleQuotedRawForRuntime(step.rhs.token) : step.rhs.token;
-          const sendIr = await this.interpolateWithCaptures(sendTok, scope);
+        const sendValue = step.value;
+        if (sendValue.kind === "literal") {
+          const sendIr = await this.interpolateWithCaptures(sendValue.raw, scope);
           if (!sendIr.ok) return this.mergeStepResult(accOut, accErr, sendIr.result);
           payload = stripOuterQuotes(sendIr.value);
-        } else if (step.rhs.kind === "var") {
-          const sendHandleErr = await this.resolveHandlesInInput(scope, step.rhs.bash);
-          if (sendHandleErr) return this.mergeStepResult(accOut, accErr, sendHandleErr);
-          payload = interpolate(step.rhs.bash, scope.vars, scope.env);
-        } else if (step.rhs.kind === "run") {
-          const runValue = await this.executeRunRef(scope, step.rhs.ref.value, step.rhs.args ?? "");
-          if (runValue.status !== 0) return this.mergeStepResult(accOut, accErr, runValue);
-          payload = runValue.returnValue ?? runValue.output.trim();
+        } else if (sendValue.kind === "call") {
+          const r = await this.executeRunRef(scope, sendValue.callee.value, argsToRuntimeString(sendValue.args));
+          if (r.status !== 0) return this.mergeStepResult(accOut, accErr, r);
+          payload = r.returnValue ?? r.output.trim();
         } else {
           return this.mergeStepResult(accOut, accErr, {
             status: 1,
             output: "",
-            error: "unsupported send rhs in node runtime",
+            error: `unsupported send value kind: ${sendValue.kind}`,
           });
         }
         this.inboxSeq += 1;
         const seqPadded = String(this.inboxSeq).padStart(3, "0");
         const senderName = ctx.workflowName;
+        // Validator (validateChannelRef) has already proven that an `alias.name`
+        // token refers to an existing imported channel. Routes are registered
+        // under the bare channel name, so strip the alias prefix so the same
+        // key resolves regardless of how the send was spelled.
+        const dotIdx = step.channel.indexOf(".");
+        const channelKey = dotIdx >= 0 ? step.channel.slice(dotIdx + 1) : step.channel;
         const msg: InboxMsg = {
-          channel: step.channel,
+          channel: channelKey,
           content: payload,
           sender: senderName,
           seqPadded,
         };
-        // Route to the nearest ancestor context that has a route for this channel.
         let targetCtx = ctx;
         let routed = false;
         for (let i = this.workflowCtxStack.length - 1; i >= 0; i -= 1) {
-          if (this.workflowCtxStack[i]!.routes.has(step.channel)) {
+          if (this.workflowCtxStack[i]!.routes.has(channelKey)) {
             targetCtx = this.workflowCtxStack[i]!;
             routed = true;
             break;
           }
         }
         targetCtx.queue.push(msg);
-        // Persist inbox file only when a route consumes the channel — otherwise
-        // the file would be dead audit data with no corresponding dispatch.
         if (routed) {
           const inboxFileDir = join(this.runDir, "inbox");
           mkdirSync(inboxFileDir, { recursive: true });
-          writeFileSync(join(inboxFileDir, `${seqPadded}-${step.channel}.txt`), payload, "utf8");
+          writeFileSync(join(inboxFileDir, `${seqPadded}-${channelKey}.txt`), payload, "utf8");
         }
         appendRunSummaryLine(
           JSON.stringify({
@@ -665,98 +823,54 @@ export class NodeWorkflowRuntime {
         );
         continue;
       }
-      if (step.type === "prompt") {
-        if (step.returns !== undefined && !step.captureName) {
-          return this.mergeStepResult(accOut, accErr, {
-            status: 1,
-            output: "",
-            error: 'prompt with "returns" schema must capture to a variable',
-          });
-        }
-        const r = await this.runPromptStep(scope, step.raw, step.bodyKind, step.returns, step.captureName, io);
-        accOut += r.output;
-        if (!r.ok) return this.mergeStepResult(accOut, accErr, r.result);
-        continue;
-      }
       if (step.type === "const") {
-        if (step.value.kind === "expr") {
-          const exprRhs =
-            step.value.tripleQuoted ? tripleQuotedRawForRuntime(step.value.bashRhs) : step.value.bashRhs;
-          const exprIr = await this.interpolateWithCaptures(exprRhs, scope);
+        const v = step.value;
+        if (v.kind === "literal") {
+          const exprIr = await this.interpolateWithCaptures(v.raw, scope);
           if (!exprIr.ok) return this.mergeStepResult(accOut, accErr, exprIr.result);
           scope.vars.set(step.name, stripOuterQuotes(exprIr.value));
           continue;
         }
-        if (step.value.kind === "run_capture") {
-          const captureRef = step.value.ref.value;
-          const captureArgs = step.value.args ?? "";
-          if (step.value.async) {
-            // Async capture: create handle, store in scope, register for join.
-            asyncCounter += 1;
-            const branchStack = [...this.getFrameStack()];
-            const branchIndices = [...this.getAsyncIndices(), asyncCounter];
-            const promise = this.asyncFrameStack.run(branchStack, () =>
-              this.asyncIndicesStorage.run(branchIndices, () =>
-                this.executeRunRef(scope, captureRef, captureArgs),
-              ),
-            );
-            const handleId = this.createHandle(captureRef, promise);
-            localHandleIds.push(handleId);
-            scope.vars.set(step.name, handleId);
-            continue;
-          }
-          const runResult = await this.executeRunRef(scope, captureRef, captureArgs);
-          if (runResult.status !== 0) return this.mergeStepResult(accOut, accErr, runResult);
-          scope.vars.set(step.name, runResult.returnValue ?? runResult.output.trim());
-          continue;
-        }
-        if (step.value.kind === "run_inline_script_capture") {
-          const shebang = step.value.lang ? `#!/usr/bin/env ${step.value.lang}` : undefined;
-          const result = await this.executeInlineScript(scope, step.value.body, shebang, step.value.args ?? "");
-          if (result.status !== 0) return this.mergeStepResult(accOut, accErr, result);
-          scope.vars.set(step.name, result.returnValue ?? result.output.trim());
-          continue;
-        }
-        if (step.value.kind === "ensure_capture") {
-          const ensureResult = await this.executeEnsureRef(scope, step.value.ref.value, step.value.args ?? "", undefined);
-          if (ensureResult.status !== 0) return this.mergeStepResult(accOut, accErr, ensureResult);
-          scope.vars.set(step.name, ensureResult.returnValue ?? ensureResult.output.trim());
-          continue;
-        }
-        if (step.value.kind === "match_expr") {
-          const matchResult = await this.evaluateMatch(scope, step.value.match);
-          if (!matchResult.ok) return this.mergeStepResult(accOut, accErr, matchResult.result);
-          scope.vars.set(step.name, matchResult.value);
-          continue;
-        }
-        if (step.value.kind === "prompt_capture") {
-          const r = await this.runPromptStep(
-            scope,
-            step.value.raw,
-            step.value.bodyKind,
-            step.value.returns,
-            step.name,
-            io,
+        if (v.kind === "call" && v.async) {
+          asyncCounter += 1;
+          const captureRef = v.callee.value;
+          const captureArgs = argsToRuntimeString(v.args);
+          const branchStack = [...this.getFrameStack()];
+          const branchIndices = [...this.getAsyncIndices(), asyncCounter];
+          const promise = this.asyncFrameStack.run(branchStack, () =>
+            this.asyncIndicesStorage.run(branchIndices, () =>
+              this.executeRunRef(scope, captureRef, captureArgs),
+            ),
           );
-          accOut += r.output;
-          if (!r.ok) return this.mergeStepResult(accOut, accErr, r.result);
+          const handleId = this.createHandle(captureRef, promise);
+          localHandleIds.push(handleId);
+          scope.vars.set(step.name, handleId);
           continue;
         }
+        const r = await this.evaluateExpr(scope, v, step.name, io);
+        accOut += r.output;
+        if (!r.ok) return this.mergeStepResult(accOut, accErr, r.result);
+        // Prompt handlers bind via captureName side effect inside runPromptStep;
+        // all other Expr kinds bind here.
+        if (v.kind !== "prompt") {
+          scope.vars.set(step.name, r.value);
+        }
+        continue;
       }
-      if (step.type === "run") {
-        if (step.async) {
+      if (step.type === "exec") {
+        const body = step.body;
+        if (body.kind === "call" && body.async) {
           asyncCounter += 1;
           const branchStack = [...this.getFrameStack()];
           const branchIndices = [...this.getAsyncIndices(), asyncCounter];
-          const ref = step.workflow.value;
-          const argsRaw = step.args ?? "";
+          const ref = body.callee.value;
+          const argsRaw = argsToRuntimeString(body.args);
           const runInBranch = (fn: () => Promise<StepResult>): Promise<StepResult> =>
             this.asyncFrameStack.run(branchStack, () =>
               this.asyncIndicesStorage.run(branchIndices, fn),
             );
           let promise: Promise<StepResult>;
           if (step.recover) {
-            // Async + recover loop: wrap retry logic in a single promise.
             const recoverLimit = this.resolveRecoverLimit(scope.filePath);
             const recover = step.recover;
             promise = runInBranch(async () => {
@@ -771,7 +885,6 @@ export class NodeWorkflowRuntime {
               return lastResult;
             });
           } else if (step.catch) {
-            // Async + catch: single-shot recovery in the async branch.
             const recover = step.catch;
             promise = runInBranch(async () => {
               const result = await this.executeRunRef(scope, ref, argsRaw);
@@ -789,64 +902,132 @@ export class NodeWorkflowRuntime {
           if (step.captureName) scope.vars.set(step.captureName, handleId);
           continue;
         }
-        if (step.recover) {
-          const limit = this.resolveRecoverLimit(scope.filePath);
-          let lastResult = await this.executeRunRef(scope, step.workflow.value, step.args ?? "");
-          let attempt = 1;
-          while (lastResult.status !== 0 && attempt <= limit) {
-            const rr = await this.runRecoverBody(scope, step.recover, `${lastResult.output}${lastResult.error}`);
+        if (body.kind === "call") {
+          if (step.recover) {
+            const limit = this.resolveRecoverLimit(scope.filePath);
+            const ref = body.callee.value;
+            const argsRaw = argsToRuntimeString(body.args);
+            let lastResult = await this.executeRunRef(scope, ref, argsRaw);
+            let attempt = 1;
+            while (lastResult.status !== 0 && attempt <= limit) {
+              const rr = await this.runRecoverBody(scope, step.recover, `${lastResult.output}${lastResult.error}`);
+              if (rr.status !== 0 || rr.returnValue !== undefined) return this.mergeStepResult(accOut, accErr, rr);
+              lastResult = await this.executeRunRef(scope, ref, argsRaw);
+              attempt += 1;
+            }
+            if (lastResult.status === 0) {
+              if (step.captureName) {
+                scope.vars.set(step.captureName, lastResult.returnValue ?? lastResult.output.trim());
+              }
+            } else {
+              return this.mergeStepResult(accOut, accErr, lastResult);
+            }
+            continue;
+          }
+          const runResult = await this.executeRunRef(scope, body.callee.value, argsToRuntimeString(body.args));
+          if (runResult.status === 0) {
+            if (step.captureName) {
+              scope.vars.set(step.captureName, runResult.returnValue ?? runResult.output.trim());
+            }
+          } else if (step.catch) {
+            const rr = await this.runRecoverBody(scope, step.catch, `${runResult.output}${runResult.error}`);
             if (rr.status !== 0 || rr.returnValue !== undefined) return this.mergeStepResult(accOut, accErr, rr);
-            lastResult = await this.executeRunRef(scope, step.workflow.value, step.args ?? "");
-            attempt += 1;
+          } else {
+            return this.mergeStepResult(accOut, accErr, runResult);
+          }
+          continue;
+        }
+        if (body.kind === "ensure_call") {
+          const ensureResult = await this.executeEnsureRef(scope, body.callee.value, argsToRuntimeString(body.args), step.catch);
+          if (step.captureName && ensureResult.status === 0) {
+            scope.vars.set(step.captureName, ensureResult.returnValue ?? ensureResult.output.trim());
+          }
+          if (ensureResult.status !== 0) return this.mergeStepResult(accOut, accErr, ensureResult);
+          if (ensureResult.recoverReturn) return this.mergeStepResult(accOut, accErr, ensureResult);
+          continue;
+        }
+        if (body.kind === "inline_script") {
+          const shebang = body.lang ? `#!/usr/bin/env ${body.lang}` : undefined;
+          const argsRaw = argsToRuntimeString(body.args);
+          const runOnce = (): Promise<StepResult> =>
+            this.executeInlineScript(scope, body.body, shebang, argsRaw);
+          if (step.recover) {
+            const limit = this.resolveRecoverLimit(scope.filePath);
+            let lastResult = await runOnce();
+            let attempt = 1;
+            while (lastResult.status !== 0 && attempt <= limit) {
+              const rr = await this.runRecoverBody(scope, step.recover, `${lastResult.output}${lastResult.error}`);
+              if (rr.status !== 0 || rr.returnValue !== undefined) return this.mergeStepResult(accOut, accErr, rr);
+              lastResult = await runOnce();
+              attempt += 1;
+            }
+            if (lastResult.status === 0) {
+              if (step.captureName) {
+                scope.vars.set(step.captureName, lastResult.returnValue ?? lastResult.output.trim());
+              }
+            } else {
+              return this.mergeStepResult(accOut, accErr, lastResult);
+            }
+            continue;
           }
-          if (lastResult.status === 0) {
+          const result = await runOnce();
+          if (result.status === 0) {
             if (step.captureName) {
-              scope.vars.set(step.captureName, lastResult.returnValue ?? lastResult.output.trim());
+              scope.vars.set(step.captureName, result.returnValue ?? result.output.trim());
             }
+          } else if (step.catch) {
+            const rr = await this.runRecoverBody(scope, step.catch, `${result.output}${result.error}`);
+            if (rr.status !== 0 || rr.returnValue !== undefined) return this.mergeStepResult(accOut, accErr, rr);
           } else {
-            return this.mergeStepResult(accOut, accErr, lastResult);
+            return this.mergeStepResult(accOut, accErr, result);
           }
           continue;
         }
-        const runResult = await this.executeRunRef(scope, step.workflow.value, step.args ?? "");
-        if (runResult.status === 0) {
-          if (step.captureName) {
-            scope.vars.set(step.captureName, runResult.returnValue ?? runResult.output.trim());
+        if (body.kind === "prompt") {
+          if (body.returns !== undefined && !step.captureName) {
+            return this.mergeStepResult(accOut, accErr, {
+              status: 1,
+              output: "",
+              error: 'prompt with "returns" schema must capture to a variable',
+            });
           }
-        } else if (step.catch) {
-          const rr = await this.runRecoverBody(scope, step.catch, `${runResult.output}${runResult.error}`);
-          if (rr.status !== 0 || rr.returnValue !== undefined) return this.mergeStepResult(accOut, accErr, rr);
-        } else {
-          return this.mergeStepResult(accOut, accErr, runResult);
+          const r = await this.runPromptStep(scope, body.raw, body.returns, step.captureName, io);
+          accOut += r.output;
+          if (!r.ok) return this.mergeStepResult(accOut, accErr, r.result);
+          continue;
         }
-        continue;
-      }
-      if (step.type === "run_inline_script") {
-        const shebang = step.lang ? `#!/usr/bin/env ${step.lang}` : undefined;
-        const result = await this.executeInlineScript(scope, step.body, shebang, step.args ?? "");
-        if (step.captureName && result.status === 0) {
-          scope.vars.set(step.captureName, result.returnValue ?? result.output.trim());
+        if (body.kind === "match") {
+          const matchResult = await this.evaluateMatch(scope, body.match);
+          if (!matchResult.ok) return this.mergeStepResult(accOut, accErr, matchResult.result);
+          if (step.captureName) scope.vars.set(step.captureName, matchResult.value);
+          continue;
         }
-        if (result.status !== 0) return this.mergeStepResult(accOut, accErr, result);
-        continue;
-      }
-      if (step.type === "ensure") {
-        const ensureResult = await this.executeEnsureRef(scope, step.ref.value, step.args ?? "", step.catch);
-        if (step.captureName && ensureResult.status === 0) {
-          scope.vars.set(step.captureName, ensureResult.returnValue ?? ensureResult.output.trim());
+        if (body.kind === "shell") {
+          const cmdIr = await this.interpolateWithCaptures(body.command, scope);
+          if (!cmdIr.ok) return this.mergeStepResult(accOut, accErr, cmdIr.result);
+          const stepName = `sh_line_${body.loc.line}`;
+          const result = await this.executeManagedStep(
+            "script",
+            stepName,
+            [],
+            (io) => this.executeShLine(scope, cmdIr.value, io),
+          );
+          if (step.captureName && result.status === 0) {
+            scope.vars.set(step.captureName, result.returnValue ?? result.output.trim());
+          }
+          if (result.status !== 0) return this.mergeStepResult(accOut, accErr, result);
+          continue;
         }
-        if (ensureResult.status !== 0) return this.mergeStepResult(accOut, accErr, ensureResult);
-        if (ensureResult.recoverReturn) return this.mergeStepResult(accOut, accErr, ensureResult);
-        continue;
+        return this.mergeStepResult(accOut, accErr, {
+          status: 1,
+          output: "",
+          error: `unsupported exec body kind in runtime: ${body.kind}`,
+        });
       }
       if (step.type === "if") {
-        // Resolve handle if the subject variable is a handle.
-        const rawSubject = scope.vars.get(step.subject);
-        if (rawSubject && this.isHandle(rawSubject)) {
-          const hr = await this.resolveHandleVar(scope, step.subject);
-          if (hr.status !== 0) return this.mergeStepResult(accOut, accErr, hr);
-        }
-        const subjectVal = scope.vars.get(step.subject) ?? scope.env?.[step.subject] ?? "";
+        const resolved = await this.resolveSubjectValue(scope, step.subject);
+        if (!resolved.ok) return this.mergeStepResult(accOut, accErr, resolved.result);
+        const subjectVal = resolved.value;
         let condMet = false;
         if (step.operator === "==" && step.operand.kind === "string_literal") {
           condMet = subjectVal === step.operand.value;
@@ -857,8 +1038,9 @@ export class NodeWorkflowRuntime {
         } else if (step.operator === "!~" && step.operand.kind === "regex") {
           condMet = !new RegExp(step.operand.source).test(subjectVal);
         }
-        if (condMet) {
-          const bodyResult = await this.executeSteps(scope, step.body, io);
+        const branch = condMet ? step.body : step.elseBody;
+        if (branch) {
+          const bodyResult = await this.executeSteps(scope, branch, io);
           if (bodyResult.status !== 0 || bodyResult.returnValue !== undefined) {
             return this.mergeStepResult(accOut, accErr, bodyResult);
           }
@@ -883,12 +1065,6 @@ export class NodeWorkflowRuntime {
         }
         continue;
       }
-      if (step.type === "match") {
-        const matchResult = await this.evaluateMatch(scope, step.expr);
-        if (!matchResult.ok) return this.mergeStepResult(accOut, accErr, matchResult.result);
-        // Standalone match: value is discarded
-        continue;
-      }
     }
     // Implicit join: await all unresolved handles created in this scope before returning.
     if (localHandleIds.length > 0) {
@@ -944,8 +1120,17 @@ export class NodeWorkflowRuntime {
   }
 
   private async drainWorkflowQueue(scope: Scope, ctx: WorkflowContext): Promise<StepResult> {
+    const limit = resolveInboxDispatchLimit(this.env);
     let cursor = 0;
     while (cursor < ctx.queue.length) {
+      if (cursor >= limit) {
+        const blocker = ctx.queue[cursor]!;
+        return {
+          status: 1,
+          output: "",
+          error: `E_INBOX_DISPATCH_LIMIT: drained ${limit} messages without quiescing — likely a circular send (channel "${blocker.channel}"); raise JAIPH_INBOX_MAX_DISPATCH if intentional`,
+        };
+      }
       const msg = ctx.queue[cursor]!;
       cursor += 1;
       const targets = ctx.routes.get(msg.channel) ?? [];
@@ -1087,30 +1272,31 @@ export class NodeWorkflowRuntime {
    * Execute a prompt step, stream output to artifacts, and bind the captured
    * value (and per-field exports when a returns schema is set) into `scope`.
    * Returns the chunk of stdout to add to the caller's accumulator.
+   *
+   * Transport-failure backoff: a non-zero exit from `executePrompt` (spawn
+   * failure, backend non-zero exit, codex HTTP error) is retried on the
+   * configured delay schedule (default: 15s → 1m → 10m → 30m → 2h, 6 attempts
+   * total). Each attempt is a fresh `executePrompt` call with its own
+   * PROMPT_START/PROMPT_END and STEP_START/STEP_END events. Backoff composes
+   * *below* `recover`/`catch`: retries are exhausted before the failure
+   * reaches the enclosing recover loop. Deterministic post-processing
+   * failures (invalid JSON, schema validation) are not retried — they fail
+   * identically on re-run.
    */
   private async runPromptStep(
     scope: Scope,
     raw: string,
-    bodyKind: "string" | "identifier" | "triple_quoted" | undefined,
     returns: string | undefined,
     captureName: string | undefined,
     io: StepIO | undefined,
   ): Promise<{ ok: true; output: string } | { ok: false; result: StepResult; output: string }> {
-    const promptRaw = bodyKind === "triple_quoted" ? tripleQuotedRawForRuntime(raw) : raw;
-    const promptIr = await this.interpolateWithCaptures(promptRaw, scope);
+    const promptIr = await this.interpolateWithCaptures(raw, scope);
     if (!promptIr.ok) return { ok: false, result: promptIr.result, output: "" };
     let promptText = promptIr.value;
     const promptConfig = resolveConfig(scope.env);
     const backend = promptConfig.backend || "cursor";
     const stepName = resolvePromptStepName(promptConfig);
     const modelRes = resolveModel(promptConfig);
-    const promptStep = this.emitter.emitPromptStepStart(stepName, scope.vars, raw);
-    this.emitter.emitPromptEvent("PROMPT_START", {
-      backend,
-      model: modelRes.model || undefined,
-      model_reason: modelRes.reason,
-      preview: promptText.slice(0, 120),
-    });
     let schemaFields: PromptSchemaField[] | undefined;
     if (returns !== undefined) {
       schemaFields = parsePromptSchema(returns);
@@ -1119,49 +1305,117 @@ export class NodeWorkflowRuntime {
         "\n\nRespond with exactly one line of valid JSON (no markdown, no explanation) matching this schema: " +
         JSON.stringify(schemaObject);
     }
-    const out = new PassThrough();
-    const chunks: string[] = [];
-    const err = new PassThrough();
-    const errChunks: string[] = [];
-    out.on("data", (d) => {
-      const chunk = String(d);
-      chunks.push(chunk);
-      appendFileSync(promptStep.outFile, chunk);
-      io?.appendOut(chunk);
-    });
-    err.on("data", (d) => {
-      const chunk = String(d);
-      errChunks.push(chunk);
-      io?.appendErr(chunk);
-    });
-    const result = await executePrompt(promptText, promptConfig, out, scope.env, err);
-    const promptErr = errChunks.join("");
-    this.emitter.emitPromptStepEnd(promptStep, result.status, chunks.join(""), promptErr);
-    this.emitter.emitPromptEvent("PROMPT_END", {
-      backend,
-      model: modelRes.model || undefined,
-      model_reason: modelRes.reason,
-      status: result.status,
-    });
-    const output = chunks.join("");
-    if (result.status !== 0) {
-      return {
-        ok: false,
-        result: { status: result.status, output: "", error: promptErr.trim() || "prompt failed" },
-        output,
+    const delaysRes = this.getPromptRetryDelays();
+    if (!delaysRes.ok) {
+      this.emitter.emitLog("LOGERR", `prompt retry config invalid: ${delaysRes.error}`);
+      return { ok: false, result: { status: 1, output: "", error: delaysRes.error }, output: "" };
+    }
+    const delays = delaysRes.delays;
+    const totalAttempts = delays.length + 1;
+
+    let lastOutput = "";
+    let lastResult: StepResult = { status: 1, output: "", error: "prompt failed" };
+    let lastFinal = "";
+
+    for (let attempt = 1; attempt <= totalAttempts; attempt += 1) {
+      if (this.abortController.signal.aborted) {
+        this.emitter.emitLog(
+          "LOGERR",
+          `prompt aborted before attempt ${attempt}/${totalAttempts} (${backend}); retries halted`,
+        );
+        return {
+          ok: false,
+          result: { status: lastResult.status || 1, output: "", error: "prompt retry aborted" },
+          output: lastOutput,
+        };
+      }
+      const promptStep = this.emitter.emitPromptStepStart(stepName, scope.vars, raw);
+      this.emitter.emitPromptEvent("PROMPT_START", {
+        backend,
+        model: modelRes.model || undefined,
+        model_reason: modelRes.reason,
+        preview: promptText.slice(0, 120),
+      });
+      const out = new PassThrough();
+      const chunks: string[] = [];
+      const err = new PassThrough();
+      const errChunks: string[] = [];
+      out.on("data", (d) => {
+        const chunk = String(d);
+        chunks.push(chunk);
+        appendFileSync(promptStep.outFile, chunk);
+        io?.appendOut(chunk);
+      });
+      err.on("data", (d) => {
+        const chunk = String(d);
+        errChunks.push(chunk);
+        io?.appendErr(chunk);
+      });
+      const result = await executePrompt(promptText, promptConfig, out, scope.env, err);
+      const promptErr = errChunks.join("");
+      this.emitter.emitPromptStepEnd(promptStep, result.status, chunks.join(""), promptErr);
+      this.emitter.emitPromptEvent("PROMPT_END", {
+        backend,
+        model: modelRes.model || undefined,
+        model_reason: modelRes.reason,
+        status: result.status,
+      });
+      lastOutput = chunks.join("");
+      lastFinal = result.final;
+      lastResult = {
+        status: result.status,
+        output: "",
+        error: promptErr.trim() || "prompt failed",
       };
+      if (result.status === 0) break;
+      // Transport failure path: log + (sleep + retry) or terminate.
+      const errSummary = summarizeError(lastResult.error ?? "");
+      if (attempt >= totalAttempts) {
+        this.emitter.emitLog(
+          "LOGERR",
+          `prompt attempt ${attempt}/${totalAttempts} failed (${backend}): ${errSummary}; retries exhausted, failing step`,
+        );
+        return { ok: false, result: lastResult, output: lastOutput };
+      }
+      const nextDelayMs = delays[attempt - 1]!;
+      const nextDelayLabel = formatRetryDelay(nextDelayMs);
+      this.emitter.emitLog(
+        "LOGERR",
+        `prompt attempt ${attempt}/${totalAttempts} failed (${backend}): ${errSummary}; retrying in ${nextDelayLabel}`,
+      );
+      try {
+        await this.sleep(nextDelayMs, this.abortController.signal);
+      } catch (sleepErr) {
+        if (isPromptRetryAbortError(sleepErr) || this.abortController.signal.aborted) {
+          this.emitter.emitLog(
+            "LOGERR",
+            `prompt retry aborted during backoff after attempt ${attempt}/${totalAttempts} (${backend}); retries halted`,
+          );
+          return {
+            ok: false,
+            result: { status: lastResult.status || 1, output: "", error: "prompt retry aborted" },
+            output: lastOutput,
+          };
+        }
+        throw sleepErr;
+      }
     }
+
     if (schemaFields) {
-      const extracted = extractJson(result.final);
+      const extracted = extractJson(lastFinal);
       if (!extracted) {
-        return { ok: false, result: { status: 1, output: "", error: "prompt returned invalid JSON" }, output };
+        return {
+          ok: false,
+          result: { status: 1, output: "", error: "prompt returned invalid JSON" },
+          output: lastOutput,
+        };
       }
       const validation = validateFields(extracted.obj, schemaFields);
       if (validation !== 0) {
         return {
           ok: false,
           result: { status: validation, output: "", error: "prompt response failed schema validation" },
-          output,
+          output: lastOutput,
         };
       }
       if (captureName) {
@@ -1171,9 +1425,9 @@ export class NodeWorkflowRuntime {
         }
       }
     } else if (captureName) {
-      scope.vars.set(captureName, result.final);
+      scope.vars.set(captureName, lastFinal);
     }
-    return { ok: true, output };
+    return { ok: true, output: lastOutput };
   }
 
   /** Run a recover/catch body with `failure` bound to the failed step's payload. */
@@ -1195,7 +1449,7 @@ export class NodeWorkflowRuntime {
     scope: Scope,
     ref: string,
     argsRaw: string,
-    catchDef: EnsureRecover | undefined,
+    catchDef: CatchBody | undefined,
   ): Promise<StepResult> {
     const resolvedArgs = await this.resolveArgsRaw(scope, argsRaw);
     if (!Array.isArray(resolvedArgs)) return resolvedArgs;
@@ -1363,6 +1617,10 @@ export class NodeWorkflowRuntime {
   }
 
   private resolveRecoverLimit(filePath: string): number {
+    const activeWorkflowMeta = this.workflowCtxStack[this.workflowCtxStack.length - 1]?.workflowMeta;
+    if (activeWorkflowMeta?.run?.recoverLimit !== undefined) {
+      return activeWorkflowMeta.run.recoverLimit;
+    }
     const moduleMeta = this.graph.modules.get(filePath)?.ast.metadata;
     return moduleMeta?.run?.recoverLimit ?? 10;
   }
diff --git a/src/runtime/kernel/prompt-retry.test.ts b/src/runtime/kernel/prompt-retry.test.ts
new file mode 100644
index 00000000..f50f0dd6
--- /dev/null
+++ b/src/runtime/kernel/prompt-retry.test.ts
@@ -0,0 +1,131 @@
+import { describe, it } from "node:test";
+import assert from "node:assert/strict";
+import {
+  DEFAULT_PROMPT_RETRY_DELAYS_MS,
+  defaultPromptSleep,
+  formatRetryDelay,
+  isPromptRetryAbortError,
+  PromptRetryAbortError,
+  resolvePromptRetryDelays,
+  summarizeError,
+} from "./prompt-retry";
+
+describe("resolvePromptRetryDelays", () => {
+  it("returns the default schedule when env is empty", () => {
+    assert.deepEqual(resolvePromptRetryDelays({}), [
+      15_000, 60_000, 600_000, 1_800_000, 7_200_000,
+    ]);
+  });
+
+  it("matches the documented default constant", () => {
+    assert.deepEqual([...DEFAULT_PROMPT_RETRY_DELAYS_MS], resolvePromptRetryDelays({}));
+  });
+
+  it("disables retries when JAIPH_PROMPT_RETRY=0", () => {
+    assert.deepEqual(resolvePromptRetryDelays({ JAIPH_PROMPT_RETRY: "0" }), []);
+  });
+
+  it("disable switch trims whitespace", () => {
+    assert.deepEqual(resolvePromptRetryDelays({ JAIPH_PROMPT_RETRY: "  0  " }), []);
+  });
+
+  it("parses JAIPH_PROMPT_RETRY_DELAYS as comma-separated ms", () => {
+    assert.deepEqual(
+      resolvePromptRetryDelays({ JAIPH_PROMPT_RETRY_DELAYS: "10,20,30" }),
+      [10, 20, 30],
+    );
+  });
+
+  it("trims whitespace around each delay entry", () => {
+    assert.deepEqual(
+      resolvePromptRetryDelays({ JAIPH_PROMPT_RETRY_DELAYS: " 10 , 20 ,30 " }),
+      [10, 20, 30],
+    );
+  });
+
+  it("throws on non-numeric entries", () => {
+    assert.throws(
+      () => resolvePromptRetryDelays({ JAIPH_PROMPT_RETRY_DELAYS: "10,abc,30" }),
+      /JAIPH_PROMPT_RETRY_DELAYS contains invalid entry "abc"/,
+    );
+  });
+
+  it("throws on negative-looking entries (sign chars are rejected)", () => {
+    assert.throws(
+      () => resolvePromptRetryDelays({ JAIPH_PROMPT_RETRY_DELAYS: "10,-5" }),
+      /JAIPH_PROMPT_RETRY_DELAYS contains invalid entry "-5"/,
+    );
+  });
+
+  it("throws on empty list when the var is set with only commas/whitespace", () => {
+    assert.throws(
+      () => resolvePromptRetryDelays({ JAIPH_PROMPT_RETRY_DELAYS: " , , " }),
+      /JAIPH_PROMPT_RETRY_DELAYS is set but has no delay entries/,
+    );
+  });
+});
+
+describe("defaultPromptSleep", () => {
+  it("resolves after the requested ms when not aborted", async () => {
+    const start = Date.now();
+    const ctrl = new AbortController();
+    await defaultPromptSleep(20, ctrl.signal);
+    assert.ok(Date.now() - start >= 15, "should have actually waited (~20ms)");
+  });
+
+  it("rejects with PromptRetryAbortError when the signal is already aborted", async () => {
+    const ctrl = new AbortController();
+    ctrl.abort();
+    await assert.rejects(
+      () => defaultPromptSleep(10_000, ctrl.signal),
+      (err) => isPromptRetryAbortError(err) && err instanceof PromptRetryAbortError,
+    );
+  });
+
+  it("rejects promptly when aborted mid-sleep", async () => {
+    const ctrl = new AbortController();
+    const start = Date.now();
+    const pending = defaultPromptSleep(10_000, ctrl.signal);
+    setTimeout(() => ctrl.abort(), 10);
+    await assert.rejects(pending, (err) => isPromptRetryAbortError(err));
+    assert.ok(Date.now() - start < 500, "abort should short-circuit the wait");
+  });
+});
+
+describe("formatRetryDelay", () => {
+  it("renders sub-second values in ms", () => {
+    assert.equal(formatRetryDelay(750), "750ms");
+  });
+
+  it("renders seconds for <60s values", () => {
+    assert.equal(formatRetryDelay(15_000), "15s");
+  });
+
+  it("renders minutes for <60m values", () => {
+    assert.equal(formatRetryDelay(60_000), "1m");
+    assert.equal(formatRetryDelay(600_000), "10m");
+    assert.equal(formatRetryDelay(1_800_000), "30m");
+  });
+
+  it("renders hours for >=60m values", () => {
+    assert.equal(formatRetryDelay(7_200_000), "2h");
+  });
+});
+
+describe("summarizeError", () => {
+  it("returns first non-empty line, trimmed", () => {
+    assert.equal(summarizeError("  first line  \nsecond line"), "first line");
+  });
+
+  it("placeholder when error is empty", () => {
+    assert.equal(summarizeError(""), "(no error message)");
+    assert.equal(summarizeError("   \n   "), "(no error message)");
+  });
+
+  it("truncates very long lines with an ellipsis marker", () => {
+    const long = "x".repeat(400);
+    const out = summarizeError(long);
+    assert.ok(out.length <= 220);
+    assert.match(out, /…$/);
+  });
+});
diff --git a/src/runtime/kernel/prompt-retry.ts b/src/runtime/kernel/prompt-retry.ts
new file mode 100644
index 00000000..5a971963
--- /dev/null
+++ b/src/runtime/kernel/prompt-retry.ts
@@ -0,0 +1,119 @@
+/**
+ * Retry policy for prompt-execution (transport) failures.
+ *
+ * Schema: a fixed sequence of delays (ms) to wait before each retry attempt.
+ * `delays.length + 1` total attempts (1 initial + N retries). Schedule the
+ * default sequence escalates: 15s, 1m, 10m, 30m, 2h — total ~2h41m wall-clock
+ * for a full failure run. Under Docker the container timeout
+ * (`runtime.docker_timeout_seconds`, default 3600s) caps this; raise it via
+ * the metadata key or JAIPH_DOCKER_TIMEOUT for workflows that need the full
+ * retry budget inside a sandbox.
+ */
+export const DEFAULT_PROMPT_RETRY_DELAYS_MS: readonly number[] = [
+  15_000,
+  60_000,
+  600_000,
+  1_800_000,
+  7_200_000,
+];
+
+/**
+ * Resolve the retry delay schedule from environment.
+ *
+ * - JAIPH_PROMPT_RETRY=0 → disable retries (returns []).
+ * - JAIPH_PROMPT_RETRY_DELAYS="15000,60000" → override schedule (comma list of ms).
+ * - Otherwise → DEFAULT_PROMPT_RETRY_DELAYS_MS.
+ *
+ * Throws on invalid input (non-numeric entries, negative values) so the
+ * misconfiguration surfaces as a clear step error rather than silently
+ * falling back to the default.
+ */
+export function resolvePromptRetryDelays(env: NodeJS.ProcessEnv | Record<string, string | undefined>): number[] {
+  const disable = env.JAIPH_PROMPT_RETRY;
+  if (disable !== undefined && disable.trim() === "0") {
+    return [];
+  }
+  const raw = env.JAIPH_PROMPT_RETRY_DELAYS;
+  if (raw === undefined || raw.trim() === "") {
+    return [...DEFAULT_PROMPT_RETRY_DELAYS_MS];
+  }
+  const parts = raw.split(",").map((p) => p.trim()).filter((p) => p.length > 0);
+  if (parts.length === 0) {
+    throw new Error(
+      `JAIPH_PROMPT_RETRY_DELAYS is set but has no delay entries; expected comma-separated ms (e.g. "15000,60000") or unset`,
+    );
+  }
+  const delays: number[] = [];
+  for (const part of parts) {
+    if (!/^[0-9]+$/.test(part)) {
+      throw new Error(
+        `JAIPH_PROMPT_RETRY_DELAYS contains invalid entry "${part}"; expected non-negative integers (ms)`,
+      );
+    }
+    const n = Number.parseInt(part, 10);
+    if (!Number.isFinite(n) || n < 0) {
+      throw new Error(
+        `JAIPH_PROMPT_RETRY_DELAYS contains invalid entry "${part}"; expected non-negative integers (ms)`,
+      );
+    }
+    delays.push(n);
+  }
+  return delays;
+}
+
+/**
+ * setTimeout-based sleep that races against an AbortSignal. When the signal
+ * fires, the pending timer is cleared and the promise rejects with an
+ * abort-marked Error so the retry loop exits promptly without further
+ * executePrompt calls.
+ */
+export function defaultPromptSleep(ms: number, signal: AbortSignal): Promise<void> {
+  return new Promise((resolve, reject) => {
+    if (signal.aborted) {
+      reject(new PromptRetryAbortError());
+      return;
+    }
+    const onAbort = (): void => {
+      clearTimeout(timer);
+      signal.removeEventListener("abort", onAbort);
+      reject(new PromptRetryAbortError());
+    };
+    const timer = setTimeout(() => {
+      signal.removeEventListener("abort", onAbort);
+      resolve();
+    }, ms);
+    signal.addEventListener("abort", onAbort, { once: true });
+  });
+}
+
+export class PromptRetryAbortError extends Error {
+  constructor() {
+    super("prompt retry aborted");
+    this.name = "PromptRetryAbortError";
+  }
+}
+
+export function isPromptRetryAbortError(err: unknown): err is PromptRetryAbortError {
+  return err instanceof PromptRetryAbortError;
+}
+
+/** Render a backoff delay for human log messages (e.g. "15s", "1m", "2h"). */
+export function formatRetryDelay(ms: number): string {
+  if (ms < 1000) return `${ms}ms`;
+  const seconds = Math.round(ms / 1000);
+  if (seconds < 60) return `${seconds}s`;
+  const minutes = Math.round(seconds / 60);
+  if (minutes < 60) return `${minutes}m`;
+  const hours = Math.round(minutes / 60);
+  return `${hours}h`;
+}
+
+/** Single-line summary of an error string for log messages. */
+export function summarizeError(err: string): string {
+  const trimmed = err.trim();
+  if (trimmed.length === 0) return "(no error message)";
+  const firstLine = trimmed.split(/\r?\n/, 1)[0]!.trim();
+  if (firstLine.length === 0) return "(no error message)";
+  const MAX = 200;
+  return firstLine.length > MAX ? `${firstLine.slice(0, MAX)}…` : firstLine;
+}
diff --git a/src/runtime/kernel/prompt.test.ts b/src/runtime/kernel/prompt.test.ts
index b07606f9..fa10db5c 100644
--- a/src/runtime/kernel/prompt.test.ts
+++ b/src/runtime/kernel/prompt.test.ts
@@ -3,10 +3,13 @@ import * as assert from "node:assert/strict";
 import { chmodSync, existsSync, mkdtempSync, rmSync, writeFileSync } from "node:fs";
 import { tmpdir } from "node:os";
 import { join } from "node:path";
+import { EventEmitter } from "node:events";
 import { PassThrough } from "node:stream";
+import type { ChildProcess } from "node:child_process";
 import {
   buildBackendArgs,
   executePrompt,
+  installPromptWatchdog,
   prepareClaudeEnv,
   resolveConfig,
   resolveModel,
@@ -231,6 +234,202 @@ describe("executePrompt", () => {
   });
 });
 
+/** Minimal ChildProcess stand-in: an EventEmitter with a recording `kill`. */
+function makeFakeChild(): { child: ChildProcess; killSignals: string[] } {
+  const emitter = new EventEmitter() as EventEmitter & { pid: number; kill: (s?: string) => boolean };
+  const killSignals: string[] = [];
+  emitter.pid = 4242;
+  emitter.kill = (signal?: string) => {
+    killSignals.push(signal ?? "SIGTERM");
+    return true;
+  };
+  return { child: emitter as unknown as ChildProcess, killSignals };
+}
+
+describe("installPromptWatchdog", () => {
+  it("layer 2: terminates and fails when output stalls past the idle timeout", async () => {
+    const { child, killSignals } = makeFakeChild();
+    const events: Array<{ status: number; reason: string; final: string }> = [];
+    const stderr = new PassThrough();
+    const wd = installPromptWatchdog(
+      child,
+      makeConfig({ idleTimeoutMs: 40, maxDurationMs: 0, completionGraceMs: 0 }),
+      "claude",
+      stderr,
+      (status, reason, final) => events.push({ status, reason, final }),
+    );
+    await delay(120);
+    wd.clear();
+    assert.equal(events.length, 1);
+    assert.equal(events[0].status, 1);
+    assert.match(events[0].reason, /no output/);
+    assert.ok(killSignals.includes("SIGTERM"));
+  });
+
+  it("layer 2: bump() resets the idle timer so active runs are not killed", async () => {
+    const { child } = makeFakeChild();
+    const events: number[] = [];
+    const wd = installPromptWatchdog(
+      child,
+      makeConfig({ idleTimeoutMs: 80, maxDurationMs: 0, completionGraceMs: 0 }),
+      "claude",
+      new PassThrough(),
+      (status) => events.push(status),
+    );
+    // Keep bumping inside the idle window for longer than the timeout itself.
+    for (let i = 0; i < 4; i += 1) {
+      await delay(40);
+      wd.bump();
+    }
+    assert.equal(events.length, 0, "should not have expired while active");
+    wd.clear();
+  });
+
+  it("layer 3: terminates and fails past the absolute maximum duration", async () => {
+    const { child, killSignals } = makeFakeChild();
+    const events: Array<{ status: number; reason: string }> = [];
+    const wd = installPromptWatchdog(
+      child,
+      makeConfig({ idleTimeoutMs: 0, maxDurationMs: 40, completionGraceMs: 0 }),
+      "claude",
+      new PassThrough(),
+      (status, reason) => events.push({ status, reason }),
+    );
+    // bump() must NOT save it from the absolute cap.
+    await delay(20);
+    wd.bump();
+    await delay(60);
+    wd.clear();
+    assert.equal(events.length, 1);
+    assert.equal(events[0].status, 1);
+    assert.match(events[0].reason, /maximum duration/);
+    assert.ok(killSignals.includes("SIGTERM"));
+  });
+
+  it("layer 1: after completion, terminates and SUCCEEDS if the process never exits", async () => {
+    const { child, killSignals } = makeFakeChild();
+    const events: Array<{ status: number; reason: string; final: string }> = [];
+    const wd = installPromptWatchdog(
+      child,
+      makeConfig({ idleTimeoutMs: 0, maxDurationMs: 0, completionGraceMs: 40 }),
+      "claude",
+      new PassThrough(),
+      (status, reason, final) => events.push({ status, reason, final }),
+    );
+    wd.markComplete("the answer");
+    await delay(120);
+    wd.clear();
+    assert.equal(events.length, 1);
+    assert.equal(events[0].status, 0, "completion grace must settle with success");
+    assert.equal(events[0].final, "the answer");
+    assert.match(events[0].reason, /did not exit/);
+    assert.ok(killSignals.includes("SIGTERM"));
+  });
+
+  it("clear() before any timer fires prevents termination", async () => {
+    const { child, killSignals } = makeFakeChild();
+    const events: number[] = [];
+    const wd = installPromptWatchdog(
+      child,
+      makeConfig({ idleTimeoutMs: 40, maxDurationMs: 40, completionGraceMs: 40 }),
+      "claude",
+      new PassThrough(),
+      (status) => events.push(status),
+    );
+    wd.clear();
+    await delay(120);
+    assert.equal(events.length, 0);
+    assert.equal(killSignals.length, 0);
+  });
+
+  it("fires onExpire at most once even when multiple layers would trip", async () => {
+    const { child } = makeFakeChild();
+    const events: number[] = [];
+    const wd = installPromptWatchdog(
+      child,
+      makeConfig({ idleTimeoutMs: 30, maxDurationMs: 35, completionGraceMs: 0 }),
+      "claude",
+      new PassThrough(),
+      (status) => events.push(status),
+    );
+    await delay(120);
+    wd.clear();
+    assert.equal(events.length, 1);
+  });
+});
+
+describe("executePrompt — prompt watchdog (end to end)", () => {
+  it("recovers (success) when the agent finishes but the process never exits", async () => {
+    const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-grace-"));
+    try {
+      // Fake cursor-agent: emit a terminal `result` event, then hang forever.
+      const fakeAgent = join(root, "cursor-agent");
+      writeFileSync(
+        fakeAgent,
+        [
+          "#!/usr/bin/env bash",
+          `printf '%s\\n' '{"type":"result","result":"done-but-stuck"}'`,
+          // `exec` so SIGTERM hits sleep directly — no orphaned grandchild.
+          "exec sleep 600",
+          "",
+        ].join("\n"),
+      );
+      chmodSync(fakeAgent, 0o755);
+      const stdout = new PassThrough();
+      stdout.on("data", () => {});
+      const result = await executePrompt(
+        "ignored",
+        makeConfig({
+          agentCommand: fakeAgent,
+          workspaceRoot: root,
+          trustedWorkspace: root,
+          completionGraceMs: 150,
+          idleTimeoutMs: 0,
+          maxDurationMs: 0,
+        }),
+        stdout,
+      );
+      assert.equal(result.status, 0);
+      assert.equal(result.final, "done-but-stuck");
+    } finally {
+      rmSync(root, { recursive: true, force: true });
+    }
+  });
+
+  it("recovers (failure) when the agent hangs with no output", async () => {
+    const root = mkdtempSync(join(tmpdir(), "jaiph-prompt-idle-"));
+    try {
+      const fakeAgent = join(root, "cursor-agent");
+      writeFileSync(
+        fakeAgent,
+        ["#!/usr/bin/env bash", "exec sleep 600", ""].join("\n"),
+      );
+      chmodSync(fakeAgent, 0o755);
+      const stdout = new PassThrough();
+      stdout.on("data", () => {});
+      const result = await executePrompt(
+        "ignored",
+        makeConfig({
+          agentCommand: fakeAgent,
+          workspaceRoot: root,
+          trustedWorkspace: root,
+          completionGraceMs: 0,
+          idleTimeoutMs: 150,
+          maxDurationMs: 0,
+        }),
+        stdout,
+      );
+      assert.equal(result.status, 1);
+    } finally {
+      rmSync(root, { recursive: true, force: true });
+    }
+  });
+});
+
+function delay(ms: number): Promise<void> {
+  return new Promise((resolve) => setTimeout(resolve, ms));
+}
+
 describe("prepareClaudeEnv", () => {
   it("keeps existing env when configured claude dir is writable", () => {
     const root = mkdtempSync(join(tmpdir(), "jaiph-claude-env-ok-"));
diff --git a/src/runtime/kernel/prompt.ts b/src/runtime/kernel/prompt.ts
index 8a8569ad..c4b26f05 100644
--- a/src/runtime/kernel/prompt.ts
+++ b/src/runtime/kernel/prompt.ts
@@ -1,6 +1,6 @@
 // Prompt execution: spawn the configured agent backend and stream its output.
 
-import { spawn as nodeSpawn } from "node:child_process";
+import { spawn as nodeSpawn, type ChildProcess } from "node:child_process";
 import { writeFileSync, readFileSync, existsSync, accessSync, mkdirSync, cpSync, constants as fsConstants } from "node:fs";
 import { basename, delimiter, join } from "node:path";
 import { parseStream, type StreamWriter } from "./stream-parser";
@@ -17,8 +17,44 @@ export type PromptConfig = {
   codexApiKey: string;
   codexApiUrl: string;
   promptFinalFile: string;
+  /**
+   * Watchdog timeouts for the subprocess backends (claude / cursor / custom).
+   * All in milliseconds; `0` disables that watchdog. Optional so existing
+   * callers/tests that build a config literal keep working — `runBackend`
+   * falls back to the DEFAULT_* constants when a field is omitted.
+   */
+  completionGraceMs?: number;
+  idleTimeoutMs?: number;
+  maxDurationMs?: number;
 };
 
+/**
+ * Layer 1 — completion grace: once the backend emits its terminal `result`
+ * event the answer is complete. We give the process this long to exit on its
+ * own before terminating it and returning success. Guards the known failure
+ * mode where `claude -p` finishes the work but never exits.
+ */
+export const DEFAULT_PROMPT_COMPLETION_GRACE_MS = 30_000;
+/**
+ * Layer 2 — idle timeout: if the backend produces no stdout/stderr for this
+ * long it is considered hung mid-work. We terminate it and return a non-zero
+ * status so the runtime's retry/backoff loop takes over.
+ */
+export const DEFAULT_PROMPT_IDLE_TIMEOUT_MS = 900_000; // 15m
+/**
+ * Layer 3 — absolute cap: a single prompt may never run longer than this,
+ * regardless of activity. Backstop against slow-but-not-idle hangs.
+ */
+export const DEFAULT_PROMPT_MAX_DURATION_MS = 7_200_000; // 2h
+
+/** Parse a "seconds" env value into milliseconds; empty/invalid → default. `0` is honored (disables). */
+function parseSecondsMs(raw: string | undefined, defaultMs: number): number {
+  if (raw === undefined || raw.trim() === "") return defaultMs;
+  const seconds = Number(raw);
+  if (!Number.isFinite(seconds) || seconds < 0) return defaultMs;
+  return Math.floor(seconds * 1000);
+}
+
 export type ModelResolution = {
   model: string;
   reason: "explicit" | "flags" | "backend-default";
@@ -63,6 +99,15 @@ export function resolveConfig(env: NodeJS.ProcessEnv = process.env): PromptConfi
     codexApiKey: env.OPENAI_API_KEY || "",
     codexApiUrl: env.JAIPH_CODEX_API_URL || "https://api.openai.com/v1/chat/completions",
     promptFinalFile: env.JAIPH_PROMPT_FINAL_FILE || "",
+    completionGraceMs: parseSecondsMs(
+      env.JAIPH_PROMPT_COMPLETION_GRACE_SECONDS,
+      DEFAULT_PROMPT_COMPLETION_GRACE_MS,
+    ),
+    idleTimeoutMs: parseSecondsMs(
+      env.JAIPH_PROMPT_IDLE_TIMEOUT_SECONDS,
+      DEFAULT_PROMPT_IDLE_TIMEOUT_MS,
+    ),
+    maxDurationMs: parseSecondsMs(env.JAIPH_PROMPT_MAX_SECONDS, DEFAULT_PROMPT_MAX_DURATION_MS),
   };
 }
 
@@ -356,6 +401,119 @@ function runCodexBackend(
   });
 }
 
+type PromptWatchdog = {
+  /** Record backend activity (an stdout/stderr chunk); resets the idle timer. */
+  bump: () => void;
+  /** Record that the backend emitted its terminal result event (Layer 1). */
+  markComplete: (finalSoFar: string) => void;
+  /** Stop all timers; call once the prompt has settled. */
+  clear: () => void;
+};
+
+/**
+ * Install the three watchdog layers over a spawned backend child process:
+ *
+ *  1. Completion grace — once the backend signals completion (`markComplete`),
+ *     give it `completionGraceMs` to exit on its own, then terminate it and
+ *     settle with success. Fixes the case where `claude -p` finishes the work
+ *     but the process never exits (so the output stream never closes).
+ *  2. Idle timeout — if no output arrives for `idleTimeoutMs`, treat the run
+ *     as hung mid-work, terminate it, and settle with failure (status 1) so the
+ *     runtime's retry/backoff loop takes over.
+ *  3. Absolute cap — terminate and fail past `maxDurationMs` regardless of
+ *     activity, as a backstop against slow-but-not-idle hangs.
+ *
+ * `onExpire(status, reason, finalSoFar)` fires at most once. By the time it
+ * runs the child has already been sent SIGTERM (escalating to SIGKILL after a
+ * short delay), so the caller only needs to settle its promise.
+ */
+export function installPromptWatchdog(
+  child: ChildProcess,
+  config: PromptConfig,
+  backend: string,
+  stderr: NodeJS.WritableStream,
+  onExpire: (status: number, reason: string, finalSoFar: string) => void,
+): PromptWatchdog {
+  const completionGraceMs = config.completionGraceMs ?? DEFAULT_PROMPT_COMPLETION_GRACE_MS;
+  const idleTimeoutMs = config.idleTimeoutMs ?? DEFAULT_PROMPT_IDLE_TIMEOUT_MS;
+  const maxDurationMs = config.maxDurationMs ?? DEFAULT_PROMPT_MAX_DURATION_MS;
+
+  let fired = false;
+  let idleTimer: NodeJS.Timeout | undefined;
+  let maxTimer: NodeJS.Timeout | undefined;
+  let graceTimer: NodeJS.Timeout | undefined;
+  let lastFinal = "";
+
+  const clear = (): void => {
+    if (idleTimer) clearTimeout(idleTimer);
+    if (maxTimer) clearTimeout(maxTimer);
+    if (graceTimer) clearTimeout(graceTimer);
+    idleTimer = maxTimer = graceTimer = undefined;
+  };
+
+  const killChild = (): void => {
+    try {
+      child.kill("SIGTERM");
+    } catch {
+      // no-op
+    }
+    const escalate = setTimeout(() => {
+      try {
+        child.kill("SIGKILL");
+      } catch {
+        // no-op
+      }
+    }, 5000);
+    escalate.unref?.();
+  };
+
+  const expire = (status: number, reason: string): void => {
+    if (fired) return;
+    fired = true;
+    clear();
+    stderr.write(`jaiph: ${reason}; terminating ${backend} backend.\n`);
+    killChild();
+    onExpire(status, reason, lastFinal);
+  };
+
+  const armIdle = (): void => {
+    if (idleTimeoutMs <= 0) return;
+    if (idleTimer) clearTimeout(idleTimer);
+    idleTimer = setTimeout(
+      () => expire(1, `prompt produced no output for ${Math.round(idleTimeoutMs / 1000)}s`),
+      idleTimeoutMs,
+    );
+    idleTimer.unref?.();
+  };
+
+  if (maxDurationMs > 0) {
+    maxTimer = setTimeout(
+      () => expire(1, `prompt exceeded the ${Math.round(maxDurationMs / 1000)}s maximum duration`),
+      maxDurationMs,
+    );
+    maxTimer.unref?.();
+  }
+  armIdle();
+
+  return {
+    bump: () => armIdle(),
+    markComplete: (finalSoFar: string) => {
+      lastFinal = finalSoFar;
+      if (completionGraceMs <= 0 || fired || graceTimer) return;
+      graceTimer = setTimeout(
+        () =>
+          expire(
+            0,
+            `prompt completed but ${backend} did not exit within ${Math.round(completionGraceMs / 1000)}s`,
+          ),
+        completionGraceMs,
+      );
+      graceTimer.unref?.();
+    },
+    clear,
+  };
+}
+
 /** Run the backend process and parse its streaming output. */
 function runBackend(
   config: PromptConfig,
@@ -403,9 +561,48 @@ function runBackend(
       env: childEnv,
     });
 
+    // Single-settle guard shared by the normal-exit path and every watchdog.
+    let settled = false;
+    let exitCode: number | null = null;
+    // Extra stream to tear down on settle (the claude `merged` PassThrough).
+    let extraStream: { destroy: () => void } | undefined;
+    const settle = (final: string, status: number): void => {
+      if (settled) return;
+      settled = true;
+      watchdog.clear();
+      // Release Node's handles on the child's pipes. Without this, a descendant
+      // that outlives the child while holding the stdout write end (the classic
+      // `claude -p` hang) keeps these streams — and the event loop — alive even
+      // after we've terminated the child and resolved. Destroying here lets the
+      // runtime move on (and ultimately exit) regardless.
+      try {
+        child.stdin?.destroy();
+        child.stdout?.destroy();
+        child.stderr?.destroy();
+        extraStream?.destroy();
+      } catch {
+        // best-effort cleanup
+      }
+      resolve({ final, status });
+    };
+
+    // Watchdog layers (completion grace / idle / absolute cap). For custom
+    // commands only layers 2 and 3 apply — there is no result event to trigger
+    // layer 1, so markComplete is simply never called.
+    const watchdog = installPromptWatchdog(
+      child,
+      config,
+      isCustom ? command : config.backend,
+      stderr,
+      (status, _reason, finalSoFar) => settle(finalSoFar, status),
+    );
+
     child.on("error", (err) => {
       stderr.write(`jaiph: failed to start ${command}: ${err.message}\n`);
-      resolve({ final: "", status: 1 });
+      settle("", 1);
+    });
+    child.on("exit", (code) => {
+      exitCode = code;
     });
 
     if (useStdin && child.stdin) {
@@ -418,7 +615,9 @@ function runBackend(
       let final = "";
       let wroteHeader = false;
       child.stderr?.pipe(stderr);
+      child.stderr?.on("data", () => watchdog.bump());
       child.stdout?.on("data", (chunk: Buffer) => {
+        watchdog.bump();
         const text = chunk.toString();
         if (!wroteHeader) {
           writer.writeFinal("Final answer:\n");
@@ -428,7 +627,7 @@ function runBackend(
         final += text;
       });
       child.on("close", (code) => {
-        resolve({ final, status: code ?? 0 });
+        settle(final, code ?? exitCode ?? 0);
       });
       return;
     }
@@ -442,20 +641,31 @@ function runBackend(
       child.stderr?.pipe(merged);
       child.on("close", () => merged.end());
       parseInput = merged;
+      extraStream = merged;
     } else {
       // Cursor: parse only stdout; pipe stderr through to process stderr
       parseInput = child.stdout!;
       child.stderr?.pipe(stderr);
     }
 
-    parseStream(parseInput, writer).then((final) => {
-      child.on("close", (code) => {
-        resolve({ final, status: code ?? 0 });
-      });
-      if (child.exitCode !== null) {
-        resolve({ final, status: child.exitCode });
+    parseStream(parseInput, writer, {
+      onComplete: (finalSoFar) => watchdog.markComplete(finalSoFar),
+    }).then((final) => {
+      // Stream ended — process closed, or the watchdog already killed it and
+      // settled (in which case `settle` here is a no-op).
+      const close = (code: number | null): void => settle(final, code ?? exitCode ?? 0);
+      if (child.exitCode !== null || exitCode !== null) {
+        close(child.exitCode ?? exitCode);
+      } else {
+        child.on("close", (code) => close(code));
       }
     });
+
+    // Reset the idle watchdog on every chunk. Attached after parseStream so the
+    // cursor backend (whose stdout IS the parse input) does not drop the first
+    // chunk to a premature switch into flowing mode.
+    child.stdout?.on("data", () => watchdog.bump());
+    child.stderr?.on("data", () => watchdog.bump());
   });
 }
 
diff --git a/src/runtime/kernel/runtime-arg-parser.ts b/src/runtime/kernel/runtime-arg-parser.ts
index b09db127..925d9df4 100644
--- a/src/runtime/kernel/runtime-arg-parser.ts
+++ b/src/runtime/kernel/runtime-arg-parser.ts
@@ -5,7 +5,7 @@
  * resolve interpolated strings, parse call argument lists (including managed
  * `run`/`ensure` and inline-script forms), and validate prompt return schemas.
  */
-import { parseCallRef } from "../../parse/core";
+import { argsToRuntimeString, parseCallRef } from "../../parse/core";
 import { formatUtcTimestamp } from "./emit";
 
 export const BARE_IDENT_RE = /^[A-Za-z_][A-Za-z0-9_]*$/;
@@ -146,7 +146,7 @@ export function parseManagedArgAt(raw: string, start: number): { token: ParsedAr
         kind: "managed",
         managedKind: keyword,
         ref: call.ref,
-        argsRaw: call.args ?? "",
+        argsRaw: argsToRuntimeString(call.args),
       },
       next: start + keyword.length + skipped + consumed,
     };
diff --git a/src/runtime/kernel/stream-parser.ts b/src/runtime/kernel/stream-parser.ts
index 1e200b99..3b781907 100644
--- a/src/runtime/kernel/stream-parser.ts
+++ b/src/runtime/kernel/stream-parser.ts
@@ -14,6 +14,8 @@ export type StreamState = {
   sawFinalStreamDelta: boolean;
   sawFinalMessage: boolean;
   sawVisibleFinalText: boolean;
+  /** Set once the backend emits its terminal `result` event (work complete). */
+  sawResult: boolean;
 };
 
 export function createStreamState(): StreamState {
@@ -27,6 +29,7 @@ export function createStreamState(): StreamState {
     sawFinalStreamDelta: false,
     sawFinalMessage: false,
     sawVisibleFinalText: false,
+    sawResult: false,
   };
 }
 
@@ -185,7 +188,12 @@ export function processStreamLine(
         return;
       }
 
-      // Result object
+      // Result object — the backend's terminal event; marks the run complete
+      // even when the final text already arrived via deltas or an assistant
+      // message (in which case `result` may be empty).
+      if (obj.type === "result") {
+        state.sawResult = true;
+      }
       if (obj.type === "result" && typeof obj.result === "string" && obj.result.length > 0) {
         if (!state.sawFinalStreamDelta && !state.sawFinalMessage) {
           const normalized = normalizeInitialFinalText(obj.result, state);
@@ -225,13 +233,26 @@ export function effectiveFinal(state: StreamState): string {
 export function parseStream(
   input: Readable,
   writer: StreamWriter,
+  opts?: {
+    /**
+     * Fired exactly once when the backend emits its terminal `result` event,
+     * with the final answer accumulated so far. Lets callers detect that the
+     * agent has finished even if the underlying process has not yet exited.
+     */
+    onComplete?: (finalSoFar: string) => void;
+  },
 ): Promise<string> {
   return new Promise((resolve) => {
     const state = createStreamState();
     const rl: Interface = createInterface({ input, crlfDelay: Infinity });
+    let firedComplete = false;
 
     rl.on("line", (line: string) => {
       processStreamLine(line, state, writer);
+      if (state.sawResult && !firedComplete) {
+        firedComplete = true;
+        opts?.onComplete?.(effectiveFinal(state));
+      }
     });
 
     rl.on("close", () => {
diff --git a/src/runtime/kernel/workflow-launch.test.ts b/src/runtime/kernel/workflow-launch.test.ts
index 024f5f83..7f487e87 100644
--- a/src/runtime/kernel/workflow-launch.test.ts
+++ b/src/runtime/kernel/workflow-launch.test.ts
@@ -1,18 +1,23 @@
 import { test } from "node:test";
 import assert from "node:assert/strict";
 import { buildRunModuleLaunch } from "./workflow-launch";
+import { WORKFLOW_RUNNER_ARG } from "./node-workflow-runner";
 
-test("buildRunModuleLaunch always uses node runner", () => {
+test("buildRunModuleLaunch routes through the __workflow-runner dispatch (node build)", () => {
   const launch = buildRunModuleLaunch(
     ["/tmp/meta.txt", "/tmp/workflow.sh", "entry", "a"],
     { JAIPH_SOURCE_ABS: "/tmp/source.jh" },
   );
   assert.equal(launch.command, process.execPath);
-  assert.equal(launch.args[1], "/tmp/meta.txt");
-  assert.equal(launch.args[2], "/tmp/source.jh");
-  assert.equal(launch.args[3], "/tmp/workflow.sh");
-  assert.equal(launch.args[4], "default");
-  assert.equal(launch.args[5], "a");
+  // Node build: [cli.js, __workflow-runner, meta, source, built, "default", ...runArgs]
+  assert.match(launch.args[0]!, /cli\.js$/);
+  assert.equal(launch.args[1], WORKFLOW_RUNNER_ARG);
+  assert.equal(launch.args[2], "/tmp/meta.txt");
+  assert.equal(launch.args[3], "/tmp/source.jh");
+  assert.equal(launch.args[4], "/tmp/workflow.sh");
+  assert.equal(launch.args[5], "default");
+  assert.equal(launch.args[6], "a");
+  assert.equal(launch.env.JAIPH_META_FILE, "/tmp/meta.txt");
 });
 
 test("buildRunModuleLaunch throws without JAIPH_SOURCE_ABS", () => {
diff --git a/src/runtime/kernel/workflow-launch.ts b/src/runtime/kernel/workflow-launch.ts
index 090ca2a5..e82532f4 100644
--- a/src/runtime/kernel/workflow-launch.ts
+++ b/src/runtime/kernel/workflow-launch.ts
@@ -1,5 +1,17 @@
 import { spawn, ChildProcess } from "node:child_process";
 import { join } from "node:path";
+import { WORKFLOW_RUNNER_ARG } from "./node-workflow-runner";
+
+/**
+ * True when the running process is the bun --compile standalone binary.
+ *
+ * In that mode `process.execPath` points at the jaiph binary itself, so a
+ * spawn must use `[jaiph, __workflow-runner, ...]` argv. Under node it points
+ * at the node interpreter and the spawn needs `[node, cli.js, __workflow-runner, ...]`.
+ */
+function isBunCompiledStandalone(): boolean {
+  return typeof (globalThis as { Bun?: unknown }).Bun !== "undefined";
+}
 
 /**
  * Build argv/env for executing a workflow via the Node runtime.
@@ -17,11 +29,15 @@ export function buildRunModuleLaunch(
   if (!sourceAbs) {
     throw new Error("JAIPH_SOURCE_ABS is required for workflow launch");
   }
-  const runnerPath = join(__dirname, "node-workflow-runner.js");
+  const runnerArgv = [WORKFLOW_RUNNER_ARG, metaFile, sourceAbs, builtScript, "default", ...runArgs];
+  const launchEnv = { ...env, JAIPH_META_FILE: metaFile };
+  if (isBunCompiledStandalone()) {
+    return { command: process.execPath, args: runnerArgv, env: launchEnv };
+  }
   return {
     command: process.execPath,
-    args: [runnerPath, metaFile, sourceAbs, builtScript, "default", ...runArgs],
-    env: { ...env, JAIPH_META_FILE: metaFile },
+    args: [join(__dirname, "..", "..", "cli.js"), ...runnerArgv],
+    env: launchEnv,
   };
 }
 
diff --git a/src/runtime/orchestration-text.ts b/src/runtime/orchestration-text.ts
deleted file mode 100644
index 0940e27b..00000000
--- a/src/runtime/orchestration-text.ts
+++ /dev/null
@@ -1,22 +0,0 @@
-import { dedentCommonLeadingWhitespace } from "../parse/dedent";
-import { tripleQuoteBodyToRaw } from "../parse/triple-quote";
-
-/** Unescape inner text of a `tripleQuoteBodyToRaw`-shaped `"…"` token (same as format/emit decoders). */
-function unescapeDslDoubleQuotedInner(inner: string): string {
-  return inner.replace(/\\"/g, '"').replace(/\\\\/g, "\\");
-}
-
-/**
- * Values stored as `tripleQuoteBodyToRaw(parsedBody)` keep source indentation for the formatter.
- * At runtime, apply common-leading-whitespace removal (same as historical parse-time dedent).
- */
-export function tripleQuotedRawForRuntime(raw: string): string {
-  if (raw.length < 2 || raw[0] !== '"' || raw[raw.length - 1] !== '"') return raw;
-  const inner = unescapeDslDoubleQuotedInner(raw.slice(1, -1));
-  return tripleQuoteBodyToRaw(dedentCommonLeadingWhitespace(inner));
-}
-
-/** Plain multiline text from `log """…"""` / `logerr` / `fail` (no surrounding quotes in AST). */
-export function plainMultilineOrchestrationForRuntime(text: string): string {
-  return dedentCommonLeadingWhitespace(text);
-}
diff --git a/src/transpile/build.ts b/src/transpile/build.ts
index cbe4d478..4000d897 100644
--- a/src/transpile/build.ts
+++ b/src/transpile/build.ts
@@ -1,8 +1,9 @@
-import { chmodSync, mkdirSync, readFileSync, readdirSync, statSync, writeFileSync } from "node:fs";
+import { chmodSync, mkdirSync, readdirSync, statSync, writeFileSync } from "node:fs";
 import { dirname, extname, join, parse, relative, resolve } from "node:path";
-import { parsejaiph } from "../parser";
-import type { ScriptArtifact } from "./emit-script";
-import { JAIPH_EXT_REGEX, resolveImportPath } from "./resolve";
+import { emitScriptsForModuleFromGraph } from "./emit-from-graph";
+import type { ModuleGraph } from "./module-graph";
+import { loadModuleGraph } from "./module-graph";
+import { JAIPH_EXT_REGEX } from "./resolve";
 
 function ensureDir(path: string): void {
   mkdirSync(path, { recursive: true });
@@ -95,32 +96,16 @@ export function walkTestFiles(inputPath: string): string[] {
   return files;
 }
 
-/** Entry `.jh` plus all files reachable via `import` (transitive), sorted. */
-export function collectTransitiveJhModules(entrypoint: string, workspaceRoot?: string): string[] {
-  const visited = new Set<string>();
-  const queue = [entrypoint];
-  while (queue.length > 0) {
-    const file = queue.pop()!;
-    if (visited.has(file)) continue;
-    visited.add(file);
-    const ast = parsejaiph(readFileSync(file, "utf8"), file);
-    for (const imp of ast.imports) {
-      const importedFile = resolveImportPath(file, imp.path, workspaceRoot);
-      if (!visited.has(importedFile)) queue.push(importedFile);
-    }
-  }
-  const files = [...visited];
-  files.sort();
-  return files;
-}
-
 /**
- * Writes extracted `script` bodies to `<targetDir>/scripts`.
+ * Path-based entry point. Loads a `ModuleGraph` and writes extracted `script`
+ * bodies under `<targetDir>/scripts`. For a directory input, every non-test
+ * `.jh` becomes its own root: each rooted graph is loaded and emitted. The
+ * directory walk preserves the historical multi-entry validation semantics
+ * for `jaiph compile <dir>` and the integration test corpus.
  */
 export function buildScripts(
   inputPath: string,
   targetDir: string | undefined,
-  emitScriptsFn: (file: string, root: string) => ScriptArtifact[],
   workspaceRoot?: string,
 ): { scriptsDir: string } {
   const absInput = resolve(inputPath);
@@ -128,20 +113,53 @@ export function buildScripts(
   const rootDir = inputStat.isDirectory() ? absInput : dirname(absInput);
   const outRoot = resolve(targetDir ?? rootDir);
   ensureDir(outRoot);
+  const scriptsRoot = join(outRoot, "scripts");
+  ensureDir(scriptsRoot);
+
+  if (inputStat.isFile()) {
+    const graph = loadModuleGraph(absInput, workspaceRoot);
+    emitGraphInto(graph, rootDir, scriptsRoot);
+    return { scriptsDir: scriptsRoot };
+  }
 
-  const entrypointFile = inputStat.isFile() ? absInput : null;
-  const files = entrypointFile ? collectTransitiveJhModules(entrypointFile, workspaceRoot) : walkjhFiles(rootDir);
+  for (const entry of walkjhFiles(absInput)) {
+    const graph = loadModuleGraph(entry, workspaceRoot);
+    emitGraphInto(graph, rootDir, scriptsRoot);
+  }
+  return { scriptsDir: scriptsRoot };
+}
+
+/**
+ * Graph-based entry point. The caller has already built a `ModuleGraph` (the
+ * default `jaiph run` path); emit every reachable module's scripts into
+ * `<targetDir>/scripts` without re-parsing anything. `rootDir` defaults to
+ * the entry's parent directory so symbol prefixes match the path-based form.
+ */
+export function buildScriptsFromGraph(
+  graph: ModuleGraph,
+  targetDir: string,
+  rootDir?: string,
+): { scriptsDir: string } {
+  const outRoot = resolve(targetDir);
+  ensureDir(outRoot);
   const scriptsRoot = join(outRoot, "scripts");
   ensureDir(scriptsRoot);
+  const resolvedRoot = resolve(rootDir ?? dirname(graph.entryFile));
+  emitGraphInto(graph, resolvedRoot, scriptsRoot);
+  return { scriptsDir: scriptsRoot };
+}
 
+function emitGraphInto(graph: ModuleGraph, rootDir: string, scriptsRoot: string): void {
+  const files = [...graph.modules.keys()].sort();
   for (const file of files) {
-    const scripts = emitScriptsFn(file, rootDir);
+    const scripts = emitScriptsForModuleFromGraph(graph, file, rootDir);
     for (const s of scripts) {
       const scriptPath = join(scriptsRoot, s.name);
       writeFileSync(scriptPath, s.content, "utf8");
       chmodSync(scriptPath, 0o755);
     }
   }
-
-  return { scriptsDir: scriptsRoot };
 }
+
+// Re-export so `jaiph compile` can use the centralized regex.
+export { JAIPH_EXT_REGEX };
diff --git a/src/transpile/compiler-edge.acceptance.test.ts b/src/transpile/compiler-edge.acceptance.test.ts
index ca99a578..e2b7a17c 100644
--- a/src/transpile/compiler-edge.acceptance.test.ts
+++ b/src/transpile/compiler-edge.acceptance.test.ts
@@ -366,9 +366,11 @@ test("ACCEPTANCE: prompt with returns schema (single-line) parses and emits type
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "const");
   assert.ok(step.type === "const" && step.name === "result");
-  assert.ok(step.type === "const" && step.value.kind === "prompt_capture");
-  assert.ok(step.type === "const" && step.value.returns !== undefined);
-  assert.match(step.value.returns!, /type:\s*string/);
+  assert.ok(step.type === "const" && step.value.kind === "prompt");
+  if (step.type === "const" && step.value.kind === "prompt") {
+    assert.ok(step.value.returns !== undefined);
+    assert.match(step.value.returns!, /type:\s*string/);
+  }
 
   withTempDir("jaiph-acc-prompt-returns-", (root) => {
     writeFileSync(
@@ -398,10 +400,12 @@ test("ACCEPTANCE: prompt with returns schema (multiline continuation) parses", (
   assert.equal(mod.workflows.length, 1);
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "const");
-  assert.ok(step.type === "const" && step.value.kind === "prompt_capture");
-  assert.ok(step.type === "const" && step.value.returns !== undefined);
-  assert.match(step.value.returns!, /type:\s*string/);
-  assert.match(step.value.returns!, /risk:\s*string/);
+  assert.ok(step.type === "const" && step.value.kind === "prompt");
+  if (step.type === "const" && step.value.kind === "prompt") {
+    assert.ok(step.value.returns !== undefined);
+    assert.match(step.value.returns!, /type:\s*string/);
+    assert.match(step.value.returns!, /risk:\s*string/);
+  }
 });
 
 test("ACCEPTANCE: unsupported type in returns schema fails with E_SCHEMA", () => {
diff --git a/src/transpile/compiler-golden.test.ts b/src/transpile/compiler-golden.test.ts
index b4c78c74..cc89a45e 100644
--- a/src/transpile/compiler-golden.test.ts
+++ b/src/transpile/compiler-golden.test.ts
@@ -109,13 +109,17 @@ test("parser: assignment capture parses for ensure, run, and const run capture",
   const steps = mod.workflows[0].steps;
   assert.equal(steps.length, 2);
   assert.equal(steps[0].type, "const");
-  const c0 = steps[0] as { type: "const"; name: string; value: { kind: string } };
-  assert.equal(c0.name, "response");
-  assert.equal(c0.value.kind, "ensure_capture");
+  const c0 = steps[0];
+  if (c0.type === "const") {
+    assert.equal(c0.name, "response");
+    assert.equal(c0.value.kind, "ensure_call");
+  }
   assert.equal(steps[1].type, "const");
-  const c1 = steps[1] as { type: "const"; name: string; value: { kind: string } };
-  assert.equal(c1.name, "out");
-  assert.equal(c1.value.kind, "run_capture");
+  const c1 = steps[1];
+  if (c1.type === "const") {
+    assert.equal(c1.name, "out");
+    assert.equal(c1.value.kind, "call");
+  }
 });
 
 test("parser: config block parses and populates mod.metadata", () => {
@@ -343,13 +347,13 @@ test("parser: run ... catch parses correctly", () => {
   ].join("\n");
   const mod = parsejaiph(source, "/fake/entry.jh");
   const step = mod.workflows[0].steps[0];
-  assert.equal(step.type, "run");
-  if (step.type === "run") {
+  assert.equal(step.type, "exec");
+  if (step.type === "exec" && step.body.kind === "call") {
     assert.ok(step.catch);
     assert.equal(step.catch!.bindings.failure, "err");
     const recoverSteps = "block" in step.catch! ? step.catch!.block : [step.catch!.single];
     assert.equal(recoverSteps.length, 1);
-    assert.equal(recoverSteps[0].type, "log");
+    assert.equal(recoverSteps[0].type, "say");
   }
 });
 
@@ -360,9 +364,14 @@ test("parser: fail step parses quoted message", () => {
     "}",
   ].join("\n");
   const mod = parsejaiph(source, "/fake/entry.jh");
-  const step = mod.workflows[0].steps[0] as { type: string; message: string };
-  assert.equal(step.type, "fail");
-  assert.equal(step.message, '"expected reason"');
+  const step = mod.workflows[0].steps[0];
+  assert.equal(step.type, "say");
+  if (step.type === "say") {
+    assert.equal(step.level, "fail");
+    if (step.message.kind === "literal") {
+      assert.equal(step.message.raw, '"expected reason"');
+    }
+  }
 });
 
 test("parser: const string expr and const run capture parse", () => {
@@ -376,15 +385,19 @@ test("parser: const string expr and const run capture parse", () => {
   const mod = parsejaiph(source, "/fake/entry.jh");
   const steps = mod.workflows[0].steps;
   assert.equal(steps.length, 2);
-  const c0 = steps[0] as { type: string; name: string; value: { kind: string; bashRhs?: string } };
-  const c1 = steps[1] as { type: string; name: string; value: { kind: string } };
+  const c0 = steps[0];
+  const c1 = steps[1];
   assert.equal(c0.type, "const");
-  assert.equal(c0.name, "msg");
-  assert.equal(c0.value.kind, "expr");
-  assert.equal(c0.value.bashRhs, '"hi"');
+  if (c0.type === "const") {
+    assert.equal(c0.name, "msg");
+    assert.equal(c0.value.kind, "literal");
+    if (c0.value.kind === "literal") assert.equal(c0.value.raw, '"hi"');
+  }
   assert.equal(c1.type, "const");
-  assert.equal(c1.name, "out");
-  assert.equal(c1.value.kind, "run_capture");
+  if (c1.type === "const") {
+    assert.equal(c1.name, "out");
+    assert.equal(c1.value.kind, "call");
+  }
 });
 
 test("parser: const rejects bare call-like rhs without run", () => {
@@ -408,16 +421,13 @@ test("parser: const allows run-wrapped script call with args", () => {
     "}",
   ].join("\n");
   const mod = parsejaiph(source, "/fake/entry.jh");
-  const step = mod.workflows[0].steps[0] as {
-    type: string;
-    name: string;
-    value: { kind: string; ref?: { value: string }; args?: string };
-  };
+  const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "const");
-  assert.equal(step.name, "x");
-  assert.equal(step.value.kind, "run_capture");
-  assert.equal(step.value.ref?.value, "some_script");
-  assert.equal(step.value.args, '${arg1}');
+  if (step.type === "const" && step.value.kind === "call") {
+    assert.equal(step.name, "x");
+    assert.equal(step.value.callee.value, "some_script");
+    assert.deepEqual(step.value.args, [{ kind: "var", name: "arg1" }]);
+  }
 });
 
 test("parser: const prompt capture parses", () => {
@@ -427,14 +437,12 @@ test("parser: const prompt capture parses", () => {
     "}",
   ].join("\n");
   const mod = parsejaiph(source, "/fake/entry.jh");
-  const step = mod.workflows[0].steps[0] as {
-    type: string;
-    name: string;
-    value: { kind: string };
-  };
+  const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "const");
-  assert.equal(step.name, "ans");
-  assert.equal(step.value.kind, "prompt_capture");
+  if (step.type === "const") {
+    assert.equal(step.name, "ans");
+    assert.equal(step.value.kind, "prompt");
+  }
 });
 
 test("parser: wait parses as workflow step (not shell)", () => {
@@ -478,8 +486,10 @@ test("parser: send operator parses channel <- \"literal\"", () => {
   const step = mod.workflows[0].steps[0];
   assert.equal(step.type, "send");
   if (step.type !== "send") throw new Error("expected send");
-  assert.equal(step.rhs.kind, "literal");
-  assert.equal(step.rhs.token, `"hello"`);
+  assert.equal(step.value.kind, "literal");
+  if (step.value.kind === "literal") {
+    assert.equal(step.value.raw, `"hello"`);
+  }
   assert.equal(step.channel, "findings");
 });
 
@@ -597,7 +607,7 @@ test("parser: <- inside quotes is not a send", () => {
   ].join("\n");
   const mod = parsejaiph(source, "/fake/entry.jh");
   assert.equal(mod.workflows[0].steps.length, 1);
-  assert.equal(mod.workflows[0].steps[0].type, "log");
+  assert.equal(mod.workflows[0].steps[0].type, "say");
 });
 
 test("parser: channel route declaration parses into ChannelDef.routes", () => {
@@ -659,8 +669,12 @@ test("parser: capture + send is E_PARSE", () => {
     "}",
   ].join("\n");
   const mod = parsejaiph(source, "/fake/entry.jh");
-  // Parsed as a shell step; validation will reject it later
-  assert.equal(mod.workflows[0].steps[0].type, "shell");
+  // Parsed as an exec step with shell body; validation will reject it later
+  const step = mod.workflows[0].steps[0];
+  assert.equal(step.type, "exec");
+  if (step.type === "exec") {
+    assert.equal(step.body.kind, "shell");
+  }
 });
 
 // === Top-level const (env declaration) tests ===
diff --git a/src/transpile/diagnostics-collector.test.ts b/src/transpile/diagnostics-collector.test.ts
new file mode 100644
index 00000000..59b6a290
--- /dev/null
+++ b/src/transpile/diagnostics-collector.test.ts
@@ -0,0 +1,215 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { mkdtempSync, readFileSync, rmSync, writeFileSync } from "node:fs";
+import { join, resolve } from "node:path";
+import { tmpdir } from "node:os";
+import { spawnSync } from "node:child_process";
+import { loadModuleGraph } from "./module-graph";
+import { collectDiagnostics } from "./validate";
+
+// Compiled test sits at dist/src/transpile/; the source tree is three levels up.
+const repoRoot = resolve(__dirname, "../../..");
+const validatePath = resolve(repoRoot, "src/transpile/validate.ts");
+const validateStepPath = resolve(repoRoot, "src/transpile/validate-step.ts");
+const cliJsPath = resolve(repoRoot, "dist/src/cli.js");
+
+/**
+ * Acceptance #1: a fixture with N >= 3 independent errors reports the full
+ * set in one compile (not just the first), in source order.
+ *
+ * The three independent errors:
+ *  1. duplicate import alias `helper` (line 2 — second import line)
+ *  2. send to undefined channel `notify` (line 6 — inside the workflow body)
+ *  3. unknown ref `do_thing` in a run call (line 7)
+ */
+test("Diagnostics: collects 3 independent errors from one compile in source order", () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-diag-multi-"));
+  try {
+    writeFileSync(
+      join(root, "helper.jh"),
+      ["export rule check(x) {", '  return "ok"', "}", ""].join("\n"),
+    );
+    writeFileSync(
+      join(root, "m.jh"),
+      [
+        'import "./helper.jh" as helper',
+        'import "./helper.jh" as helper',
+        "",
+        "workflow default() {",
+        '  log "hi"',
+        '  notify <- "payload"',
+        "  run do_thing()",
+        "}",
+        "",
+      ].join("\n"),
+    );
+
+    const graph = loadModuleGraph(join(root, "m.jh"));
+    const diag = collectDiagnostics(graph);
+    const sorted = diag.sorted().filter((d) => d.file.endsWith("m.jh"));
+
+    assert.equal(
+      sorted.length,
+      3,
+      `expected 3 diagnostics, got: ${JSON.stringify(diag.sorted(), null, 2)}`,
+    );
+    assert.equal(sorted[0].line, 2, "duplicate import alias should be on line 2");
+    assert.match(sorted[0].message, /duplicate import alias "helper"/);
+    assert.equal(sorted[1].line, 6, "undefined channel should be on line 6");
+    assert.match(sorted[1].message, /Channel "notify" is not defined/);
+    assert.equal(sorted[2].line, 7, "unknown ref should be on line 7");
+    assert.match(sorted[2].message, /unknown local workflow or script reference "do_thing"/);
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
+
+/**
+ * Acceptance #3: throwing call-sites are reduced to a documented "fatal"
+ * subset. The validator entry point (`validate.ts`) no longer throws on
+ * user-level errors; it appends to a `Diagnostics` collector instead.
+ *
+ * Reference baseline (pre-migration): `validate.ts` alone had ~54 raw
+ * `throw jaiphError(` call-sites. After migration that file holds zero.
+ *
+ * The remaining `throw jaiphError(...)` call-sites in `src/` fall into two
+ * groups:
+ *
+ *   - **Fatal aborts** (continuing would produce garbage): the parser's
+ *     `fail()` helper (`src/parse/core.ts`), the loader / graph builder
+ *     (`src/transpile/module-graph.ts`), the test-file shape check
+ *     (`src/cli/commands/test.ts`), plus the legacy bridge inside the
+ *     collector itself (`src/diagnostics.ts`).
+ *   - **Leaf validation helpers** (validate-string, validate-prompt-schema,
+ *     validate-ref-resolution, shell-jaiph-guard): these still throw but
+ *     every caller wraps them in `diag.capture(...)`, which converts the
+ *     thrown `jaiphError` into a recoverable diagnostic and continues with
+ *     the next validation unit.
+ *
+ * Test files (`*.test.ts`) are excluded from the count — they intentionally
+ * exercise the throwing legacy bridge.
+ */
+test("Diagnostics: throwing call-sites match the documented fatal allowlist", () => {
+  const validateSrc = readFileSync(validatePath, "utf8");
+  const validateStepSrc = readFileSync(validateStepPath, "utf8");
+  const throwCount =
+    (validateSrc.match(/throw\s+jaiphError\(/g) ?? []).length +
+    (validateStepSrc.match(/throw\s+jaiphError\(/g) ?? []).length;
+  assert.equal(
+    throwCount,
+    0,
+    `expected validate.ts + validate-step.ts to use diag.error exclusively, found ${throwCount} throw jaiphError sites`,
+  );
+
+  // Sanity: confirm the migration replaced rather than removed. After Refactor 4
+  // (visitor-table validator) the bulk of these sites moved into the sibling
+  // `validate-step.ts`, so count across both files.
+  const diagErrorCount =
+    (validateSrc.match(/diag\.error\(/g) ?? []).length +
+    (validateStepSrc.match(/diag\.error\(/g) ?? []).length;
+  assert.ok(
+    diagErrorCount >= 40,
+    `expected many diag.error sites across validate.ts + validate-step.ts, found ${diagErrorCount}`,
+  );
+
+  // The fatal allowlist: files where a `throw jaiphError(...)` is allowed
+  // because continuing would produce garbage (parser / loader) or because
+  // the throw is wrapped by `diag.capture(...)` at every caller.
+  const allowlist = new Set([
+    "src/diagnostics.ts",                          // legacy bridge
+    "src/parse/core.ts",                           // parser fail()
+    "src/cli/commands/test.ts",                    // test-file shape fatal
+    "src/transpile/module-graph.ts",               // loader fatal
+    "src/transpile/validate-string.ts",            // leaf helper (captured)
+    "src/transpile/validate-prompt-schema.ts",     // leaf helper (captured)
+    "src/transpile/validate-ref-resolution.ts",    // leaf helper (captured)
+    "src/transpile/shell-jaiph-guard.ts",          // leaf helper (captured)
+  ]);
+
+  // Walk every .ts file under src/, excluding tests, and confirm any raw
+  // `throw jaiphError(` lives in the allowlist. Anything outside the
+  // allowlist is a regression — non-fatal validator/transpiler code must
+  // route through the collector instead.
+  const offenders: string[] = [];
+  walkTsFiles(resolve(repoRoot, "src"), (relPath, contents) => {
+    if (relPath.endsWith(".test.ts")) return;
+    if (!/throw\s+jaiphError\(/.test(contents)) return;
+    if (!allowlist.has(relPath)) offenders.push(relPath);
+  });
+  assert.deepEqual(
+    offenders,
+    [],
+    `unexpected throw jaiphError(...) outside the fatal allowlist: ${offenders.join(", ")}`,
+  );
+});
+
+function walkTsFiles(
+  dir: string,
+  cb: (relPath: string, contents: string) => void,
+): void {
+  const { readdirSync, statSync } = require("node:fs") as typeof import("node:fs");
+  for (const name of readdirSync(dir)) {
+    const full = join(dir, name);
+    const st = statSync(full);
+    if (st.isDirectory()) {
+      walkTsFiles(full, cb);
+      continue;
+    }
+    if (!full.endsWith(".ts")) continue;
+    const rel = full.slice(repoRoot.length + 1);
+    cb(rel, readFileSync(full, "utf8"));
+  }
+}
+
+interface CompileDiagnosticJson {
+  file: string;
+  line: number;
+  col: number;
+  code: string;
+  message: string;
+}
+
+/**
+ * Acceptance #4: CLI exit code is non-zero whenever the collector is
+ * non-empty. `jaiph compile --json` must return the full diagnostic set.
+ */
+test("CLI: `jaiph compile --json` returns full set + non-zero exit on multiple errors", () => {
+  const root = mkdtempSync(join(tmpdir(), "jaiph-diag-cli-"));
+  try {
+    writeFileSync(
+      join(root, "helper.jh"),
+      ["export rule check(x) {", '  return "ok"', "}", ""].join("\n"),
+    );
+    writeFileSync(
+      join(root, "m.jh"),
+      [
+        'import "./helper.jh" as helper',
+        'import "./helper.jh" as helper',
+        "",
+        "workflow default() {",
+        '  log "hi"',
+        '  notify <- "payload"',
+        "  run do_thing()",
+        "}",
+        "",
+      ].join("\n"),
+    );
+
+    const out = spawnSync(
+      process.execPath,
+      [cliJsPath, "compile", "--json", join(root, "m.jh")],
+      { encoding: "utf8" },
+    );
+
+    assert.notEqual(
+      out.status,
+      0,
+      `expected non-zero exit; stdout=${out.stdout} stderr=${out.stderr}`,
+    );
+    const parsed = JSON.parse(out.stdout) as CompileDiagnosticJson[];
+    const inFile = parsed.filter((d) => d.file.endsWith("m.jh"));
+    assert.equal(inFile.length, 3, `expected 3 diagnostics; got ${out.stdout}`);
+  } finally {
+    rmSync(root, { recursive: true, force: true });
+  }
+});
diff --git a/src/transpile/emit-from-graph.ts b/src/transpile/emit-from-graph.ts
new file mode 100644
index 00000000..805e7dc9
--- /dev/null
+++ b/src/transpile/emit-from-graph.ts
@@ -0,0 +1,38 @@
+import { readFileSync } from "node:fs";
+import type { ModuleGraph } from "./module-graph";
+import { buildScriptFiles, type ScriptArtifact } from "./emit-script";
+import { workflowSymbolForFile } from "./resolve";
+import { resolveScriptImportPath, validateModule } from "./validate";
+
+/**
+ * Parse, validate, and extract per-`script` bash files for one module in the
+ * graph. Operates entirely on in-memory ASTs from `graph`; `.jh` files are
+ * never re-read. External `import script` bodies still come from disk (they
+ * are not `.jh`).
+ */
+export function emitScriptsForModuleFromGraph(
+  graph: ModuleGraph,
+  inputFile: string,
+  rootDir: string,
+): ScriptArtifact[] {
+  const node = graph.modules.get(inputFile);
+  if (!node) {
+    throw new Error(`emitScriptsForModule: ${inputFile} is not in the graph`);
+  }
+  const ast = node.ast;
+  validateModule(ast, graph);
+  const workflowSymbol = workflowSymbolForFile(inputFile, rootDir);
+  const importedWorkflowSymbols = new Map<string, string>();
+  for (const [alias, importedFile] of node.imports) {
+    importedWorkflowSymbols.set(alias, workflowSymbolForFile(importedFile, rootDir));
+  }
+  let resolvedScriptImports: Map<string, string> | undefined;
+  if (ast.scriptImports && ast.scriptImports.length > 0) {
+    resolvedScriptImports = new Map();
+    for (const si of ast.scriptImports) {
+      const resolved = resolveScriptImportPath(ast.filePath, si.path);
+      resolvedScriptImports.set(si.alias, readFileSync(resolved, "utf8"));
+    }
+  }
+  return buildScriptFiles(ast, importedWorkflowSymbols, workflowSymbol, resolvedScriptImports);
+}
diff --git a/src/transpile/emit-script.ts b/src/transpile/emit-script.ts
index 5ccf8675..2de81999 100644
--- a/src/transpile/emit-script.ts
+++ b/src/transpile/emit-script.ts
@@ -1,5 +1,5 @@
 import { inlineScriptName } from "../inline-script-name";
-import type { jaiphModule, ScriptImportDef, WorkflowStepDef } from "../types";
+import type { Expr, jaiphModule, ScriptImportDef, WorkflowStepDef } from "../types";
 import { scriptShebangIsBash } from "../parse/script-bash";
 import { langToShebang } from "../parse/scripts";
 
@@ -69,31 +69,50 @@ function wrapBashStandaloneScriptBody(body: string, envPreamble: string): string
 
 export type ScriptArtifact = { name: string; content: string };
 
-/** Collect all inline script steps from a step tree (handles if/else/catch nesting). */
+/** Walk all `Expr` nodes carried by a step and yield inline-script bodies. */
+function emitInlineFromExpr(expr: Expr, seen: Set<string>, out: ScriptArtifact[]): void {
+  if (expr.kind === "inline_script") {
+    const shebang = expr.lang ? langToShebang(expr.lang) : undefined;
+    emitInlineScriptArtifact(expr.body, shebang, seen, out);
+  }
+}
+
+/** Collect all inline script bodies from a step tree (handles if/for/catch/recover nesting). */
 function collectInlineScripts(
   steps: WorkflowStepDef[],
   seen: Set<string>,
   out: ScriptArtifact[],
 ): void {
   for (const s of steps) {
-    if (s.type === "run_inline_script") {
-      const shebang = s.lang ? langToShebang(s.lang) : undefined;
-      emitInlineScriptArtifact(s.body, shebang, seen, out);
-    } else if (s.type === "const" && s.value.kind === "run_inline_script_capture") {
-      const shebang = s.value.lang ? langToShebang(s.value.lang) : undefined;
-      emitInlineScriptArtifact(s.value.body, shebang, seen, out);
-    } else if (s.type === "return" && s.managed?.kind === "run_inline_script") {
-      const shebang = s.managed.lang ? langToShebang(s.managed.lang) : undefined;
-      emitInlineScriptArtifact(s.managed.body, shebang, seen, out);
-    } else if ((s.type === "log" || s.type === "logerr") && s.managed?.kind === "run_inline_script") {
-      const shebang = s.managed.lang ? langToShebang(s.managed.lang) : undefined;
-      emitInlineScriptArtifact(s.managed.body, shebang, seen, out);
-    } else if ((s.type === "ensure" || s.type === "run") && s.catch) {
-      const recoverSteps = "single" in s.catch ? [s.catch.single] : s.catch.block;
-      collectInlineScripts(recoverSteps, seen, out);
-    } else if (s.type === "if") {
-      collectInlineScripts(s.body, seen, out);
-    } else if (s.type === "for_lines") {
+    if (s.type === "exec") {
+      emitInlineFromExpr(s.body, seen, out);
+      if (s.catch) {
+        const recoverSteps = "single" in s.catch ? [s.catch.single] : s.catch.block;
+        collectInlineScripts(recoverSteps, seen, out);
+      }
+      if (s.recover) {
+        const recoverSteps = "single" in s.recover ? [s.recover.single] : s.recover.block;
+        collectInlineScripts(recoverSteps, seen, out);
+      }
+      continue;
+    }
+    if (s.type === "const") {
+      emitInlineFromExpr(s.value, seen, out);
+      continue;
+    }
+    if (s.type === "return") {
+      emitInlineFromExpr(s.value, seen, out);
+      continue;
+    }
+    if (s.type === "say") {
+      emitInlineFromExpr(s.message, seen, out);
+      continue;
+    }
+    if (s.type === "send") {
+      emitInlineFromExpr(s.value, seen, out);
+      continue;
+    }
+    if (s.type === "if" || s.type === "for_lines") {
       collectInlineScripts(s.body, seen, out);
     }
   }
diff --git a/src/transpile/module-graph.test.ts b/src/transpile/module-graph.test.ts
new file mode 100644
index 00000000..09b39999
--- /dev/null
+++ b/src/transpile/module-graph.test.ts
@@ -0,0 +1,259 @@
+import { mkdtempSync, readdirSync, rmSync, writeFileSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { test } from "node:test";
+import assert from "node:assert/strict";
+
+import { buildScriptsFromGraph } from "../transpiler";
+import { buildRuntimeGraph, resolveScriptRef, resolveWorkflowRef } from "../runtime/kernel/graph";
+import {
+  loadModuleGraph,
+  serializeModuleGraph,
+  deserializeModuleGraph,
+} from "./module-graph";
+
+function write(filePath: string, content: string): void {
+  writeFileSync(filePath, content, "utf8");
+}
+
+/**
+ * Acceptance criterion 4 from the parser-simplification design: each `.jh`
+ * source file in a compile is parsed exactly once. After `loadModuleGraph`
+ * walks the entry plus its transitive imports, neither `buildScripts` nor
+ * `buildRuntimeGraph` may re-read a `.jh` source — verified by corrupting
+ * every file post-load and asserting the pipeline still succeeds.
+ */
+test("module-graph: buildScripts + buildRuntimeGraph reuse pre-parsed ASTs and never re-read .jh after load", () => {
+  const dir = mkdtempSync(join(tmpdir(), "jaiph-graph-noreparse-"));
+  try {
+    const main = join(dir, "main.jh");
+    const lib = join(dir, "lib.jh");
+    write(
+      lib,
+      [
+        "rule check() {",
+        '  log "ok"',
+        "}",
+        "script helper = `echo hi`",
+        "workflow inner() {",
+        "  echo ok",
+        "}",
+        "",
+      ].join("\n"),
+    );
+    write(
+      main,
+      [
+        'import "./lib.jh" as lib',
+        "script local_script = `echo local`",
+        "workflow default() {",
+        "  run lib.inner()",
+        "}",
+        "",
+      ].join("\n"),
+    );
+
+    const graph = loadModuleGraph(main);
+    assert.equal(graph.modules.size, 2);
+    assert.ok(graph.modules.has(main));
+    assert.ok(graph.modules.has(lib));
+
+    // Corrupt source contents. Files still exist (so existsSync passes), but
+    // any new parse call would throw a parse error.
+    write(main, "!!! invalid jaiph syntax !!!\n");
+    write(lib, "!!! invalid jaiph syntax !!!\n");
+
+    const outDir = mkdtempSync(join(tmpdir(), "jaiph-graph-out-"));
+    try {
+      const { scriptsDir } = buildScriptsFromGraph(graph, outDir);
+      const emitted = readdirSync(scriptsDir).sort();
+      assert.deepEqual(emitted, ["helper", "local_script"]);
+
+      const runtime = buildRuntimeGraph(graph);
+      assert.equal(runtime.modules.size, 2);
+      const inner = resolveWorkflowRef(runtime, main, {
+        value: "lib.inner",
+        loc: { line: 1, col: 1 },
+      });
+      assert.equal(inner?.workflow.name, "inner");
+      const helper = resolveScriptRef(runtime, main, "lib.helper");
+      assert.equal(helper?.script.name, "helper");
+    } finally {
+      rmSync(outDir, { recursive: true, force: true });
+    }
+  } finally {
+    rmSync(dir, { recursive: true, force: true });
+  }
+});
+
+/**
+ * Cross-module workflow, rule, and script resolution survives the graph
+ * pipeline.
+ */
+test("module-graph: cross-module workflow, rule, and script resolution", () => {
+  const dir = mkdtempSync(join(tmpdir(), "jaiph-graph-crossmod-"));
+  try {
+    const main = join(dir, "main.jh");
+    const lib = join(dir, "lib.jh");
+    write(
+      lib,
+      [
+        "rule check() {",
+        '  log "ok"',
+        "}",
+        "script helper = `echo hi`",
+        "workflow inner() {",
+        "  echo ok",
+        "}",
+        "",
+      ].join("\n"),
+    );
+    write(
+      main,
+      [
+        'import "./lib.jh" as lib',
+        "rule local_check() {",
+        '  log "local"',
+        "}",
+        "script local_script = `echo local`",
+        "workflow default() {",
+        "  run lib.inner()",
+        "}",
+        "",
+      ].join("\n"),
+    );
+
+    const graph = loadModuleGraph(main);
+    const outDir = mkdtempSync(join(tmpdir(), "jaiph-graph-out2-"));
+    try {
+      const { scriptsDir } = buildScriptsFromGraph(graph, outDir);
+      const emitted = readdirSync(scriptsDir).sort();
+      assert.deepEqual(emitted, ["helper", "local_script"]);
+
+      const runtime = buildRuntimeGraph(graph);
+      const localWf = resolveWorkflowRef(runtime, main, {
+        value: "default",
+        loc: { line: 1, col: 1 },
+      });
+      assert.equal(localWf?.workflow.name, "default");
+      const importedWf = resolveWorkflowRef(runtime, main, {
+        value: "lib.inner",
+        loc: { line: 1, col: 1 },
+      });
+      assert.equal(importedWf?.workflow.name, "inner");
+      const localScript = resolveScriptRef(runtime, main, "local_script");
+      assert.equal(localScript?.script.name, "local_script");
+      const importedScript = resolveScriptRef(runtime, main, "lib.helper");
+      assert.equal(importedScript?.script.name, "helper");
+    } finally {
+      rmSync(outDir, { recursive: true, force: true });
+    }
+  } finally {
+    rmSync(dir, { recursive: true, force: true });
+  }
+});
+
+/**
+ * Cross-process boundary: the parent serializes the graph, the child
+ * deserializes it and reuses every AST. Asserts the JSON format is
+ * round-trippable so the runner can rebuild the graph without re-parsing.
+ */
+test("module-graph: serialize round-trip preserves the import closure for the child runner", () => {
+  const dir = mkdtempSync(join(tmpdir(), "jaiph-graph-roundtrip-"));
+  try {
+    const main = join(dir, "main.jh");
+    const lib = join(dir, "lib.jh");
+    write(
+      lib,
+      [
+        "workflow inner() {",
+        "  echo ok",
+        "}",
+        "",
+      ].join("\n"),
+    );
+    write(
+      main,
+      [
+        'import "./lib.jh" as lib',
+        "workflow default() {",
+        "  run lib.inner()",
+        "}",
+        "",
+      ].join("\n"),
+    );
+
+    const graph = loadModuleGraph(main);
+    const serialized = serializeModuleGraph(graph);
+    // Corrupt source contents so any deserialized-path consumer that tries to
+    // re-parse would fail loudly. Files still exist so existsSync passes.
+    write(main, "!!! invalid !!!\n");
+    write(lib, "!!! invalid !!!\n");
+    const round = deserializeModuleGraph(serialized);
+    assert.equal(round.modules.size, 2);
+    const runtime = buildRuntimeGraph(round);
+    const importedWf = resolveWorkflowRef(runtime, main, {
+      value: "lib.inner",
+      loc: { line: 1, col: 1 },
+    });
+    assert.equal(importedWf?.workflow.name, "inner");
+  } finally {
+    rmSync(dir, { recursive: true, force: true });
+  }
+});
+
+/**
+ * Three-module closure: prove the optimization scales beyond the direct
+ * import case in the acceptance criteria.
+ */
+test("module-graph: handles a 3-module closure with one shared parse", () => {
+  const dir = mkdtempSync(join(tmpdir(), "jaiph-graph-three-"));
+  try {
+    const main = join(dir, "main.jh");
+    const libA = join(dir, "a.jh");
+    const libB = join(dir, "b.jh");
+    write(libA, "workflow a() {\n  echo ok\n}\n");
+    write(
+      libB,
+      [
+        'import "./a.jh" as a',
+        "workflow b() {",
+        "  run a.a()",
+        "}",
+        "",
+      ].join("\n"),
+    );
+    write(
+      main,
+      [
+        'import "./b.jh" as b',
+        "workflow default() {",
+        "  run b.b()",
+        "}",
+        "",
+      ].join("\n"),
+    );
+
+    const graph = loadModuleGraph(main);
+    assert.equal(graph.modules.size, 3);
+
+    // Corrupt every source: any downstream re-parse would now fail.
+    write(main, "!!! invalid !!!\n");
+    write(libA, "!!! invalid !!!\n");
+    write(libB, "!!! invalid !!!\n");
+
+    const outDir = mkdtempSync(join(tmpdir(), "jaiph-graph-three-out-"));
+    try {
+      buildScriptsFromGraph(graph, outDir);
+      const runtime = buildRuntimeGraph(graph);
+      const bRef = resolveWorkflowRef(runtime, main, { value: "b.b", loc: { line: 1, col: 1 } });
+      assert.equal(bRef?.workflow.name, "b");
+      const bNode = runtime.modules.get(libB)!;
+      assert.equal(bNode.imports.get("a"), libA);
+    } finally {
+      rmSync(outDir, { recursive: true, force: true });
+    }
+  } finally {
+    rmSync(dir, { recursive: true, force: true });
+  }
+});
diff --git a/src/transpile/module-graph.ts b/src/transpile/module-graph.ts
new file mode 100644
index 00000000..f896a07e
--- /dev/null
+++ b/src/transpile/module-graph.ts
@@ -0,0 +1,118 @@
+import { existsSync, readFileSync, writeFileSync } from "node:fs";
+import { resolve } from "node:path";
+import { jaiphError } from "../errors";
+import { parsejaiph } from "../parser";
+import { resolveImportPath } from "./resolve";
+import type { jaiphModule } from "../types";
+
+/**
+ * `ModuleGraph` is the single representation of "all `.jh` modules reachable
+ * from an entry point, parsed once." `loadModuleGraph` is the only routine
+ * that reads and parses `.jh` sources; `validateReferences` and the script
+ * emitter both consume the graph without touching the filesystem for source
+ * or AST reads.
+ */
+
+export interface ModuleNode {
+  filePath: string;
+  ast: jaiphModule;
+  /** alias → resolved absolute path of imported `.jh` module */
+  imports: Map<string, string>;
+}
+
+export interface ModuleGraph {
+  entryFile: string;
+  workspaceRoot?: string;
+  modules: Map<string, ModuleNode>;
+}
+
+function buildNode(filePath: string, ast: jaiphModule, workspaceRoot?: string): ModuleNode {
+  const imports = new Map<string, string>();
+  for (const imp of ast.imports) {
+    imports.set(imp.alias, resolveImportPath(filePath, imp.path, workspaceRoot));
+  }
+  return { filePath, ast, imports };
+}
+
+/**
+ * Walks the entry plus its transitive `.jh` import closure. Each reachable
+ * file is read from disk and parsed exactly once. Import paths are resolved
+ * via {@link resolveImportPath} so library fallbacks behave as elsewhere in
+ * the toolchain. Missing imports are not surfaced here; the validator
+ * reports `E_IMPORT_NOT_FOUND` once it inspects the graph.
+ */
+export function loadModuleGraph(entryFile: string, workspaceRoot?: string): ModuleGraph {
+  const entry = resolve(entryFile);
+  const modules = new Map<string, ModuleNode>();
+  type QueueEntry = { file: string; importer?: { file: string; alias: string; loc: { line: number; col: number } } };
+  const queue: QueueEntry[] = [{ file: entry }];
+  while (queue.length > 0) {
+    const { file: current, importer } = queue.shift()!;
+    if (modules.has(current)) continue;
+    if (!existsSync(current)) {
+      if (importer) {
+        throw jaiphError(
+          importer.file,
+          importer.loc.line,
+          importer.loc.col,
+          "E_IMPORT_NOT_FOUND",
+          `import "${importer.alias}" resolves to missing file "${current}"`,
+        );
+      }
+      throw jaiphError(current, 1, 1, "E_IMPORT_NOT_FOUND", `entry file not found: "${current}"`);
+    }
+    const ast = parsejaiph(readFileSync(current, "utf8"), current);
+    const node = buildNode(current, ast, workspaceRoot);
+    modules.set(current, node);
+    for (const imp of ast.imports) {
+      const resolved = node.imports.get(imp.alias)!;
+      if (!modules.has(resolved)) {
+        queue.push({ file: resolved, importer: { file: current, alias: imp.alias, loc: imp.loc } });
+      }
+    }
+  }
+  return { entryFile: entry, workspaceRoot, modules };
+}
+
+/** Build a graph from an already-parsed AST plus its workspace-resolved imports. Used by the cross-process deserializer. */
+export function moduleGraphFromAsts(
+  entryFile: string,
+  astByFile: Map<string, jaiphModule>,
+  workspaceRoot?: string,
+): ModuleGraph {
+  const modules = new Map<string, ModuleNode>();
+  for (const [filePath, ast] of astByFile) {
+    modules.set(filePath, buildNode(filePath, ast, workspaceRoot));
+  }
+  return { entryFile: resolve(entryFile), workspaceRoot, modules };
+}
+
+/** Stable JSON encoding for cross-process transfer (entries sorted by absolute path). */
+export function serializeModuleGraph(graph: ModuleGraph): string {
+  const entries = [...graph.modules.entries()];
+  entries.sort(([a], [b]) => (a < b ? -1 : a > b ? 1 : 0));
+  return JSON.stringify({
+    entryFile: graph.entryFile,
+    workspaceRoot: graph.workspaceRoot ?? null,
+    modules: entries.map(([file, node]) => ({ file, ast: node.ast })),
+  });
+}
+
+export function deserializeModuleGraph(content: string): ModuleGraph {
+  const obj = JSON.parse(content) as {
+    entryFile: string;
+    workspaceRoot: string | null;
+    modules: Array<{ file: string; ast: jaiphModule }>;
+  };
+  const astByFile = new Map<string, jaiphModule>();
+  for (const m of obj.modules) astByFile.set(m.file, m.ast);
+  return moduleGraphFromAsts(obj.entryFile, astByFile, obj.workspaceRoot ?? undefined);
+}
+
+export function writeModuleGraph(filePath: string, graph: ModuleGraph): void {
+  writeFileSync(filePath, serializeModuleGraph(graph), "utf8");
+}
+
+export function readModuleGraph(filePath: string): ModuleGraph {
+  return deserializeModuleGraph(readFileSync(filePath, "utf8"));
+}
diff --git a/src/transpile/no-runtime-imports.test.ts b/src/transpile/no-runtime-imports.test.ts
new file mode 100644
index 00000000..6db377ee
--- /dev/null
+++ b/src/transpile/no-runtime-imports.test.ts
@@ -0,0 +1,38 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readFileSync, readdirSync, statSync } from "node:fs";
+import { resolve, join } from "node:path";
+
+// Tests run from dist/src/transpile/, so repo root is three levels up.
+const repoRoot = resolve(__dirname, "../../..");
+const transpileDir = join(repoRoot, "src/transpile");
+
+function listTsFiles(dir: string): string[] {
+  const out: string[] = [];
+  for (const entry of readdirSync(dir)) {
+    const abs = join(dir, entry);
+    if (statSync(abs).isDirectory()) {
+      out.push(...listTsFiles(abs));
+      continue;
+    }
+    if (!entry.endsWith(".ts")) continue;
+    if (entry.endsWith(".test.ts")) continue;
+    out.push(abs);
+  }
+  return out;
+}
+
+test("AC1: no src/transpile/ production source imports from src/runtime/", () => {
+  const files = listTsFiles(transpileDir);
+  assert.ok(files.length > 0, "expected to discover transpile source files");
+  for (const abs of files) {
+    const rel = abs.slice(repoRoot.length + 1);
+    const content = readFileSync(abs, "utf8");
+    const re = /from\s+["'][^"']*\/runtime\/[^"']*["']/;
+    assert.equal(
+      re.test(content),
+      false,
+      `${rel} imports from src/runtime/ — compile-time must not depend on runtime semantics`,
+    );
+  }
+});
diff --git a/src/transpile/pipeline-io-purity.test.ts b/src/transpile/pipeline-io-purity.test.ts
new file mode 100644
index 00000000..8603ec45
--- /dev/null
+++ b/src/transpile/pipeline-io-purity.test.ts
@@ -0,0 +1,233 @@
+import { mkdtempSync, readdirSync, readFileSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { extname, join, resolve } from "node:path";
+import { test } from "node:test";
+import assert from "node:assert/strict";
+
+import { parsejaiph } from "../parser";
+import { loadModuleGraph } from "./module-graph";
+import { validateReferences } from "./validate";
+import { buildScriptsFromGraph } from "../transpiler";
+
+// `require("node:fs")` returns the real, mutable module exports; the
+// TypeScript-emitted `__importStar` wrapper used by `import * as fs` builds a
+// separate getter-only object that defeats monkey-patching, so the purity
+// guards below patch through `require` instead.
+// eslint-disable-next-line @typescript-eslint/no-var-requires
+const realFs: typeof import("node:fs") = require("node:fs");
+
+/** Parser fixtures — exercised stand-alone (parse only; broken imports are fine here). */
+const PARSER_FIXTURE_ROOTS = [
+  resolve(process.cwd(), "test-fixtures/golden-ast/fixtures"),
+  resolve(process.cwd(), "test-fixtures/sample-build/fixtures"),
+  resolve(process.cwd(), "examples"),
+];
+
+/**
+ * Pipeline fixtures — must have a self-contained import closure so
+ * `loadModuleGraph` + `validateReferences` + emit can run end-to-end.
+ * `test-fixtures/golden-ast` is excluded because its `imports.jh` fixture
+ * references a stub `lib.jh` that does not ship alongside it.
+ */
+const PIPELINE_FIXTURE_ROOTS = [
+  resolve(process.cwd(), "test-fixtures/sample-build/fixtures"),
+  resolve(process.cwd(), "examples"),
+];
+
+function listJhFiles(dir: string): string[] {
+  const out: string[] = [];
+  const stack = [dir];
+  while (stack.length > 0) {
+    const current = stack.pop()!;
+    for (const entry of readdirSync(current, { withFileTypes: true })) {
+      const full = join(current, entry.name);
+      if (entry.isDirectory()) stack.push(full);
+      else if (entry.isFile() && extname(entry.name) === ".jh") out.push(full);
+    }
+  }
+  return out;
+}
+
+/**
+ * Acceptance criterion 1: `parsejaiph(source, filePath)` is I/O-pure. With
+ * every fs entry point stubbed to throw for the duration of the call,
+ * parsing every fixture must still succeed because the parser never reaches
+ * `node:fs` at all.
+ */
+test("parser-io-purity: parsejaiph never touches node:fs for any fixture", () => {
+  const fixtures: Array<{ file: string; content: string }> = [];
+  for (const root of PARSER_FIXTURE_ROOTS) {
+    for (const file of listJhFiles(root)) {
+      fixtures.push({ file, content: readFileSync(file, "utf8") });
+    }
+  }
+  assert.ok(fixtures.length > 0, "expected to find .jh fixtures to parse");
+
+  for (const { file, content } of fixtures) {
+    const guard = installFsGuard(() => true);
+    try {
+      const ast = parsejaiph(content, file);
+      assert.equal(ast.filePath, file, `parse produced unexpected filePath for ${file}`);
+    } finally {
+      guard.restore();
+    }
+  }
+});
+
+/**
+ * Acceptance criterion 2: once the module graph is loaded, neither
+ * `validate(graph)` nor `emit(graph, outDir)` may reach the filesystem for
+ * `.jh` source or AST reads. Writing emitted bash files is allowed.
+ *
+ * The test loads each fixture (fs is unstubbed during load), then stubs
+ * `fs.readFileSync` / `fs.existsSync` to throw on any `.jh` path, and runs
+ * `validateReferences(graph)` plus a full script emit. Both must succeed.
+ */
+test("pipeline-io-purity: validate(graph) and emit(graph, outDir) never read .jh from disk", () => {
+  const entries: string[] = [];
+  for (const root of PIPELINE_FIXTURE_ROOTS) {
+    for (const file of listJhFiles(root)) {
+      // Skip *.test.jh — those are exercised by the test-runner path; the
+      // graph pipeline still loads them but they share the same purity
+      // guarantees and lengthen the test for no extra coverage.
+      if (file.endsWith(".test.jh")) continue;
+      entries.push(file);
+    }
+  }
+  assert.ok(entries.length > 0, "expected to find .jh fixtures");
+
+  for (const entry of entries) {
+    const graph = loadModuleGraph(entry);
+    const outDir = mkdtempSync(join(tmpdir(), "jaiph-emit-purity-"));
+    const guard = installFsGuard((path) => extname(path) === ".jh");
+    try {
+      validateReferences(graph);
+      buildScriptsFromGraph(graph, outDir);
+    } finally {
+      guard.restore();
+      rmSync(outDir, { recursive: true, force: true });
+    }
+  }
+});
+
+/**
+ * Acceptance criterion 4: each `.jh` source file in a compile is parsed
+ * exactly once. The test creates a graph with transitive imports
+ * (entry → lib → leaf), counts `parsejaiph` invocations across
+ * `loadModuleGraph` + `validateReferences` + `buildScriptsFromGraph`, and
+ * asserts the count equals the number of unique modules.
+ */
+test("parse-once: full pipeline calls parsejaiph exactly once per reachable .jh module", () => {
+  const dir = mkdtempSync(join(tmpdir(), "jaiph-parse-once-"));
+  try {
+    const entry = join(dir, "main.jh");
+    const libA = join(dir, "a.jh");
+    const libB = join(dir, "b.jh");
+    require("node:fs").writeFileSync(libA, "workflow a() {\n  echo ok\n}\n", "utf8");
+    require("node:fs").writeFileSync(
+      libB,
+      ['import "./a.jh" as a', "workflow b() {", "  run a.a()", "}", ""].join("\n"),
+      "utf8",
+    );
+    require("node:fs").writeFileSync(
+      entry,
+      ['import "./b.jh" as b', "workflow default() {", "  run b.b()", "}", ""].join("\n"),
+      "utf8",
+    );
+
+    const counter = installParseCounter();
+    try {
+      const graph = loadModuleGraph(entry);
+      validateReferences(graph);
+      const outDir = mkdtempSync(join(tmpdir(), "jaiph-parse-once-out-"));
+      try {
+        buildScriptsFromGraph(graph, outDir);
+      } finally {
+        rmSync(outDir, { recursive: true, force: true });
+      }
+      assert.equal(graph.modules.size, 3);
+      assert.equal(
+        counter.byFile.size,
+        3,
+        `expected 3 unique files parsed, got ${[...counter.byFile.keys()].join(", ")}`,
+      );
+      for (const [file, count] of counter.byFile) {
+        assert.equal(count, 1, `file ${file} parsed ${count} times (expected 1)`);
+      }
+    } finally {
+      counter.restore();
+    }
+  } finally {
+    rmSync(dir, { recursive: true, force: true });
+  }
+});
+
+interface FsGuard {
+  restore(): void;
+}
+
+/**
+ * Replace `fs.readFileSync`, `fs.existsSync`, `fs.statSync` so they throw
+ * when `shouldBlock(path)` returns true. Patching is done against the real
+ * `require("node:fs")` exports because the TS `__importStar` wrapper used
+ * by `import * as fs` returns getter-only properties.
+ */
+function installFsGuard(shouldBlock: (path: string) => boolean): FsGuard {
+  const orig = {
+    readFileSync: realFs.readFileSync,
+    existsSync: realFs.existsSync,
+    statSync: realFs.statSync,
+  };
+  const guardCall = (name: string, path: unknown): void => {
+    if (typeof path !== "string") return;
+    if (shouldBlock(path)) {
+      throw new Error(`fs.${name} blocked by purity guard: ${path}`);
+    }
+  };
+  const mutable = realFs as unknown as Record<string, unknown>;
+  mutable.readFileSync = (path: unknown, opts?: unknown) => {
+    guardCall("readFileSync", path);
+    return orig.readFileSync(path as Parameters<typeof orig.readFileSync>[0], opts as Parameters<typeof orig.readFileSync>[1]);
+  };
+  mutable.existsSync = (path: unknown) => {
+    guardCall("existsSync", path);
+    return orig.existsSync(path as Parameters<typeof orig.existsSync>[0]);
+  };
+  mutable.statSync = (path: unknown, opts?: unknown) => {
+    guardCall("statSync", path);
+    return orig.statSync(path as Parameters<typeof orig.statSync>[0], opts as Parameters<typeof orig.statSync>[1]);
+  };
+  return {
+    restore(): void {
+      mutable.readFileSync = orig.readFileSync;
+      mutable.existsSync = orig.existsSync;
+      mutable.statSync = orig.statSync;
+    },
+  };
+}
+
+interface ParseCounter {
+  byFile: Map<string, number>;
+  restore(): void;
+}
+
+/**
+ * Replace the exported `parsejaiph` on the module so every call goes through
+ * a counting wrapper. Works because TypeScript's CJS output rewrites named
+ * imports as property reads against the module's exports object.
+ */
+function installParseCounter(): ParseCounter {
+  const parserMod = require("../parser") as { parsejaiph: typeof parsejaiph };
+  const original = parserMod.parsejaiph;
+  const byFile = new Map<string, number>();
+  parserMod.parsejaiph = function counting(source: string, filePath: string) {
+    byFile.set(filePath, (byFile.get(filePath) ?? 0) + 1);
+    return original(source, filePath);
+  } as typeof parsejaiph;
+  return {
+    byFile,
+    restore(): void {
+      parserMod.parsejaiph = original;
+    },
+  };
+}
diff --git a/src/transpile/validate-prompt-schema.test.ts b/src/transpile/validate-prompt-schema.test.ts
index 9f26300c..9fe1f637 100644
--- a/src/transpile/validate-prompt-schema.test.ts
+++ b/src/transpile/validate-prompt-schema.test.ts
@@ -65,34 +65,28 @@ test("validatePromptReturnsSchema: rejects malformed entry", () => {
 // --- validatePromptStepReturns ---
 
 test("validatePromptStepReturns: no error when no returns", () => {
-  const step = {
-    type: "prompt" as const,
-    raw: 'prompt "hello"',
-    loc: { line: 1, col: 1 },
-  };
-  validatePromptStepReturns(step, "test.jh");
+  validatePromptStepReturns(
+    { loc: { line: 1, col: 1 } },
+    undefined,
+    "test.jh",
+  );
 });
 
 test("validatePromptStepReturns: no error when returns with capture", () => {
-  const step = {
-    type: "prompt" as const,
-    raw: '"hello"',
-    loc: { line: 1, col: 1 },
-    captureName: "result",
-    returns: "{ name: string }",
-  };
-  validatePromptStepReturns(step, "test.jh");
+  validatePromptStepReturns(
+    { returns: "{ name: string }", loc: { line: 1, col: 1 } },
+    "result",
+    "test.jh",
+  );
 });
 
 test("validatePromptStepReturns: rejects returns without capture", () => {
-  const step = {
-    type: "prompt" as const,
-    raw: 'prompt "hello" returns "{ name: string }"',
-    loc: { line: 1, col: 1 },
-    returns: "{ name: string }",
-  };
   assert.throws(
-    () => validatePromptStepReturns(step, "test.jh"),
+    () => validatePromptStepReturns(
+      { returns: "{ name: string }", loc: { line: 1, col: 1 } },
+      undefined,
+      "test.jh",
+    ),
     /must capture to a variable/,
   );
 });
diff --git a/src/transpile/validate-prompt-schema.ts b/src/transpile/validate-prompt-schema.ts
index bb475e73..aee7d4b2 100644
--- a/src/transpile/validate-prompt-schema.ts
+++ b/src/transpile/validate-prompt-schema.ts
@@ -1,5 +1,4 @@
 import { jaiphError } from "../errors";
-import type { WorkflowStepDef } from "../types";
 
 const SUPPORTED_SCHEMA_TYPES = new Set<string>(["string", "number", "boolean"]);
 
@@ -51,20 +50,22 @@ export function validatePromptReturnsSchema(
   }
 }
 
+/** Validate that a prompt's optional returns schema is well-formed and bound to a capture. */
 export function validatePromptStepReturns(
-  step: Extract<WorkflowStepDef, { type: "prompt" }>,
+  prompt: { returns?: string; loc: { line: number; col: number } },
+  captureName: string | undefined,
   filePath: string,
 ): void {
-  if (step.returns !== undefined) {
-    if (!step.captureName) {
+  if (prompt.returns !== undefined) {
+    if (!captureName) {
       throw jaiphError(
         filePath,
-        step.loc.line,
-        step.loc.col,
+        prompt.loc.line,
+        prompt.loc.col,
         "E_PARSE",
         'prompt with "returns" schema must capture to a variable (e.g. const result = prompt "..." returns "{ ... }")',
       );
     }
-    validatePromptReturnsSchema(step.returns, filePath, step.loc.line, step.loc.col);
+    validatePromptReturnsSchema(prompt.returns, filePath, prompt.loc.line, prompt.loc.col);
   }
 }
diff --git a/src/transpile/validate-ref-resolution.test.ts b/src/transpile/validate-ref-resolution.test.ts
index a45329f3..42234774 100644
--- a/src/transpile/validate-ref-resolution.test.ts
+++ b/src/transpile/validate-ref-resolution.test.ts
@@ -58,7 +58,7 @@ test("lookupKind: finds workflow", () => {
 
 test("lookupKind: finds script", () => {
   const mod = minimalModule({
-    scripts: [{ name: "build_it", comments: [], body: "", bodyKind: "backtick" as const, loc: { line: 1, col: 1 } }],
+    scripts: [{ name: "build_it", comments: [], body: "", loc: { line: 1, col: 1 } }],
   });
   assert.equal(lookupKind(mod, "build_it"), "script");
 });
@@ -241,7 +241,7 @@ test("validateRef: bare_send_rhs rejects local workflow", () => {
 
 test("validateRef: bare_send_rhs rejects local script", () => {
   const mod = minimalModule({
-    scripts: [{ name: "build", comments: [], body: "", bodyKind: "backtick" as const, loc: { line: 1, col: 1 } }],
+    scripts: [{ name: "build", comments: [], body: "", loc: { line: 1, col: 1 } }],
   });
   const ctx = makeCtx();
   assert.throws(
diff --git a/src/transpile/validate-single-walk.test.ts b/src/transpile/validate-single-walk.test.ts
new file mode 100644
index 00000000..e4cc4d73
--- /dev/null
+++ b/src/transpile/validate-single-walk.test.ts
@@ -0,0 +1,106 @@
+import { readFileSync } from "node:fs";
+import { resolve } from "node:path";
+import test from "node:test";
+import assert from "node:assert/strict";
+
+// Compiled test sits at dist/src/transpile/; the source file is three levels
+// up under src/transpile/.
+const validatePath = resolve(__dirname, "../../../src/transpile/validate.ts");
+
+/**
+ * AC1 — The three pre-pass helpers (`collectKnownVars`,
+ * `collectPromptSchemas`, `validateImmutableBindings`) have been replaced by a
+ * single workflow walk. None of those names should reappear in validate.ts —
+ * if they do, this test fails immediately. The grep is anchored on word
+ * boundaries so unrelated identifiers (e.g. a `validateImmutableBindingsFoo`
+ * variant) would still be flagged.
+ */
+test("AC1: pre-pass helpers are deleted from validate.ts", () => {
+  const text = readFileSync(validatePath, "utf8");
+  const forbidden = [
+    "collectKnownVars",
+    "collectPromptSchemas",
+    "validateImmutableBindings",
+  ];
+  const offenders: string[] = [];
+  for (const name of forbidden) {
+    if (new RegExp(`\\b${name}\\b`).test(text)) {
+      offenders.push(name);
+    }
+  }
+  assert.deepEqual(
+    offenders,
+    [],
+    `forbidden helper names reappeared in validate.ts: ${offenders.join(", ")}`,
+  );
+});
+
+/**
+ * AC2 — Exactly one recursive helper in validate.ts walks
+ * `WorkflowStepDef[]`. A "helper" is any top-level or nested
+ * function/arrow declaration whose parameter list mentions
+ * `WorkflowStepDef[]`; it is "recursive" if its body calls its own name.
+ *
+ * Before the refactor there were four such walkers (`collectKnownVars`'s
+ * inner walk, `validateImmutableBindings`'s inner walk, the workflow's
+ * `validateStep`, and the rule's `validateRuleStep`). After the refactor
+ * only the single `descend` inside `walkStepTree` should remain.
+ */
+test("AC2: at most one recursive helper walks WorkflowStepDef[] in validate.ts", () => {
+  const text = readFileSync(validatePath, "utf8");
+  const helpers = findStepArrayHelpers(text);
+  const recursive = helpers.filter((h) =>
+    new RegExp(`\\b${h.name}\\(`).test(h.body),
+  );
+  assert.ok(
+    recursive.length <= 1,
+    `expected at most 1 recursive helper walking WorkflowStepDef[] in validate.ts, ` +
+      `found ${recursive.length}: ${recursive.map((h) => h.name).join(", ")}`,
+  );
+});
+
+interface Helper {
+  name: string;
+  body: string;
+}
+
+/**
+ * Locate every `function NAME(...)` or `const NAME = (...) => ...` declaration
+ * whose parameter list textually contains `WorkflowStepDef[]`, and return its
+ * name + body (text between the body's matching braces). Nested arrows count
+ * — that's how we catch a helper redeclared inside another function.
+ */
+function findStepArrayHelpers(text: string): Helper[] {
+  const out: Helper[] = [];
+  const declRe = /(?:^|\n)\s*(?:function\s+(\w+)\s*\(|(?:const|let)\s+(\w+)\s*=\s*(?:async\s*)?\()/g;
+  let match: RegExpExecArray | null;
+  while ((match = declRe.exec(text)) !== null) {
+    const name = match[1] ?? match[2];
+    if (!name) continue;
+    const openParen = text.indexOf("(", match.index);
+    if (openParen < 0) continue;
+    const closeParen = findMatching(text, openParen, "(", ")");
+    if (closeParen < 0) continue;
+    const params = text.slice(openParen, closeParen + 1);
+    if (!params.includes("WorkflowStepDef[]")) continue;
+    const bodyOpen = text.indexOf("{", closeParen);
+    if (bodyOpen < 0) continue;
+    const bodyClose = findMatching(text, bodyOpen, "{", "}");
+    if (bodyClose < 0) continue;
+    out.push({ name, body: text.slice(bodyOpen + 1, bodyClose) });
+  }
+  return out;
+}
+
+function findMatching(text: string, openIdx: number, open: string, close: string): number {
+  let depth = 0;
+  for (let i = openIdx; i < text.length; i += 1) {
+    const ch = text[i];
+    if (ch === open) depth += 1;
+    else if (ch === close) {
+      depth -= 1;
+      if (depth === 0) return i;
+    }
+  }
+  return -1;
+}
diff --git a/src/transpile/validate-step.ts b/src/transpile/validate-step.ts
new file mode 100644
index 00000000..cd9fb900
--- /dev/null
+++ b/src/transpile/validate-step.ts
@@ -0,0 +1,1056 @@
+/**
+ * Visitor table for the validator: one row per step type, one expression
+ * dispatcher, and the small per-call-shape helper that holds the five
+ * standard checks. `validateStep` is the only entry point — it consults
+ * `Scope.allowSteps` once and dispatches into `VALIDATORS`; everything below
+ * is scope-aware via the `ValidatorCtx`.
+ */
+import { Diagnostics } from "../diagnostics";
+import { matchSendOperator } from "../parse/core";
+import type { Arg, Expr, jaiphModule, MatchExprDef, WorkflowStepDef } from "../types";
+import { canonicalizeTripleQuotedString } from "../parse/triple-quote";
+import {
+  BARE_SEND_REF_MSG,
+  lookupKind,
+  RULE_REF_EXPECT,
+  RUN_IN_RULE_REF_EXPECT,
+  RUN_TARGET_REF_EXPECT,
+  validateRef,
+  WORKFLOW_REF_EXPECT,
+  type RefExpectMessages,
+  type RefResolutionContext,
+  type RefTargetKind,
+} from "./validate-ref-resolution";
+import { validatePromptReturnsSchema, validatePromptStepReturns } from "./validate-prompt-schema";
+import {
+  validateManagedWorkflowShell,
+  type SubstitutionValidateEnv,
+} from "./validate-substitution";
+import {
+  extractDotFieldRefs,
+  extractInlineCaptures,
+  validateFailString,
+  validateJaiphStringContent,
+  validateLogString,
+  validatePromptString,
+  validateReturnString,
+  validateSimpleInterpolationIdentifiers,
+} from "./validate-string";
+
+export interface Scope {
+  kind: "workflow" | "rule";
+  /** Step types allowed in this scope — single set-lookup gate at the visitor entry. */
+  allowSteps: Set<WorkflowStepDef["type"]>;
+  /** Per-step-type message used when a step is rejected by `allowSteps`. */
+  disallowStepMessages: Partial<Record<WorkflowStepDef["type"], string>>;
+  /** Ref expectation for `run ref(...)` callees (workflow vs rule semantics differ). */
+  runRefExpect: RefExpectMessages;
+  /** True for workflows — rules skip prompt schema collection and reject prompts. */
+  withPromptSchemas: boolean;
+}
+
+export const WORKFLOW_SCOPE: Scope = {
+  kind: "workflow",
+  allowSteps: new Set([
+    "trivia",
+    "send",
+    "say",
+    "return",
+    "const",
+    "exec",
+    "if",
+    "for_lines",
+  ]),
+  disallowStepMessages: {},
+  runRefExpect: RUN_TARGET_REF_EXPECT,
+  withPromptSchemas: true,
+};
+
+export const RULE_SCOPE: Scope = {
+  kind: "rule",
+  allowSteps: new Set(["trivia", "say", "return", "const", "exec", "if", "for_lines"]),
+  disallowStepMessages: {
+    send: "send is not allowed in rules",
+  },
+  runRefExpect: RUN_IN_RULE_REF_EXPECT,
+  withPromptSchemas: false,
+};
+
+export interface ValidatorCtx {
+  diag: Diagnostics;
+  ast: jaiphModule;
+  refCtx: RefResolutionContext;
+  scope: Scope;
+  knownVars: Set<string>;
+  promptSchemas: Map<string, string[]>;
+  recoverBindings: Set<string> | undefined;
+  localChannels: Set<string>;
+  localScripts: Set<string>;
+  localWorkflows: Set<string>;
+  importsByAlias: Map<string, string>;
+  importedAstCache: Map<string, jaiphModule>;
+}
+
+type StepValidator = (s: WorkflowStepDef, ctx: ValidatorCtx) => void;
+
+const VALIDATORS: Record<WorkflowStepDef["type"], StepValidator> = {
+  trivia: () => {},
+  const: validateConstStep,
+  return: validateReturnStep,
+  send: validateSendStep,
+  say: validateSayStep,
+  exec: validateExecStep,
+  if: validateIfStep,
+  for_lines: validateForLinesStep,
+};
+
+/** Sole entry for per-step validation. Scope gate first, table dispatch second. */
+export function validateStep(s: WorkflowStepDef, ctx: ValidatorCtx): void {
+  const v = (VALIDATORS as Record<string, StepValidator | undefined>)[s.type];
+  if (!v) {
+    const loc = (s as { loc?: { line: number; col: number } }).loc ?? { line: 0, col: 0 };
+    ctx.diag.error(
+      ctx.ast.filePath,
+      loc.line,
+      loc.col,
+      "E_VALIDATE",
+      `internal: no validator for step type "${(s as { type: string }).type}"`,
+    );
+  }
+  if (!ctx.scope.allowSteps.has(s.type)) {
+    const msg = ctx.scope.disallowStepMessages[s.type];
+    if (msg !== undefined) {
+      const loc = (s as { loc: { line: number; col: number } }).loc;
+      ctx.diag.error(ctx.ast.filePath, loc.line, loc.col, "E_VALIDATE", msg);
+    }
+    return;
+  }
+  v(s, ctx);
+}
+
+// -- Per-step validators ----------------------------------------------------
+
+function validateConstStep(s: WorkflowStepDef, ctx: ValidatorCtx): void {
+  if (s.type !== "const") return;
+  validateExpr(s.value, s.loc, "const", ctx);
+}
+
+function validateReturnStep(s: WorkflowStepDef, ctx: ValidatorCtx): void {
+  if (s.type !== "return") return;
+  validateExpr(s.value, s.loc, "return", ctx);
+}
+
+function validateSendStep(s: WorkflowStepDef, ctx: ValidatorCtx): void {
+  if (s.type !== "send") return;
+  validateChannelRef(s.channel, s.loc, ctx);
+  validateExpr(s.value, s.loc, "send", ctx);
+}
+
+function validateSayStep(s: WorkflowStepDef, ctx: ValidatorCtx): void {
+  if (s.type !== "say") return;
+  if (s.level === "log" || s.level === "logerr") {
+    if (s.message.kind === "inline_script") return;
+    if (s.message.kind === "literal") {
+      validateLogString(s.message.raw, ctx.ast.filePath, s.loc.line, s.loc.col, s.level);
+      const inner = s.message.raw;
+      validateInlineStringCaptures(inner, s.loc, ctx);
+      if (ctx.scope.withPromptSchemas) {
+        validateDotFieldRefs(inner, s.loc, ctx);
+      }
+      validateSimpleInterpolationIdentifiers(
+        inner,
+        ctx.ast.filePath,
+        s.loc.line,
+        s.loc.col,
+        s.level,
+        ctx.knownVars,
+        ctx.scope.kind,
+        ctx.scope.withPromptSchemas ? ctx.promptSchemas : undefined,
+        ctx.recoverBindings,
+        ctx.localScripts,
+      );
+      return;
+    }
+    ctx.diag.error(
+      ctx.ast.filePath,
+      s.loc.line,
+      s.loc.col,
+      "E_VALIDATE",
+      `unsupported ${s.level} message form`,
+    );
+  }
+  if (s.message.kind !== "literal") {
+    ctx.diag.error(
+      ctx.ast.filePath,
+      s.loc.line,
+      s.loc.col,
+      "E_VALIDATE",
+      "fail message must be a literal string",
+    );
+  }
+  validateFailString(s.message.raw, ctx.ast.filePath, s.loc.line, s.loc.col);
+  const failInner = semanticQuotedOrchestrationInner(s.message.raw);
+  validateInlineStringCaptures(failInner, s.loc, ctx);
+  if (ctx.scope.withPromptSchemas) {
+    validateDotFieldRefs(failInner, s.loc, ctx);
+  }
+  validateSimpleInterpolationIdentifiers(
+    failInner,
+    ctx.ast.filePath,
+    s.loc.line,
+    s.loc.col,
+    "fail",
+    ctx.knownVars,
+    ctx.scope.kind,
+    ctx.scope.withPromptSchemas ? ctx.promptSchemas : undefined,
+    ctx.recoverBindings,
+    ctx.localScripts,
+  );
+}
+
+function validateExecStep(s: WorkflowStepDef, ctx: ValidatorCtx): void {
+  if (s.type !== "exec") return;
+  const body = s.body;
+  if (body.kind === "prompt") {
+    if (ctx.scope.kind === "rule") {
+      ctx.diag.error(
+        ctx.ast.filePath,
+        body.loc.line,
+        body.loc.col,
+        "E_VALIDATE",
+        "prompt is not allowed in rules",
+      );
+    }
+    validateExpr(body, s.loc, "const", ctx);
+    validatePromptStepReturns(body, s.captureName, ctx.ast.filePath);
+    return;
+  }
+  if (body.kind === "shell") {
+    if (ctx.scope.kind === "rule") {
+      ctx.diag.error(
+        ctx.ast.filePath,
+        body.loc.line,
+        body.loc.col,
+        "E_VALIDATE",
+        "inline shell steps are forbidden in rules; use explicit script blocks",
+      );
+    }
+    validateWorkflowShellExec(body, ctx);
+    return;
+  }
+  if (body.kind === "call" && body.async && ctx.scope.kind === "rule") {
+    ctx.diag.error(
+      ctx.ast.filePath,
+      body.callee.loc.line,
+      body.callee.loc.col,
+      "E_VALIDATE",
+      "run async is not allowed in rules; use it in workflows only",
+    );
+  }
+  validateExpr(body, s.loc, "exec", ctx);
+}
+
+function validateIfStep(s: WorkflowStepDef, ctx: ValidatorCtx): void {
+  if (s.type !== "if") return;
+  if (s.operand.kind === "regex") {
+    try {
+      new RegExp(s.operand.source);
+    } catch {
+      ctx.diag.error(
+        ctx.ast.filePath,
+        s.loc.line,
+        s.loc.col,
+        "E_VALIDATE",
+        `invalid regex in if condition: /${s.operand.source}/`,
+      );
+    }
+  }
+  validateDotSubject(s.subject, s.loc, ctx);
+}
+
+function validateForLinesStep(s: WorkflowStepDef, ctx: ValidatorCtx): void {
+  if (s.type !== "for_lines") return;
+  if (!ctx.knownVars.has(s.sourceVar)) {
+    ctx.diag.error(
+      ctx.ast.filePath,
+      s.loc.line,
+      s.loc.col,
+      "E_VALIDATE",
+      `for ... in <name>: "${s.sourceVar}" is not a known variable in this scope`,
+    );
+  }
+}
+
+// -- Expr dispatcher --------------------------------------------------------
+
+type ExprLabel = "const" | "return" | "send" | "exec";
+
+function validateExpr(
+  expr: Expr,
+  stepLoc: { line: number; col: number },
+  label: ExprLabel,
+  ctx: ValidatorCtx,
+): void {
+  if (expr.kind === "literal") {
+    validateLiteralExpr(expr, stepLoc, label, ctx);
+    return;
+  }
+  if (expr.kind === "call" || expr.kind === "ensure_call") {
+    validateCallable(expr, ctx);
+    return;
+  }
+  if (expr.kind === "inline_script") {
+    return;
+  }
+  if (expr.kind === "match") {
+    validateMatchExpr(ctx.diag, ctx.ast.filePath, expr.match, ctx.knownVars);
+    validateDotSubject(expr.match.subject, expr.match.loc, ctx);
+    return;
+  }
+  if (expr.kind === "prompt") {
+    validatePromptExpr(expr, stepLoc, label, ctx);
+    return;
+  }
+  if (expr.kind === "bare_ref") {
+    if (label !== "send") {
+      ctx.diag.error(
+        ctx.ast.filePath,
+        expr.ref.loc.line,
+        expr.ref.loc.col,
+        "E_VALIDATE",
+        "bare reference is only valid as a send payload",
+      );
+    }
+    validateRef(expr.ref, ctx.ast, ctx.refCtx, {
+      mode: "bare_send_rhs",
+      bareSend: BARE_SEND_REF_MSG,
+      lookupImportedKind: makeImportedKindLookup(ctx),
+    });
+    return;
+  }
+  if (expr.kind === "shell") {
+    if (label !== "send") {
+      ctx.diag.error(
+        ctx.ast.filePath,
+        expr.loc.line,
+        expr.loc.col,
+        "E_VALIDATE",
+        "raw shell fragment is only valid as a send payload",
+      );
+    }
+    validateManagedWorkflowShell(expr.command, makeSubEnv(ctx, expr.loc));
+    return;
+  }
+}
+
+function validateLiteralExpr(
+  expr: Extract<Expr, { kind: "literal" }>,
+  stepLoc: { line: number; col: number },
+  label: ExprLabel,
+  ctx: ValidatorCtx,
+): void {
+  if (label === "send") {
+    const inner = expr.raw.startsWith('"') && expr.raw.endsWith('"') ? expr.raw.slice(1, -1) : expr.raw;
+    validateJaiphStringContent(inner, ctx.ast.filePath, stepLoc.line, stepLoc.col, "send");
+    validateInlineStringCaptures(inner, stepLoc, ctx);
+    validateDotFieldRefs(inner, stepLoc, ctx);
+    validateSimpleInterpolationIdentifiers(
+      inner,
+      ctx.ast.filePath,
+      stepLoc.line,
+      stepLoc.col,
+      "send",
+      ctx.knownVars,
+      ctx.scope.kind,
+      ctx.promptSchemas,
+      ctx.recoverBindings,
+      ctx.localScripts,
+    );
+    return;
+  }
+  if (label === "return") {
+    validateReturnString(expr.raw, ctx.ast.filePath, stepLoc.line, stepLoc.col);
+    if (expr.raw.startsWith('"')) {
+      const retInner = stripDQ(expr.raw);
+      validateInlineStringCaptures(retInner, stepLoc, ctx);
+      if (ctx.scope.withPromptSchemas) {
+        validateDotFieldRefs(retInner, stepLoc, ctx);
+      }
+      validateSimpleInterpolationIdentifiers(
+        retInner,
+        ctx.ast.filePath,
+        stepLoc.line,
+        stepLoc.col,
+        "return",
+        ctx.knownVars,
+        ctx.scope.kind,
+        ctx.scope.withPromptSchemas ? ctx.promptSchemas : undefined,
+        ctx.recoverBindings,
+        ctx.localScripts,
+      );
+    }
+    return;
+  }
+  // const / exec — same string-content handling
+  const scriptName = extractConstScriptName(expr.raw);
+  if (scriptName && ctx.localScripts.has(scriptName)) {
+    ctx.diag.error(
+      ctx.ast.filePath,
+      stepLoc.line,
+      stepLoc.col,
+      "E_VALIDATE",
+      `scripts are not values; "${scriptName}" is a script definition`,
+    );
+  }
+  const inner = stripDQ(expr.raw);
+  validateInlineStringCaptures(inner, stepLoc, ctx);
+  if (ctx.scope.withPromptSchemas) {
+    validateDotFieldRefs(inner, stepLoc, ctx);
+  }
+  validateSimpleInterpolationIdentifiers(
+    inner,
+    ctx.ast.filePath,
+    stepLoc.line,
+    stepLoc.col,
+    "const",
+    ctx.knownVars,
+    ctx.scope.kind,
+    ctx.scope.withPromptSchemas ? ctx.promptSchemas : undefined,
+    ctx.recoverBindings,
+    ctx.localScripts,
+  );
+}
+
+function validatePromptExpr(
+  expr: Extract<Expr, { kind: "prompt" }>,
+  stepLoc: { line: number; col: number },
+  label: ExprLabel,
+  ctx: ValidatorCtx,
+): void {
+  if (ctx.scope.kind === "rule") {
+    ctx.diag.error(
+      ctx.ast.filePath,
+      stepLoc.line,
+      stepLoc.col,
+      "E_VALIDATE",
+      "const ... = prompt is not allowed in rules",
+    );
+  }
+  if (label !== "const" && label !== "exec") {
+    ctx.diag.error(
+      ctx.ast.filePath,
+      stepLoc.line,
+      stepLoc.col,
+      "E_VALIDATE",
+      `prompt is not a valid ${label} value`,
+    );
+  }
+  const promptIdent = promptBareIdentifier(expr.raw);
+  if (promptIdent && ctx.localScripts.has(promptIdent)) {
+    ctx.diag.error(
+      ctx.ast.filePath,
+      stepLoc.line,
+      stepLoc.col,
+      "E_VALIDATE",
+      `scripts are not promptable; "${promptIdent}" is a script — use a string const instead`,
+    );
+  }
+  validatePromptString(expr.raw, ctx.ast.filePath, stepLoc.line, stepLoc.col);
+  if (expr.returns !== undefined) {
+    validatePromptReturnsSchema(expr.returns, ctx.ast.filePath, stepLoc.line, stepLoc.col);
+  }
+  const pcInner = stripDQ(expr.raw);
+  validateInlineStringCaptures(pcInner, stepLoc, ctx);
+  validateDotFieldRefs(pcInner, stepLoc, ctx);
+  validateSimpleInterpolationIdentifiers(
+    pcInner,
+    ctx.ast.filePath,
+    stepLoc.line,
+    stepLoc.col,
+    "prompt",
+    ctx.knownVars,
+    ctx.scope.kind,
+    ctx.promptSchemas,
+    ctx.recoverBindings,
+    ctx.localScripts,
+  );
+}
+
+// -- Managed call shape (the "5-check sequence") ----------------------------
+
+/**
+ * The five checks every call site repeats: shell-redirection, nested-unmanaged
+ * call inside literals, ref resolution, arity, and var-arg resolution. The
+ * scope picks the ref expectation for `run` (workflow vs rule semantics).
+ */
+function validateCallable(expr: Expr, ctx: ValidatorCtx): void {
+  if (expr.kind === "call") {
+    const loc = expr.callee.loc;
+    validateNoShellRedirection(ctx.diag, ctx.ast.filePath, loc, "run", expr.args);
+    validateNestedManagedCallArgs(ctx.diag, ctx.ast.filePath, loc, expr.args);
+    const isRuleScope = ctx.scope.kind === "rule";
+    if (
+      !expr.callee.value.includes(".") &&
+      ctx.knownVars.has(expr.callee.value) &&
+      !ctx.localScripts.has(expr.callee.value) &&
+      !(!isRuleScope && ctx.localWorkflows.has(expr.callee.value))
+    ) {
+      ctx.diag.error(
+        ctx.ast.filePath,
+        loc.line,
+        loc.col,
+        "E_VALIDATE",
+        `strings are not executable; "${expr.callee.value}" is a string — use a script instead`,
+      );
+    }
+    validateRef(expr.callee, ctx.ast, ctx.refCtx, {
+      mode: "expect",
+      expect: ctx.scope.runRefExpect,
+    });
+    validateArity(ctx.diag, ctx.ast.filePath, loc, expr.callee.value, expr.args, "workflow", ctx.ast, ctx.refCtx);
+    validateArgVarRefs(ctx.diag, ctx.ast.filePath, loc, expr.args, ctx.knownVars, ctx.recoverBindings);
+    return;
+  }
+  if (expr.kind === "ensure_call") {
+    const loc = expr.callee.loc;
+    validateNoShellRedirection(ctx.diag, ctx.ast.filePath, loc, "ensure", expr.args);
+    validateNestedManagedCallArgs(ctx.diag, ctx.ast.filePath, loc, expr.args);
+    validateRef(expr.callee, ctx.ast, ctx.refCtx, { mode: "expect", expect: RULE_REF_EXPECT });
+    validateArity(ctx.diag, ctx.ast.filePath, loc, expr.callee.value, expr.args, "rule", ctx.ast, ctx.refCtx);
+    validateArgVarRefs(ctx.diag, ctx.ast.filePath, loc, expr.args, ctx.knownVars, ctx.recoverBindings);
+  }
+}
+
+// -- Match expression -------------------------------------------------------
+
+export function validateMatchExpr(
+  diag: Diagnostics,
+  filePath: string,
+  expr: MatchExprDef,
+  knownVars: Set<string>,
+): void {
+  if (expr.arms.length === 0) {
+    diag.error(filePath, expr.loc.line, expr.loc.col, "E_VALIDATE", "match must have at least one arm");
+  }
+  let wildcardCount = 0;
+  for (const arm of expr.arms) {
+    if (arm.pattern.kind === "wildcard") wildcardCount += 1;
+    if (arm.pattern.kind === "regex") {
+      try {
+        new RegExp(arm.pattern.source);
+      } catch {
+        diag.error(
+          filePath,
+          expr.loc.line,
+          expr.loc.col,
+          "E_VALIDATE",
+          `invalid regex in match pattern: /${arm.pattern.source}/`,
+        );
+      }
+    }
+    const bodyTrimmed = (arm.tripleQuotedBody ? canonicalizeTripleQuotedString(arm.body) : arm.body).trimStart();
+    if (/^return(\s|$)/.test(bodyTrimmed)) {
+      diag.error(
+        filePath,
+        expr.loc.line,
+        expr.loc.col,
+        "E_VALIDATE",
+        `match arm body must not start with "return"; the match expression itself produces the value — use the expression directly after =>`,
+      );
+    }
+    if (/`[^`]*`\s*\(/.test(bodyTrimmed) || bodyTrimmed.startsWith("```")) {
+      diag.error(
+        filePath,
+        expr.loc.line,
+        expr.loc.col,
+        "E_VALIDATE",
+        `inline scripts are not allowed in match arm bodies; use a named script with "run script_name(…)" instead`,
+      );
+    }
+    if (!arm.tripleQuotedBody) {
+      const idMatch = bodyTrimmed.match(/^([A-Za-z_][A-Za-z0-9_]*)/);
+      if (idMatch) {
+        const ident = idMatch[1]!;
+        const after = bodyTrimmed.slice(ident.length);
+        const startsCall = after.startsWith("(");
+        const startsArgs = /^\s+\S/.test(after);
+        if ((startsCall || startsArgs) && ident !== "fail" && ident !== "run" && ident !== "ensure") {
+          const hint = ident === "error" ? ` did you mean "fail"?` : "";
+          diag.error(
+            filePath,
+            expr.loc.line,
+            expr.loc.col,
+            "E_VALIDATE",
+            `unknown match arm verb "${ident}"; allowed: fail "...", run ref(...), ensure ref(...).${hint}`,
+          );
+        }
+        if (!startsCall && !startsArgs && after.trim() === "" && !knownVars.has(ident)) {
+          diag.error(
+            filePath,
+            expr.loc.line,
+            expr.loc.col,
+            "E_VALIDATE",
+            `unknown identifier "${ident}" in match arm body; declare it with "const", use a capture, or add a parameter`,
+          );
+        }
+      }
+    }
+  }
+  if (wildcardCount === 0) {
+    diag.error(filePath, expr.loc.line, expr.loc.col, "E_VALIDATE", "match must have exactly one wildcard (_) arm");
+  }
+  if (wildcardCount > 1) {
+    diag.error(
+      filePath,
+      expr.loc.line,
+      expr.loc.col,
+      "E_VALIDATE",
+      "match must have exactly one wildcard (_) arm, found multiple",
+    );
+  }
+}
+
+// -- Workflow shell exec (workflow-only body kind) --------------------------
+
+function validateWorkflowShellExec(
+  body: Extract<Expr, { kind: "shell" }>,
+  ctx: ValidatorCtx,
+): void {
+  if (hasUnquotedSendArrow(body.command) && matchSendOperator(body.command) === null) {
+    ctx.diag.error(
+      ctx.ast.filePath,
+      body.loc.line,
+      body.loc.col,
+      "E_VALIDATE",
+      "invalid send: channel must be a single name or `alias.name` (at most one dot in the channel part)",
+    );
+  }
+  const t = body.command.trim();
+  if (/^(?:[A-Za-z_][A-Za-z0-9_]*)(?:\.[A-Za-z_][A-Za-z0-9_]*)*$/.test(t)) {
+    if (!t.includes(".")) {
+      if (ctx.localScripts.has(t) || ctx.localWorkflows.has(t)) {
+        ctx.diag.error(
+          ctx.ast.filePath,
+          body.loc.line,
+          body.loc.col,
+          "E_VALIDATE",
+          `use run ${t}() — a bare name that refers to a script or workflow must use a managed run step`,
+        );
+      }
+    } else {
+      validateRef({ value: t, loc: body.loc }, ctx.ast, ctx.refCtx, {
+        mode: "expect",
+        expect: RUN_TARGET_REF_EXPECT,
+      });
+      ctx.diag.error(
+        ctx.ast.filePath,
+        body.loc.line,
+        body.loc.col,
+        "E_VALIDATE",
+        `use run ${t}() — "${t}" is a valid script or workflow reference; use a managed run step`,
+      );
+    }
+  }
+}
+
+// -- Channel/route helpers --------------------------------------------------
+
+function validateChannelRef(channel: string, loc: { line: number; col: number }, ctx: ValidatorCtx): void {
+  const parts = channel.split(".");
+  if (parts.length === 1) {
+    if (!ctx.localChannels.has(channel)) {
+      ctx.diag.error(ctx.ast.filePath, loc.line, loc.col, "E_VALIDATE", `Channel "${channel}" is not defined`);
+    }
+    return;
+  }
+  if (parts.length !== 2) {
+    ctx.diag.error(ctx.ast.filePath, loc.line, loc.col, "E_VALIDATE", `Channel "${channel}" is not defined`);
+  }
+  const [alias, importedChannel] = parts;
+  const importedFile = ctx.importsByAlias.get(alias);
+  if (!importedFile) {
+    ctx.diag.error(ctx.ast.filePath, loc.line, loc.col, "E_VALIDATE", `Channel "${channel}" is not defined`);
+  }
+  const importedAst = ctx.importedAstCache.get(importedFile)!;
+  const importedChannels = new Set(importedAst.channels.map((c) => c.name));
+  if (!importedChannels.has(importedChannel)) {
+    ctx.diag.error(ctx.ast.filePath, loc.line, loc.col, "E_VALIDATE", `Channel "${channel}" is not defined`);
+  }
+}
+
+export const ROUTE_REF_EXPECT: RefExpectMessages = WORKFLOW_REF_EXPECT;
+
+export function resolveRouteTargetParams(
+  ref: string,
+  ast: jaiphModule,
+  refCtx: RefResolutionContext,
+): number | undefined {
+  const dotIdx = ref.indexOf(".");
+  if (dotIdx >= 0) {
+    const alias = ref.slice(0, dotIdx);
+    const name = ref.slice(dotIdx + 1);
+    const importPath = refCtx.importsByAlias.get(alias);
+    if (!importPath) return undefined;
+    const importedAst = refCtx.importedAstCache.get(importPath);
+    if (!importedAst) return undefined;
+    const wf = importedAst.workflows.find((w) => w.name === name);
+    return wf?.params.length;
+  }
+  const wf = ast.workflows.find((w) => w.name === ref);
+  return wf?.params.length;
+}
+
+// -- Inline string captures / dot-field refs --------------------------------
+
+function validateInlineStringCaptures(
+  content: string,
+  loc: { line: number; col: number },
+  ctx: ValidatorCtx,
+): void {
+  for (const cap of extractInlineCaptures(content)) {
+    if (cap.kind === "run") {
+      validateNoShellRedirection(ctx.diag, ctx.ast.filePath, loc, "run", cap.args);
+      validateRef({ value: cap.ref, loc }, ctx.ast, ctx.refCtx, {
+        mode: "expect",
+        expect: ctx.scope.runRefExpect,
+      });
+    } else {
+      validateNoShellRedirection(ctx.diag, ctx.ast.filePath, loc, "ensure", cap.args);
+      validateRef({ value: cap.ref, loc }, ctx.ast, ctx.refCtx, {
+        mode: "expect",
+        expect: RULE_REF_EXPECT,
+      });
+    }
+  }
+}
+
+function validateDotFieldRefs(
+  content: string,
+  loc: { line: number; col: number },
+  ctx: ValidatorCtx,
+): void {
+  for (const ref of extractDotFieldRefs(content)) {
+    validateDotFieldRef(ref.varName, ref.fieldName, loc, ctx);
+  }
+}
+
+/**
+ * Validate a dot-notation `if` / `match` subject like `r.verdict`. Emits the
+ * same `E_VALIDATE` diagnostics as `${var.field}` interpolation when the base
+ * is not a typed prompt capture or the field is not in its `returns` schema.
+ * Non-dot subjects (single identifier) are accepted without further checks
+ * to preserve prior behavior.
+ */
+function validateDotSubject(
+  subject: string,
+  loc: { line: number; col: number },
+  ctx: ValidatorCtx,
+): void {
+  const dotIdx = subject.indexOf(".");
+  if (dotIdx === -1) return;
+  const varName = subject.slice(0, dotIdx);
+  const fieldName = subject.slice(dotIdx + 1);
+  validateDotFieldRef(varName, fieldName, loc, ctx);
+}
+
+function validateDotFieldRef(
+  varName: string,
+  fieldName: string,
+  loc: { line: number; col: number },
+  ctx: ValidatorCtx,
+): void {
+  const fields = ctx.promptSchemas.get(varName);
+  if (!fields) {
+    ctx.diag.error(
+      ctx.ast.filePath,
+      loc.line,
+      loc.col,
+      "E_VALIDATE",
+      `\${${varName}.${fieldName}}: "${varName}" is not a typed prompt capture; dot notation requires a prompt with "returns" schema`,
+    );
+    return;
+  }
+  if (!fields.includes(fieldName)) {
+    ctx.diag.error(
+      ctx.ast.filePath,
+      loc.line,
+      loc.col,
+      "E_VALIDATE",
+      `\${${varName}.${fieldName}}: field "${fieldName}" is not defined in the returns schema for "${varName}"; available fields: ${fields.join(", ")}`,
+    );
+  }
+}
+
+// -- Shared call-shape helpers ----------------------------------------------
+
+function hasShellRedirection(args: Arg[] | undefined): boolean {
+  if (!args) return false;
+  for (const a of args) {
+    if (a.kind !== "literal") continue;
+    let inQuote = false;
+    const raw = a.raw;
+    for (let i = 0; i < raw.length; i++) {
+      const ch = raw[i];
+      if (ch === '"' && (i === 0 || raw[i - 1] !== "\\")) {
+        inQuote = !inQuote;
+        continue;
+      }
+      if (!inQuote && (ch === ">" || ch === "|" || ch === "&")) {
+        return true;
+      }
+    }
+  }
+  return false;
+}
+
+export function validateNoShellRedirection(
+  diag: Diagnostics,
+  filePath: string,
+  loc: { line: number; col: number },
+  keyword: string,
+  args: Arg[] | undefined,
+): void {
+  if (!hasShellRedirection(args)) return;
+  diag.error(
+    filePath,
+    loc.line,
+    loc.col,
+    "E_VALIDATE",
+    `shell redirection (>, >>, |, &) is not supported with ${keyword}; use a script block for shell operations`,
+  );
+}
+
+function validateNestedManagedCallArgs(
+  diag: Diagnostics,
+  filePath: string,
+  loc: { line: number; col: number },
+  args: Arg[] | undefined,
+): void {
+  if (!args) return;
+  for (const a of args) {
+    if (a.kind !== "literal") continue;
+    checkNestedManagedInLiteral(diag, filePath, loc, a.raw);
+  }
+}
+
+function checkNestedManagedInLiteral(
+  diag: Diagnostics,
+  filePath: string,
+  loc: { line: number; col: number },
+  raw: string,
+): void {
+  const stripped = stripQuotedSegmentContent(raw);
+  const re = /\b([A-Za-z_][A-Za-z0-9_.]*)\s*\(/g;
+  let match: RegExpExecArray | null;
+  while ((match = re.exec(stripped)) !== null) {
+    const before = stripped.slice(0, match.index).trimEnd();
+    const lastToken = before.length === 0 ? "" : before.slice(before.lastIndexOf(" ") + 1);
+    if (lastToken === "run" || lastToken === "ensure") continue;
+    diag.error(
+      filePath,
+      loc.line,
+      loc.col,
+      "E_VALIDATE",
+      `nested managed calls in argument position must be explicit; use "run ${match[1]}(...)" or "ensure ${match[1]}(...)" inside the argument list`,
+    );
+  }
+  const btRe = /`[^`]*`\s*\(/g;
+  let btMatch: RegExpExecArray | null;
+  while ((btMatch = btRe.exec(stripped)) !== null) {
+    const before = stripped.slice(0, btMatch.index).trimEnd();
+    const lastToken = before.length === 0 ? "" : before.slice(before.lastIndexOf(" ") + 1);
+    if (lastToken === "run" || lastToken === "ensure") continue;
+    diag.error(
+      filePath,
+      loc.line,
+      loc.col,
+      "E_VALIDATE",
+      `nested inline script calls in argument position must be explicit; use "run \`...\`(...)" inside the argument list`,
+    );
+  }
+}
+
+function stripQuotedSegmentContent(segment: string): string {
+  let out = "";
+  let quote: "'" | '"' | null = null;
+  for (let i = 0; i < segment.length; i += 1) {
+    const ch = segment[i]!;
+    if (quote) {
+      if (ch === quote && segment[i - 1] !== "\\") {
+        quote = null;
+      }
+      out += " ";
+      continue;
+    }
+    if (ch === "'" || ch === '"') {
+      quote = ch;
+      out += " ";
+      continue;
+    }
+    out += ch;
+  }
+  return out;
+}
+
+function validateArgVarRefs(
+  diag: Diagnostics,
+  filePath: string,
+  loc: { line: number; col: number },
+  args: Arg[] | undefined,
+  knownVars: Set<string>,
+  recoverBindings?: Set<string>,
+): void {
+  if (!args) return;
+  for (const a of args) {
+    if (a.kind !== "var") continue;
+    if (recoverBindings?.has(a.name)) continue;
+    if (knownVars.has(a.name)) continue;
+    diag.error(
+      filePath,
+      loc.line,
+      loc.col,
+      "E_VALIDATE",
+      `unknown identifier "${a.name}" used as bare argument; declare it with "const", use a capture, or add a workflow/rule parameter`,
+    );
+  }
+}
+
+function validateArity(
+  diag: Diagnostics,
+  filePath: string,
+  loc: { line: number; col: number },
+  ref: string,
+  args: Arg[] | undefined,
+  targetKind: "workflow" | "rule",
+  ast: jaiphModule,
+  refCtx: RefResolutionContext,
+): void {
+  const params = lookupCalleeParams(ref, targetKind, ast, refCtx);
+  if (params === undefined) return;
+  const argCount = args?.length ?? 0;
+  if (argCount !== params.length) {
+    diag.error(
+      filePath,
+      loc.line,
+      loc.col,
+      "E_VALIDATE",
+      `${targetKind} "${ref}" expects ${params.length} argument(s) (${params.join(", ") || "none"}), but got ${argCount}`,
+    );
+  }
+}
+
+function lookupCalleeParams(
+  ref: string,
+  targetKind: "workflow" | "rule",
+  ast: jaiphModule,
+  refCtx: RefResolutionContext,
+): string[] | undefined {
+  const parts = ref.split(".");
+  if (parts.length === 1) {
+    const name = parts[0];
+    if (targetKind === "workflow") {
+      const wf = ast.workflows.find((w) => w.name === name);
+      return wf?.params;
+    }
+    const rl = ast.rules.find((r) => r.name === name);
+    return rl?.params;
+  }
+  if (parts.length === 2) {
+    const [alias, name] = parts;
+    const importedFile = refCtx.importsByAlias.get(alias);
+    if (!importedFile) return undefined;
+    const importedAst = refCtx.importedAstCache.get(importedFile);
+    if (!importedAst) return undefined;
+    if (targetKind === "workflow") {
+      const wf = importedAst.workflows.find((w) => w.name === name);
+      return wf?.params;
+    }
+    const rl = importedAst.rules.find((r) => r.name === name);
+    return rl?.params;
+  }
+  return undefined;
+}
+
+// -- Misc small helpers -----------------------------------------------------
+
+function hasUnquotedSendArrow(line: string): boolean {
+  let inSingleQuote = false;
+  let inDoubleQuote = false;
+  for (let i = 0; i < line.length; i += 1) {
+    const ch = line[i];
+    if (ch === "\\" && (inDoubleQuote || inSingleQuote)) {
+      i += 1;
+      continue;
+    }
+    if (ch === "'" && !inDoubleQuote) {
+      inSingleQuote = !inSingleQuote;
+      continue;
+    }
+    if (ch === '"' && !inSingleQuote) {
+      inDoubleQuote = !inDoubleQuote;
+      continue;
+    }
+    if (!inSingleQuote && !inDoubleQuote && ch === "<" && line[i + 1] === "-") {
+      return true;
+    }
+  }
+  return false;
+}
+
+function stripDQ(s: string): string {
+  return s.length >= 2 && s[0] === '"' && s[s.length - 1] === '"' ? s.slice(1, -1) : s;
+}
+
+function semanticQuotedOrchestrationInner(dqRaw: string): string {
+  return stripDQ(dqRaw);
+}
+
+function extractConstScriptName(rhs: string): string | undefined {
+  const trimmed = rhs.trim();
+  if (/^[a-zA-Z_][a-zA-Z0-9_]*$/.test(trimmed)) return trimmed;
+  const inner = stripDQ(trimmed);
+  const m = inner.match(/^\$\{([a-zA-Z_][a-zA-Z0-9_]*)\}$/);
+  return m?.[1];
+}
+
+function promptBareIdentifier(raw: string): string | undefined {
+  const m = raw.match(/^"\$\{([A-Za-z_][A-Za-z0-9_]*)\}"$/);
+  return m?.[1];
+}
+
+export function parseSchemaFieldNames(rawSchema: string): string[] {
+  const inner = rawSchema.trim().replace(/^\s*\{\s*/, "").replace(/\s*\}\s*$/, "").trim();
+  if (!inner) return [];
+  const names: string[] = [];
+  for (const part of inner.split(",")) {
+    const m = part.trim().match(/^\s*([A-Za-z_][A-Za-z0-9_]*)\s*:\s*\S+\s*$/);
+    if (m) names.push(m[1]);
+  }
+  return names;
+}
+
+function makeImportedKindLookup(
+  ctx: ValidatorCtx,
+): (alias: string, name: string) => RefTargetKind | undefined {
+  return (alias, name) => {
+    const importedFile = ctx.importsByAlias.get(alias);
+    if (!importedFile) return undefined;
+    const importedAst = ctx.importedAstCache.get(importedFile)!;
+    return lookupKind(importedAst, name);
+  };
+}
+
+function makeSubEnv(
+  ctx: ValidatorCtx,
+  loc: { line: number; col: number },
+): SubstitutionValidateEnv {
+  return {
+    filePath: ctx.ast.filePath,
+    loc,
+    localRules: new Set(ctx.ast.rules.map((r) => r.name)),
+    localWorkflows: ctx.localWorkflows,
+    localScripts: ctx.localScripts,
+    importsByAlias: ctx.importsByAlias,
+    lookupImported: makeImportedKindLookup(ctx),
+  };
+}
diff --git a/src/transpile/validate-string.test.ts b/src/transpile/validate-string.test.ts
index f2e2cc93..251b65e3 100644
--- a/src/transpile/validate-string.test.ts
+++ b/src/transpile/validate-string.test.ts
@@ -399,11 +399,11 @@ test("rejected: ${run ref} with unknown ref in workflow", () => {
   });
 });
 
-test("extractInlineCaptures extracts run and ensure with args", () => {
+test("extractInlineCaptures extracts run and ensure with typed Arg[]", () => {
   const { extractInlineCaptures } = require("./validate-string");
   const result = extractInlineCaptures('prefix ${run greet(world)} middle ${ensure check()} suffix');
   assert.deepEqual(result, [
-    { kind: "run", ref: "greet", args: "${world}" },
+    { kind: "run", ref: "greet", args: [{ kind: "var", name: "world" }] },
     { kind: "ensure", ref: "check", args: undefined },
   ]);
 });
diff --git a/src/transpile/validate-string.ts b/src/transpile/validate-string.ts
index f6cdff05..4851031c 100644
--- a/src/transpile/validate-string.ts
+++ b/src/transpile/validate-string.ts
@@ -11,7 +11,7 @@
 
 import { jaiphError } from "../errors";
 import { parseCallRef } from "../parse/core";
-import { dedentCommonLeadingWhitespace } from "../parse/dedent";
+import type { Arg } from "../types";
 
 /**
  * Check for shell fallback/expansion syntax inside ${...} blocks.
@@ -99,7 +99,7 @@ const INLINE_CAPTURE_RE = /\$\{(run|ensure)\s+([^}]+)\}/g;
 export interface InlineCapture {
   kind: "run" | "ensure";
   ref: string;
-  args?: string;
+  args?: Arg[];
 }
 
 /** Extract ${run ref [args]} and ${ensure ref [args]} from string content (unquoted). */
@@ -281,7 +281,7 @@ export function validateJaiphStringContent(
       );
     }
 
-    if (call.args && /\$\{(?:run|ensure)\s/.test(call.args)) {
+    if (call.args?.some((a) => a.kind === "literal" && /\$\{(?:run|ensure)\s/.test(a.raw))) {
       throw jaiphError(
         filePath, line, col, "E_PARSE",
         `${context} cannot contain nested inline captures; extract to a const variable`,
@@ -298,15 +298,15 @@ export function validatePromptString(
   filePath: string,
   line: number,
   col: number,
-  opts?: { tripleQuoted?: boolean },
 ): void {
-  let content = stripDoubleQuotes(raw);
-  if (opts?.tripleQuoted) content = dedentCommonLeadingWhitespace(content);
+  const content = stripDoubleQuotes(raw);
   validateJaiphStringContent(content, filePath, line, col, "prompt");
 }
 
 /**
- * Validate a log/logerr message (inner content without quotes).
+ * Validate a log/logerr message (inner content without quotes). Triple-quoted
+ * messages arrive pre-dedented from the parser, so this validator no longer
+ * needs to know about that distinction.
  */
 export function validateLogString(
   message: string,
@@ -314,10 +314,8 @@ export function validateLogString(
   line: number,
   col: number,
   keyword: string,
-  opts?: { tripleQuoted?: boolean },
 ): void {
-  const text = opts?.tripleQuoted ? dedentCommonLeadingWhitespace(message) : message;
-  validateJaiphStringContent(text, filePath, line, col, keyword);
+  validateJaiphStringContent(message, filePath, line, col, keyword);
 }
 
 /**
@@ -328,10 +326,8 @@ export function validateFailString(
   filePath: string,
   line: number,
   col: number,
-  opts?: { tripleQuoted?: boolean },
 ): void {
-  let content = stripDoubleQuotes(message);
-  if (opts?.tripleQuoted) content = dedentCommonLeadingWhitespace(content);
+  const content = stripDoubleQuotes(message);
   validateJaiphStringContent(content, filePath, line, col, "fail");
 }
 
@@ -343,11 +339,9 @@ export function validateReturnString(
   filePath: string,
   line: number,
   col: number,
-  opts?: { tripleQuoted?: boolean },
 ): void {
   if (value.startsWith('"')) {
-    let content = stripDoubleQuotes(value);
-    if (opts?.tripleQuoted) content = dedentCommonLeadingWhitespace(content);
+    const content = stripDoubleQuotes(value);
     validateJaiphStringContent(content, filePath, line, col, "return");
   }
 }
diff --git a/src/transpile/validate-visitor.test.ts b/src/transpile/validate-visitor.test.ts
new file mode 100644
index 00000000..222d6efa
--- /dev/null
+++ b/src/transpile/validate-visitor.test.ts
@@ -0,0 +1,289 @@
+/**
+ * Acceptance tests for Refactor 4 (visitor-table validator).
+ *
+ * AC1 — `src/transpile/validate.ts` is at most 700 lines.
+ * AC3 — Diagnostic snapshot over every txtar `validate-*` error fixture pins
+ *       `{ code, line, col, message }` bit-for-bit.
+ * AC4 — Adding a new step type requires exactly one row in `VALIDATORS`: a
+ *       synthetic step type injected via type cast is rejected with the
+ *       documented "internal: no validator" message and produces exactly
+ *       one diagnostic.
+ */
+import test from "node:test";
+import assert from "node:assert/strict";
+import {
+  existsSync,
+  mkdtempSync,
+  readFileSync,
+  rmSync,
+  writeFileSync,
+} from "node:fs";
+import { join, resolve } from "node:path";
+import { tmpdir } from "node:os";
+import { Diagnostics } from "../diagnostics";
+import { loadModuleGraph } from "./module-graph";
+import { collectDiagnostics } from "./validate";
+import {
+  RULE_SCOPE,
+  WORKFLOW_SCOPE,
+  validateStep,
+  type ValidatorCtx,
+} from "./validate-step";
+import type { jaiphModule, WorkflowStepDef } from "../types";
+
+const repoRoot = resolve(__dirname, "../../..");
+const validatePath = resolve(repoRoot, "src/transpile/validate.ts");
+
+// --- AC1: file size bound -------------------------------------------------
+
+test("AC1: validate.ts is at most 700 lines", () => {
+  const text = readFileSync(validatePath, "utf8");
+  const lineCount = text.split("\n").length;
+  assert.ok(
+    lineCount <= 700,
+    `validate.ts is ${lineCount} lines (limit 700). The visitor-table refactor (Refactor 4) bounds this file; new validators belong in validate-step.ts.`,
+  );
+});
+
+// --- AC3: diagnostic snapshot --------------------------------------------
+
+interface TxtarTestCase {
+  name: string;
+  files: Map<string, string>;
+}
+
+function parseTxtar(content: string): TxtarTestCase[] {
+  const cases: TxtarTestCase[] = [];
+  const blocks = content.split(/^=== /m);
+  for (const block of blocks) {
+    const trimmed = block.trim();
+    if (!trimmed) continue;
+    const lines = trimmed.split("\n");
+    const name = lines[0].trim();
+    let fileStartIdx = -1;
+    for (let i = 1; i < lines.length; i += 1) {
+      if (lines[i].startsWith("--- ")) {
+        fileStartIdx = i;
+        break;
+      }
+    }
+    if (fileStartIdx < 0) continue;
+    cases.push({ name, files: parseVirtualFiles(lines.slice(fileStartIdx)) });
+  }
+  return cases;
+}
+
+function parseVirtualFiles(lines: string[]): Map<string, string> {
+  const files = new Map<string, string>();
+  let cur: string | undefined;
+  let buf: string[] = [];
+  for (const line of lines) {
+    if (line.startsWith("--- ")) {
+      if (cur !== undefined) files.set(cur, buf.join("\n") + "\n");
+      cur = line.slice(4).trim();
+      buf = [];
+    } else {
+      buf.push(line);
+    }
+  }
+  if (cur !== undefined) files.set(cur, buf.join("\n") + "\n");
+  return files;
+}
+
+function entryFile(files: Map<string, string>): string {
+  if (files.has("main.jh")) return "main.jh";
+  if (files.has("input.jh")) return "input.jh";
+  if (files.has("input.test.jh")) return "input.test.jh";
+  const first = files.keys().next().value;
+  if (!first) throw new Error("no virtual files");
+  return first;
+}
+
+interface SnapshotEntry {
+  file: string;
+  line: number;
+  col: number;
+  code: string;
+  message: string;
+}
+type Snapshot = Record<string, SnapshotEntry[]>;
+
+function captureSnapshot(): Snapshot {
+  const fixturesDir = resolve(repoRoot, "test-fixtures/compiler-txtar");
+  const out: Snapshot = {};
+  const files = ["validate-errors.txt", "validate-errors-multi-module.txt"];
+  for (const fileName of files) {
+    const content = readFileSync(join(fixturesDir, fileName), "utf8");
+    for (const tc of parseTxtar(content)) {
+      const key = `${fileName} > ${tc.name}`;
+      const tmpDir = mkdtempSync(join(tmpdir(), "jaiph-snap-"));
+      try {
+        for (const [name, body] of tc.files) {
+          writeFileSync(join(tmpDir, name), body, "utf8");
+        }
+        const entry = join(tmpDir, entryFile(tc.files));
+        let diagnostics: SnapshotEntry[] = [];
+        try {
+          const graph = loadModuleGraph(entry);
+          const diag = collectDiagnostics(graph);
+          diagnostics = diag.sorted().map((d) => ({
+            file: relativizeTmp(d.file, tmpDir),
+            line: d.line,
+            col: d.col,
+            code: d.code,
+            message: scrubTmp(d.message, tmpDir),
+          }));
+        } catch (e) {
+          // Fatal parser/loader error — capture as a synthetic diagnostic row
+          // so the snapshot still pins the failure mode.
+          const msg = (e as Error).message ?? String(e);
+          const m = msg.match(/^(.+):(\d+):(\d+) (\S+) ([\s\S]+)$/);
+          diagnostics = [
+            m
+              ? {
+                  file: relativizeTmp(m[1], tmpDir),
+                  line: Number(m[2]),
+                  col: Number(m[3]),
+                  code: m[4],
+                  message: scrubTmp(m[5], tmpDir),
+                }
+              : {
+                  file: "<unknown>",
+                  line: 0,
+                  col: 0,
+                  code: "E_FATAL",
+                  message: scrubTmp(msg, tmpDir),
+                },
+          ];
+        }
+        out[key] = diagnostics;
+      } finally {
+        rmSync(tmpDir, { recursive: true, force: true });
+      }
+    }
+  }
+  return out;
+}
+
+function relativizeTmp(p: string, tmpDir: string): string {
+  if (p.startsWith(tmpDir)) {
+    const rel = p.slice(tmpDir.length);
+    return rel.replace(/^[\/]+/, "");
+  }
+  return p;
+}
+
+/** Replace `<tmpDir>/...` substrings in error messages with `<TMP>/...` so the snapshot is stable across runs. */
+function scrubTmp(msg: string, tmpDir: string): string {
+  const escaped = tmpDir.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");
+  return msg.replace(new RegExp(escaped, "g"), "<TMP>");
+}
+
+test("AC3: validate-* fixtures diagnostic snapshot pins {code, line, col, message}", () => {
+  const snapshotPath = resolve(
+    repoRoot,
+    "test-fixtures/compiler-txtar/validate-diagnostics-snapshot.json",
+  );
+  const current = captureSnapshot();
+
+  if (process.env.UPDATE_SNAPSHOTS === "1" || !existsSync(snapshotPath)) {
+    writeFileSync(snapshotPath, JSON.stringify(current, null, 2) + "\n", "utf8");
+    return;
+  }
+  const stored = JSON.parse(readFileSync(snapshotPath, "utf8")) as Snapshot;
+  assert.deepEqual(
+    current,
+    stored,
+    "diagnostic output drifted from snapshot. Re-run with UPDATE_SNAPSHOTS=1 only after confirming the change is intentional.",
+  );
+});
+
+// --- AC4: unknown step type rejection -------------------------------------
+
+test("AC4: unknown step type is rejected with the documented 'no validator' diagnostic (one error)", () => {
+  const ast: jaiphModule = {
+    filePath: "/synthetic.jh",
+    imports: [],
+    channels: [],
+    exports: [],
+    rules: [],
+    scripts: [],
+    workflows: [],
+  };
+  const diag = new Diagnostics();
+  const ctx: ValidatorCtx = {
+    diag,
+    ast,
+    refCtx: {
+      importsByAlias: new Map(),
+      importedAstCache: new Map(),
+      localRules: new Set(),
+      localWorkflows: new Set(),
+      localScripts: new Set(),
+    },
+    scope: WORKFLOW_SCOPE,
+    knownVars: new Set(),
+    promptSchemas: new Map(),
+    recoverBindings: undefined,
+    localChannels: new Set(),
+    localScripts: new Set(),
+    localWorkflows: new Set(),
+    importsByAlias: new Map(),
+    importedAstCache: new Map(),
+  };
+
+  const syntheticStep = {
+    type: "ZZZ_synthetic_step_type",
+    loc: { line: 42, col: 7 },
+  } as unknown as WorkflowStepDef;
+
+  diag.capture(() => validateStep(syntheticStep, ctx));
+  const errs = diag.sorted();
+  assert.equal(errs.length, 1, `expected exactly one diagnostic, got ${JSON.stringify(errs)}`);
+  assert.equal(errs[0].code, "E_VALIDATE");
+  assert.equal(errs[0].line, 42);
+  assert.equal(errs[0].col, 7);
+  assert.match(errs[0].message, /^internal: no validator for step type "ZZZ_synthetic_step_type"$/);
+});
+
+test("AC4: same synthetic step type is rejected in RULE_SCOPE too (scope-independent fallback)", () => {
+  const ast: jaiphModule = {
+    filePath: "/synthetic.jh",
+    imports: [],
+    channels: [],
+    exports: [],
+    rules: [],
+    scripts: [],
+    workflows: [],
+  };
+  const diag = new Diagnostics();
+  const ctx: ValidatorCtx = {
+    diag,
+    ast,
+    refCtx: {
+      importsByAlias: new Map(),
+      importedAstCache: new Map(),
+      localRules: new Set(),
+      localWorkflows: new Set(),
+      localScripts: new Set(),
+    },
+    scope: RULE_SCOPE,
+    knownVars: new Set(),
+    promptSchemas: new Map(),
+    recoverBindings: undefined,
+    localChannels: new Set(),
+    localScripts: new Set(),
+    localWorkflows: new Set(),
+    importsByAlias: new Map(),
+    importedAstCache: new Map(),
+  };
+  const syntheticStep = {
+    type: "ZZZ_synthetic_step_type",
+    loc: { line: 3, col: 1 },
+  } as unknown as WorkflowStepDef;
+
+  diag.capture(() => validateStep(syntheticStep, ctx));
+  const errs = diag.sorted();
+  assert.equal(errs.length, 1);
+  assert.match(errs[0].message, /^internal: no validator for step type "ZZZ_synthetic_step_type"$/);
+});
diff --git a/src/transpile/validate.ts b/src/transpile/validate.ts
index 30627918..e9d4d486 100644
--- a/src/transpile/validate.ts
+++ b/src/transpile/validate.ts
@@ -1,240 +1,78 @@
+import { existsSync } from "node:fs";
 import { dirname, resolve } from "node:path";
-import { jaiphError } from "../errors";
-import type { jaiphModule, MatchExprDef, WorkflowStepDef } from "../types";
-import type { SubstitutionValidateEnv } from "./validate-substitution";
-import { validateManagedWorkflowShell } from "./validate-substitution";
-import type { RefResolutionContext, RefTargetKind } from "./validate-ref-resolution";
+import { Diagnostics } from "../diagnostics";
+import type { Expr, jaiphModule, WorkflowStepDef } from "../types";
+import type { ModuleGraph } from "./module-graph";
+import { validateRef } from "./validate-ref-resolution";
 import {
-  BARE_SEND_REF_MSG,
-  lookupKind,
-  RULE_REF_EXPECT,
-  RUN_IN_RULE_REF_EXPECT,
-  RUN_TARGET_REF_EXPECT,
-  validateRef,
-  WORKFLOW_REF_EXPECT,
-} from "./validate-ref-resolution";
-import {
-  validatePromptString,
-  validateLogString,
-  validateFailString,
-  validateReturnString,
-  validateJaiphStringContent,
-  validateSimpleInterpolationIdentifiers,
-  extractInlineCaptures,
-  extractDotFieldRefs,
-} from "./validate-string";
-import { validatePromptReturnsSchema, validatePromptStepReturns } from "./validate-prompt-schema";
-import { dedentCommonLeadingWhitespace } from "../parse/dedent";
-import { matchSendOperator } from "../parse/core";
-import { tripleQuotedRawForRuntime } from "../runtime/orchestration-text";
-
-export interface ValidateContext {
-  resolveImportPath: (fromFile: string, importPath: string, workspaceRoot?: string) => string;
-  existsSync: (path: string) => boolean;
-  readFile: (path: string) => string;
-  parse: (content: string, filePath: string) => jaiphModule;
-  workspaceRoot?: string;
-}
+  parseSchemaFieldNames,
+  resolveRouteTargetParams,
+  ROUTE_REF_EXPECT,
+  RULE_SCOPE,
+  validateStep,
+  WORKFLOW_SCOPE,
+  type ValidatorCtx,
+} from "./validate-step";
 
-/** True when `<-` appears outside quotes (same idea as `matchSendOperator`). */
-function hasUnquotedSendArrow(line: string): boolean {
-  let inSingleQuote = false;
-  let inDoubleQuote = false;
-  for (let i = 0; i < line.length; i += 1) {
-    const ch = line[i];
-    if (ch === "\\" && (inDoubleQuote || inSingleQuote)) {
-      i += 1;
-      continue;
-    }
-    if (ch === "'" && !inDoubleQuote) {
-      inSingleQuote = !inSingleQuote;
-      continue;
-    }
-    if (ch === '"' && !inSingleQuote) {
-      inDoubleQuote = !inDoubleQuote;
-      continue;
-    }
-    if (!inSingleQuote && !inDoubleQuote && ch === "<" && line[i + 1] === "-") {
-      return true;
-    }
-  }
-  return false;
+/**
+ * One step entry in the flat list built by the single workflow walk.
+ *
+ * `recoverBindings` is the `Set` of failure-binding names contributed by an
+ * enclosing `catch` / `recover`, threaded down so steps inside a recovery
+ * body can resolve `<failure>` as an in-scope identifier.
+ */
+interface FlatStepEntry {
+  step: WorkflowStepDef;
+  recoverBindings: Set<string> | undefined;
 }
 
-/** Check if args contain unquoted shell redirection operators (>, >>, |, &). */
-function hasShellRedirection(args: string): boolean {
-  let inQuote = false;
-  for (let i = 0; i < args.length; i++) {
-    const ch = args[i];
-    if (ch === '"' && (i === 0 || args[i - 1] !== "\\")) {
-      inQuote = !inQuote;
-      continue;
-    }
-    if (!inQuote && (ch === ">" || ch === "|" || ch === "&")) {
-      return true;
-    }
-  }
-  return false;
+/**
+ * Result of the single recursive descent over a workflow's / rule's step
+ * tree: the global identifier set (envDecls + params + every nested const /
+ * capture / for-iterator), the top-level prompt schemas, and a flat list of
+ * every step in tree order. The flat list is what the main validator loop
+ * iterates over — that loop is non-recursive, so the only recursive helper
+ * walking `WorkflowStepDef[]` in this file is `walkStepTree` itself.
+ */
+interface StepTreeWalk {
+  knownVars: Set<string>;
+  promptSchemas: Map<string, string[]>;
+  flat: FlatStepEntry[];
 }
 
-function validateNoShellRedirection(
+function walkStepTree(
+  diag: Diagnostics,
   filePath: string,
-  loc: { line: number; col: number },
-  keyword: string,
-  args: string | undefined,
-): void {
-  if (!args || !hasShellRedirection(args)) return;
-  throw jaiphError(
-    filePath,
-    loc.line,
-    loc.col,
-    "E_VALIDATE",
-    `shell redirection (>, >>, |, &) is not supported with ${keyword}; use a script block for shell operations`,
-  );
-}
-
-function validateMatchExpr(filePath: string, expr: MatchExprDef, knownVars: Set<string>): void {
-  if (expr.arms.length === 0) {
-    throw jaiphError(filePath, expr.loc.line, expr.loc.col, "E_VALIDATE", "match must have at least one arm");
-  }
-  let wildcardCount = 0;
-  for (const arm of expr.arms) {
-    if (arm.pattern.kind === "wildcard") {
-      wildcardCount += 1;
-    }
-    if (arm.pattern.kind === "regex") {
-      try {
-        new RegExp(arm.pattern.source);
-      } catch {
-        throw jaiphError(
-          filePath,
-          expr.loc.line,
-          expr.loc.col,
-          "E_VALIDATE",
-          `invalid regex in match pattern: /${arm.pattern.source}/`,
-        );
-      }
-    }
-    // Reject `return` as the leading token of an arm body.
-    const bodyTrimmed = (arm.tripleQuotedBody ? tripleQuotedRawForRuntime(arm.body) : arm.body).trimStart();
-    if (/^return(\s|$)/.test(bodyTrimmed)) {
-      throw jaiphError(
-        filePath,
-        expr.loc.line,
-        expr.loc.col,
-        "E_VALIDATE",
-        `match arm body must not start with "return"; the match expression itself produces the value — use the expression directly after =>`,
-      );
-    }
-    // Reject inline script forms in arm bodies (backtick `…`() or fenced ```…```()).
-    if (/`[^`]*`\s*\(/.test(bodyTrimmed) || bodyTrimmed.startsWith("```")) {
-      throw jaiphError(
-        filePath,
-        expr.loc.line,
-        expr.loc.col,
-        "E_VALIDATE",
-        `inline scripts are not allowed in match arm bodies; use a named script with "run script_name(…)" instead`,
-      );
-    }
-    // Reject unknown verbs, bare function-call forms, and bare unknown identifiers in arm bodies.
-    // Allowed bodies: string literal ("..." or """..."""), $var/${var},
-    // bare in-scope identifier (param/const/capture), or a verb call: fail "...", run ref(...), ensure ref(...).
-    // A bare identifier followed by space+content (e.g. `error "msg"`) or by `(` (e.g. `error("msg")`)
-    // is a programming mistake — most likely a typo for `fail`. A bare identifier not in scope
-    // (e.g. `true`, `blorp`) is also rejected. Skip the check for triple-quoted bodies since those are literal text.
-    if (!arm.tripleQuotedBody) {
-      const idMatch = bodyTrimmed.match(/^([A-Za-z_][A-Za-z0-9_]*)/);
-      if (idMatch) {
-        const ident = idMatch[1]!;
-        const after = bodyTrimmed.slice(ident.length);
-        const startsCall = after.startsWith("(");
-        const startsArgs = /^\s+\S/.test(after);
-        if ((startsCall || startsArgs) && ident !== "fail" && ident !== "run" && ident !== "ensure") {
-          const hint = ident === "error" ? ` did you mean "fail"?` : "";
-          throw jaiphError(
-            filePath,
-            expr.loc.line,
-            expr.loc.col,
-            "E_VALIDATE",
-            `unknown match arm verb "${ident}"; allowed: fail "...", run ref(...), ensure ref(...).${hint}`,
-          );
-        }
-        // Reject bare unknown identifiers (e.g. `_ => true`, `_ => blorp`).
-        // Only bare words with no trailing content reach here — valid ones
-        // must be in-scope variables (params, consts, captures).
-        if (!startsCall && !startsArgs && after.trim() === "" && !knownVars.has(ident)) {
-          throw jaiphError(
-            filePath,
-            expr.loc.line,
-            expr.loc.col,
-            "E_VALIDATE",
-            `unknown identifier "${ident}" in match arm body; declare it with "const", use a capture, or add a parameter`,
-          );
-        }
-      }
-    }
-  }
-  if (wildcardCount === 0) {
-    throw jaiphError(filePath, expr.loc.line, expr.loc.col, "E_VALIDATE", "match must have exactly one wildcard (_) arm");
-  }
-  if (wildcardCount > 1) {
-    throw jaiphError(filePath, expr.loc.line, expr.loc.col, "E_VALIDATE", "match must have exactly one wildcard (_) arm, found multiple");
-  }
-}
+  steps: WorkflowStepDef[],
+  envDecls: { name: string; loc: { line: number; col: number } }[] | undefined,
+  params: string[],
+  declLoc: { line: number; col: number },
+  moduleScripts: Set<string>,
+  options: { withPromptSchemas: boolean },
+): StepTreeWalk {
+  const knownVars = new Set<string>();
+  const promptSchemas = new Map<string, string[]>();
+  const flat: FlatStepEntry[] = [];
 
-/** Collect all variable names defined in a step list (consts, captures, params). Flat walk — includes nested if/else blocks. */
-function collectKnownVars(steps: WorkflowStepDef[], envDecls?: { name: string }[], params?: string[]): Set<string> {
-  const vars = new Set<string>();
   if (envDecls) {
-    for (const d of envDecls) vars.add(d.name);
-  }
-  for (const p of params ?? []) {
-    vars.add(p);
+    for (const d of envDecls) knownVars.add(d.name);
   }
-  const walk = (ss: WorkflowStepDef[]): void => {
-    for (const s of ss) {
-      if (s.type === "const") {
-        vars.add(s.name);
-      }
-      if ((s.type === "ensure" || s.type === "run" || s.type === "prompt" || s.type === "run_inline_script") && s.captureName) {
-        vars.add(s.captureName);
-      }
-      if ((s.type === "ensure" || s.type === "run") && s.catch) {
-        const recoverSteps = "single" in s.catch ? [s.catch.single] : s.catch.block;
-        walk(recoverSteps);
-      }
-      if (s.type === "if") {
-        walk(s.body);
-      }
-      if (s.type === "for_lines") {
-        vars.add(s.iterVar);
-        walk(s.body);
-      }
-    }
-  };
-  walk(steps);
-  return vars;
-}
+  for (const p of params) knownVars.add(p);
 
-/** Validate that no immutable binding (param, const, capture) is redefined in the same scope. */
-function validateImmutableBindings(
-  filePath: string,
-  steps: WorkflowStepDef[],
-  params: string[],
-  declLoc: { line: number; col: number },
-  envDecls?: { name: string; loc: { line: number; col: number } }[],
-  moduleScripts?: Set<string>,
-): void {
-  // Map from name → { kind, line } for the first binding site.
-  const bound = new Map<string, { kind: string; line: number }>();
+  const seedBindings = new Map<string, { kind: string; line: number }>();
   for (const p of params) {
-    bound.set(p, { kind: "parameter", line: declLoc.line });
+    seedBindings.set(p, { kind: "parameter", line: declLoc.line });
   }
 
-  const check = (name: string, kind: string, loc: { line: number; col: number }, b: Map<string, { kind: string; line: number }>): void => {
+  const checkBinding = (
+    name: string,
+    kind: string,
+    loc: { line: number; col: number },
+    b: Map<string, { kind: string; line: number }>,
+  ): void => {
     const prev = b.get(name);
     if (prev) {
-      throw jaiphError(
+      diag.error(
         filePath,
         loc.line,
         loc.col,
@@ -242,8 +80,8 @@ function validateImmutableBindings(
         `cannot rebind immutable name "${name}"; already bound as ${prev.kind} at ${filePath}:${prev.line}`,
       );
     }
-    if (moduleScripts?.has(name)) {
-      throw jaiphError(
+    if (moduleScripts.has(name)) {
+      diag.error(
         filePath,
         loc.line,
         loc.col,
@@ -254,30 +92,56 @@ function validateImmutableBindings(
     b.set(name, { kind, line: loc.line });
   };
 
-  const walk = (ss: WorkflowStepDef[], b: Map<string, { kind: string; line: number }>): void => {
+  const descend = (
+    ss: WorkflowStepDef[],
+    bindings: Map<string, { kind: string; line: number }>,
+    recoverBindings: Set<string> | undefined,
+    topLevel: boolean,
+  ): void => {
     for (const s of ss) {
+      flat.push({ step: s, recoverBindings });
+
       if (s.type === "const") {
-        check(s.name, "const", s.loc, b);
-      }
-      if (s.type === "ensure" && s.captureName) {
-        check(s.captureName, "capture", s.ref.loc, b);
-      }
-      if (s.type === "run" && s.captureName) {
-        check(s.captureName, "capture", s.workflow.loc, b);
-      }
-      if ((s.type === "prompt" || s.type === "run_inline_script") && s.captureName) {
-        check(s.captureName, "capture", s.loc, b);
+        knownVars.add(s.name);
+        checkBinding(s.name, "const", s.loc, bindings);
+        if (options.withPromptSchemas && topLevel && s.value.kind === "prompt" && s.value.returns !== undefined) {
+          promptSchemas.set(s.name, parseSchemaFieldNames(s.value.returns));
+        }
+        continue;
       }
-      if ((s.type === "ensure" || s.type === "run") && s.catch) {
-        const recoverSteps = "single" in s.catch ? [s.catch.single] : s.catch.block;
-        walk(recoverSteps, b);
+
+      if (s.type === "exec") {
+        if (s.captureName) {
+          knownVars.add(s.captureName);
+          const captureLoc = execBodyLoc(s.body) ?? s.loc;
+          checkBinding(s.captureName, "capture", captureLoc, bindings);
+          if (options.withPromptSchemas && topLevel && s.body.kind === "prompt" && s.body.returns !== undefined) {
+            promptSchemas.set(s.captureName, parseSchemaFieldNames(s.body.returns));
+          }
+        }
+        if (s.catch) {
+          const catchSteps = "single" in s.catch ? [s.catch.single] : s.catch.block;
+          descend(catchSteps, bindings, new Set([s.catch.bindings.failure]), false);
+        }
+        if (s.recover) {
+          const recoverSteps = "single" in s.recover ? [s.recover.single] : s.recover.block;
+          descend(recoverSteps, bindings, new Set([s.recover.bindings.failure]), false);
+        }
+        continue;
       }
+
       if (s.type === "if") {
-        walk(s.body, b);
+        descend(s.body, bindings, recoverBindings, false);
+        if (s.elseBody) {
+          descend(s.elseBody, bindings, recoverBindings, false);
+        }
+        continue;
       }
+
       if (s.type === "for_lines") {
-        if (b.has(s.iterVar)) {
-          throw jaiphError(
+        knownVars.add(s.iterVar);
+        if (bindings.has(s.iterVar)) {
+          diag.error(
             filePath,
             s.loc.line,
             s.loc.col,
@@ -285,214 +149,67 @@ function validateImmutableBindings(
             `for loop iterator "${s.iterVar}" conflicts with an existing binding`,
           );
         }
-        const inner = new Map(b);
+        const inner = new Map(bindings);
         inner.set(s.iterVar, { kind: "loop_iterator", line: s.loc.line });
-        walk(s.body, inner);
+        descend(s.body, inner, recoverBindings, false);
+        continue;
       }
     }
   };
-  walk(steps, bound);
-}
 
-/** Count the number of call arguments from a space-separated args string (respects quotes). */
-function countCallArgs(argsStr: string | undefined): number {
-  if (!argsStr || !argsStr.trim()) return 0;
-  let count = 0;
-  let inQuote: string | null = null;
-  let hasContent = false;
-  for (let i = 0; i < argsStr.length; i++) {
-    const ch = argsStr[i];
-    if (inQuote) {
-      hasContent = true;
-      if (ch === inQuote && argsStr[i - 1] !== "\\") inQuote = null;
-    } else if (ch === '"' || ch === "'") {
-      hasContent = true;
-      inQuote = ch;
-    } else if (ch === " " || ch === "\t") {
-      if (hasContent) { count++; hasContent = false; }
-    } else {
-      hasContent = true;
-    }
-  }
-  if (hasContent) count++;
-  return count;
+  descend(steps, seedBindings, undefined, true);
+  return { knownVars, promptSchemas, flat };
 }
 
-/** Look up declared params for a workflow or rule target. Returns undefined if target has no declared params. */
-function lookupCalleeParams(
-  ref: string,
-  targetKind: "workflow" | "rule",
-  ast: jaiphModule,
-  refCtx: RefResolutionContext,
-): string[] | undefined {
-  const parts = ref.split(".");
-  if (parts.length === 1) {
-    const name = parts[0];
-    if (targetKind === "workflow") {
-      const wf = ast.workflows.find((w) => w.name === name);
-      return wf?.params;
-    }
-    const rl = ast.rules.find((r) => r.name === name);
-    return rl?.params;
-  }
-  if (parts.length === 2) {
-    const [alias, name] = parts;
-    const importedFile = refCtx.importsByAlias.get(alias);
-    if (!importedFile) return undefined;
-    const importedAst = refCtx.importedAstCache.get(importedFile);
-    if (!importedAst) return undefined;
-    if (targetKind === "workflow") {
-      const wf = importedAst.workflows.find((w) => w.name === name);
-      return wf?.params;
-    }
-    const rl = importedAst.rules.find((r) => r.name === name);
-    return rl?.params;
-  }
+/** Best-effort location for an exec body — used to attribute capture-binding errors. */
+function execBodyLoc(body: Expr): { line: number; col: number } | undefined {
+  if (body.kind === "call" || body.kind === "ensure_call") return body.callee.loc;
+  if (body.kind === "prompt" || body.kind === "shell") return body.loc;
+  if (body.kind === "match") return body.match.loc;
   return undefined;
 }
 
-/** Validate arity: if the callee declares named params, the call must supply exactly that many args. */
-function validateArity(
-  filePath: string,
-  loc: { line: number; col: number },
-  ref: string,
-  args: string | undefined,
-  targetKind: "workflow" | "rule",
-  ast: jaiphModule,
-  refCtx: RefResolutionContext,
-): void {
-  const params = lookupCalleeParams(ref, targetKind, ast, refCtx);
-  if (params === undefined) return; // callee not a workflow/rule in scope — skip
-  const argCount = countCallArgs(args);
-  if (argCount !== params.length) {
-    throw jaiphError(
-      filePath,
-      loc.line,
-      loc.col,
-      "E_VALIDATE",
-      `${targetKind} "${ref}" expects ${params.length} argument(s) (${params.join(", ") || "none"}), but got ${argCount}`,
-    );
-  }
+export function resolveScriptImportPath(fromFile: string, importPath: string): string {
+  return resolve(dirname(fromFile), importPath);
 }
 
-
-/** Validate bare identifier args against known variables. */
-function validateBareIdentifierArgs(
-  filePath: string,
-  loc: { line: number; col: number },
-  bareIdentifierArgs: string[] | undefined,
-  knownVars: Set<string>,
-  /** Extra variable names from `ensure … recover` bindings. */
-  recoverBindings?: Set<string>,
-): void {
-  if (!bareIdentifierArgs) return;
-  for (const name of bareIdentifierArgs) {
-    if (recoverBindings?.has(name)) {
-      continue;
-    }
-    if (!knownVars.has(name)) {
-      throw jaiphError(
-        filePath,
-        loc.line,
-        loc.col,
-        "E_VALIDATE",
-        `unknown identifier "${name}" used as bare argument; declare it with "const", use a capture, or add a workflow/rule parameter`,
-      );
-    }
-  }
+/**
+ * Legacy throwing entry. Builds a `Diagnostics` collector internally and
+ * throws the first sorted diagnostic via `jaiphError` so existing callers
+ * (and per-error tests) continue to see one error per failed compile.
+ *
+ * Use {@link collectDiagnostics} when you want the full set.
+ */
+export function validateReferences(graph: ModuleGraph): void {
+  const diag = collectDiagnostics(graph);
+  diag.throwFirstIfAny();
 }
 
-function stripQuotedArgContent(args: string): string {
-  let out = "";
-  let quote: "'" | '"' | null = null;
-  for (let i = 0; i < args.length; i += 1) {
-    const ch = args[i]!;
-    if (quote) {
-      if (ch === quote && args[i - 1] !== "\\") {
-        quote = null;
-      }
-      out += " ";
-      continue;
-    }
-    if (ch === "'" || ch === '"') {
-      quote = ch;
-      out += " ";
-      continue;
-    }
-    out += ch;
+/**
+ * New entry: walk the graph and append every validation error into a fresh
+ * `Diagnostics`. Never throws on user-level validation errors — non-validator
+ * problems (internal bugs) still bubble up.
+ */
+export function collectDiagnostics(graph: ModuleGraph): Diagnostics {
+  const diag = new Diagnostics();
+  for (const node of graph.modules.values()) {
+    validateModuleInto(node.ast, graph, diag);
   }
-  return out;
+  return diag;
 }
 
-function validateNestedManagedCallArgs(
-  filePath: string,
-  loc: { line: number; col: number },
-  args: string | undefined,
-): void {
-  if (!args) return;
-  const stripped = stripQuotedArgContent(args);
-  const re = /\b([A-Za-z_][A-Za-z0-9_.]*)\s*\(/g;
-  let match: RegExpExecArray | null;
-  while ((match = re.exec(stripped)) !== null) {
-    const before = stripped.slice(0, match.index).trimEnd();
-    const lastToken = before.length === 0 ? "" : before.slice(before.lastIndexOf(" ") + 1);
-    if (lastToken === "run" || lastToken === "ensure") {
-      continue;
-    }
-    throw jaiphError(
-      filePath,
-      loc.line,
-      loc.col,
-      "E_VALIDATE",
-      `nested managed calls in argument position must be explicit; use "run ${match[1]}(...)" or "ensure ${match[1]}(...)" inside the argument list`,
-    );
-  }
-  // Detect bare inline script calls: `body`() without preceding run/ensure
-  const btRe = /`[^`]*`\s*\(/g;
-  let btMatch: RegExpExecArray | null;
-  while ((btMatch = btRe.exec(stripped)) !== null) {
-    const before = stripped.slice(0, btMatch.index).trimEnd();
-    const lastToken = before.length === 0 ? "" : before.slice(before.lastIndexOf(" ") + 1);
-    if (lastToken === "run" || lastToken === "ensure") {
-      continue;
-    }
-    throw jaiphError(
-      filePath,
-      loc.line,
-      loc.col,
-      "E_VALIDATE",
-      `nested inline script calls in argument position must be explicit; use "run \`...\`(...)" inside the argument list`,
-    );
-  }
+/** Legacy throwing per-module wrapper (kept for `emitScriptsForModuleFromGraph`). */
+export function validateModule(ast: jaiphModule, graph: ModuleGraph): void {
+  const diag = new Diagnostics();
+  validateModuleInto(ast, graph, diag);
+  diag.throwFirstIfAny();
 }
 
-/** Resolve a route target workflow ref to its declared parameter count. Returns undefined if unresolvable. */
-function resolveRouteTargetParams(
-  ref: string,
+export function validateModuleInto(
   ast: jaiphModule,
-  refCtx: RefResolutionContext,
-): number | undefined {
-  const dotIdx = ref.indexOf(".");
-  if (dotIdx >= 0) {
-    const alias = ref.slice(0, dotIdx);
-    const name = ref.slice(dotIdx + 1);
-    const importPath = refCtx.importsByAlias.get(alias);
-    if (!importPath) return undefined;
-    const importedAst = refCtx.importedAstCache.get(importPath);
-    if (!importedAst) return undefined;
-    const wf = importedAst.workflows.find((w) => w.name === name);
-    return wf?.params.length;
-  }
-  const wf = ast.workflows.find((w) => w.name === ref);
-  return wf?.params.length;
-}
-
-/** Resolve a script import path relative to the importing file's directory. */
-export function resolveScriptImportPath(fromFile: string, importPath: string): string {
-  return resolve(dirname(fromFile), importPath);
-}
-
-export function validateReferences(ast: jaiphModule, ctx: ValidateContext): void {
+  graph: ModuleGraph,
+  diag: Diagnostics,
+): void {
   const localChannels = new Set(ast.channels.map((c) => c.name));
   const localRules = new Set(ast.rules.map((r) => r.name));
   const localWorkflows = new Set(ast.workflows.map((w) => w.name));
@@ -500,497 +217,115 @@ export function validateReferences(ast: jaiphModule, ctx: ValidateContext): void
   const importsByAlias = new Map<string, string>();
   const importedAstCache = new Map<string, jaiphModule>();
 
-  // Validate script imports: resolve paths and check existence.
   if (ast.scriptImports) {
     for (const si of ast.scriptImports) {
-      const resolved = resolveScriptImportPath(ast.filePath, si.path);
-      if (!ctx.existsSync(resolved)) {
-        throw jaiphError(
-          ast.filePath,
-          si.loc.line,
-          si.loc.col,
-          "E_IMPORT_NOT_FOUND",
-          `import script "${si.alias}" resolves to missing file "${resolved}"`,
-        );
-      }
-      localScripts.add(si.alias);
+      diag.capture(() => {
+        const resolved = resolveScriptImportPath(ast.filePath, si.path);
+        if (!existsSync(resolved)) {
+          diag.error(
+            ast.filePath,
+            si.loc.line,
+            si.loc.col,
+            "E_IMPORT_NOT_FOUND",
+            `import script "${si.alias}" resolves to missing file "${resolved}"`,
+          );
+        }
+        localScripts.add(si.alias);
+      });
     }
   }
 
+  const node = graph.modules.get(ast.filePath);
   for (const imp of ast.imports) {
-    if (importsByAlias.has(imp.alias)) {
-      throw jaiphError(
-        ast.filePath,
-        imp.loc.line,
-        imp.loc.col,
-        "E_VALIDATE",
-        `duplicate import alias "${imp.alias}"`,
-      );
-    }
-    const resolved = ctx.resolveImportPath(ast.filePath, imp.path, ctx.workspaceRoot);
-    importsByAlias.set(imp.alias, resolved);
-    if (!ctx.existsSync(resolved)) {
-      throw jaiphError(
-        ast.filePath,
-        imp.loc.line,
-        imp.loc.col,
-        "E_IMPORT_NOT_FOUND",
-        `import "${imp.alias}" resolves to missing file "${resolved}"`,
-      );
-    }
-    importedAstCache.set(resolved, ctx.parse(ctx.readFile(resolved), resolved));
-  }
-
-  const refCtx: RefResolutionContext = {
-    importsByAlias,
-    importedAstCache,
-    localRules,
-    localWorkflows,
-    localScripts,
-  };
-
-  const expectRuleRef = { mode: "expect" as const, expect: RULE_REF_EXPECT };
-  const expectWorkflowRef = { mode: "expect" as const, expect: WORKFLOW_REF_EXPECT };
-  const expectRunInRuleRef = { mode: "expect" as const, expect: RUN_IN_RULE_REF_EXPECT };
-  const expectRunTargetRef = { mode: "expect" as const, expect: RUN_TARGET_REF_EXPECT };
-
-  const lookupImportedKind = (alias: string, name: string): RefTargetKind | undefined => {
-    const importedFile = importsByAlias.get(alias);
-    if (!importedFile) return undefined;
-    const importedAst = importedAstCache.get(importedFile)!;
-    return lookupKind(importedAst, name);
-  };
-
-  const bareSendRefSpec = {
-    mode: "bare_send_rhs" as const,
-    bareSend: BARE_SEND_REF_MSG,
-    lookupImportedKind,
-  };
-
-  const makeSubEnv = (loc: { line: number; col: number }): SubstitutionValidateEnv => ({
-    filePath: ast.filePath,
-    loc,
-    localRules,
-    localWorkflows,
-    localScripts,
-    importsByAlias,
-    lookupImported: lookupImportedKind,
-  });
-
-  const stripDQ = (s: string): string =>
-    s.length >= 2 && s[0] === '"' && s[s.length - 1] === '"' ? s.slice(1, -1) : s;
-
-  /**
-   * Detect `const x = scriptName` and its parser sugar form `const x = "${scriptName}"`.
-   * Both should report the same domain error ("scripts are not values").
-   */
-  const extractConstScriptName = (rhs: string): string | undefined => {
-    const trimmed = rhs.trim();
-    if (/^[a-zA-Z_][a-zA-Z0-9_]*$/.test(trimmed)) return trimmed;
-    const inner = stripDQ(trimmed);
-    const m = inner.match(/^\$\{([a-zA-Z_][a-zA-Z0-9_]*)\}$/);
-    return m?.[1];
-  };
-
-  /** Inner string for validation: same margin removal as runtime for `"""` orchestration text. */
-  const semanticQuotedOrchestrationInner = (dqRaw: string, tripleQuoted: boolean): string => {
-    if (!tripleQuoted) return stripDQ(dqRaw);
-    return stripDQ(tripleQuotedRawForRuntime(dqRaw));
-  };
-
-  /** Parse field names from a returns schema string like '{ name: string, age: number }'. */
-  const parseSchemaFieldNames = (rawSchema: string): string[] => {
-    const inner = rawSchema.trim().replace(/^\s*\{\s*/, "").replace(/\s*\}\s*$/, "").trim();
-    if (!inner) return [];
-    const names: string[] = [];
-    for (const part of inner.split(",")) {
-      const m = part.trim().match(/^\s*([A-Za-z_][A-Za-z0-9_]*)\s*:\s*\S+\s*$/);
-      if (m) names.push(m[1]);
-    }
-    return names;
-  };
-
-  /** Collect prompt capture schemas from all steps in a workflow (pre-pass). */
-  const collectPromptSchemas = (steps: WorkflowStepDef[]): Map<string, string[]> => {
-    const schemas = new Map<string, string[]>();
-    for (const s of steps) {
-      if (s.type === "prompt" && s.captureName && s.returns !== undefined) {
-        schemas.set(s.captureName, parseSchemaFieldNames(s.returns));
-      }
-      if (s.type === "const" && s.value.kind === "prompt_capture" && s.value.returns !== undefined) {
-        schemas.set(s.name, parseSchemaFieldNames(s.value.returns));
-      }
-    }
-    return schemas;
-  };
-
-  /** Validate ${var.field} references against known prompt schemas. */
-  const validateDotFieldRefs = (
-    content: string,
-    loc: { line: number; col: number },
-    promptSchemas: Map<string, string[]>,
-  ): void => {
-    for (const ref of extractDotFieldRefs(content)) {
-      const fields = promptSchemas.get(ref.varName);
-      if (!fields) {
-        throw jaiphError(
-          ast.filePath,
-          loc.line,
-          loc.col,
-          "E_VALIDATE",
-          `\${${ref.varName}.${ref.fieldName}}: "${ref.varName}" is not a typed prompt capture; dot notation requires a prompt with "returns" schema`,
-        );
-      }
-      if (!fields.includes(ref.fieldName)) {
-        throw jaiphError(
+    diag.capture(() => {
+      if (importsByAlias.has(imp.alias)) {
+        diag.error(
           ast.filePath,
-          loc.line,
-          loc.col,
+          imp.loc.line,
+          imp.loc.col,
           "E_VALIDATE",
-          `\${${ref.varName}.${ref.fieldName}}: field "${ref.fieldName}" is not defined in the returns schema for "${ref.varName}"; available fields: ${fields.join(", ")}`,
-        );
-      }
-    }
-  };
-
-  const validateWorkflowStringCaptures = (content: string, loc: { line: number; col: number }): void => {
-    for (const cap of extractInlineCaptures(content)) {
-      if (cap.kind === "run") {
-        validateNoShellRedirection(ast.filePath, loc, "run", cap.args);
-        validateRef({ value: cap.ref, loc }, ast, refCtx, expectRunTargetRef);
-      } else {
-        validateNoShellRedirection(ast.filePath, loc, "ensure", cap.args);
-        validateRef({ value: cap.ref, loc }, ast, refCtx, expectRuleRef);
-      }
-    }
-  };
-
-  const validateRuleStringCaptures = (content: string, loc: { line: number; col: number }): void => {
-    for (const cap of extractInlineCaptures(content)) {
-      if (cap.kind === "run") {
-        validateNoShellRedirection(ast.filePath, loc, "run", cap.args);
-        validateRef({ value: cap.ref, loc }, ast, refCtx, expectRunInRuleRef);
-      } else {
-        validateNoShellRedirection(ast.filePath, loc, "ensure", cap.args);
-        validateRef({ value: cap.ref, loc }, ast, refCtx, expectRuleRef);
-      }
-    }
-  };
-
-  for (const rule of ast.rules) {
-    validateImmutableBindings(ast.filePath, rule.steps, rule.params, rule.loc, ast.envDecls, localScripts);
-    const ruleKnownVars = collectKnownVars(rule.steps, ast.envDecls, rule.params);
-    // Named params are validated via knownVars; positional argN access was removed.
-    const validateRuleStep = (s: WorkflowStepDef): void => {
-      if (s.type === "prompt" || s.type === "send") {
-        throw jaiphError(
-          ast.filePath,
-          s.loc.line,
-          s.loc.col,
-          "E_VALIDATE",
-          `${s.type} is not allowed in rules`,
-        );
-      }
-      if (s.type === "comment" || s.type === "blank_line") {
-        return;
-      }
-      if (s.type === "ensure") {
-        validateNoShellRedirection(ast.filePath, s.ref.loc, "ensure", s.args);
-        validateNestedManagedCallArgs(ast.filePath, s.ref.loc, s.args);
-        validateRef(s.ref, ast, refCtx, expectRuleRef);
-        validateArity(ast.filePath, s.ref.loc, s.ref.value, s.args, "rule", ast, refCtx);
-
-        validateBareIdentifierArgs(ast.filePath, s.ref.loc, s.bareIdentifierArgs, ruleKnownVars);
-        if (s.catch) {
-          const steps = "single" in s.catch ? [s.catch.single] : s.catch.block;
-          const rb = new Set<string>();
-          rb.add(s.catch.bindings.failure);
-          for (const r of steps) validateRuleStep(r);
-        }
-        return;
-      }
-      if (s.type === "run") {
-        validateNoShellRedirection(ast.filePath, s.workflow.loc, "run", s.args);
-        validateNestedManagedCallArgs(ast.filePath, s.workflow.loc, s.args);
-        if (s.async) {
-          throw jaiphError(
-            ast.filePath,
-            s.workflow.loc.line,
-            s.workflow.loc.col,
-            "E_VALIDATE",
-            "run async is not allowed in rules; use it in workflows only",
-          );
-        }
-        if (!s.workflow.value.includes(".") && ruleKnownVars.has(s.workflow.value) && !localScripts.has(s.workflow.value)) {
-          throw jaiphError(ast.filePath, s.workflow.loc.line, s.workflow.loc.col, "E_VALIDATE", `strings are not executable; "${s.workflow.value}" is a string — use a script instead`);
-        }
-        validateRef(s.workflow, ast, refCtx, expectRunInRuleRef);
-        validateArity(ast.filePath, s.workflow.loc, s.workflow.value, s.args, "workflow", ast, refCtx);
-
-        validateBareIdentifierArgs(ast.filePath, s.workflow.loc, s.bareIdentifierArgs, ruleKnownVars);
-        if (s.catch) {
-          const steps = "single" in s.catch ? [s.catch.single] : s.catch.block;
-          const rb = new Set<string>();
-          rb.add(s.catch.bindings.failure);
-          for (const r of steps) validateRuleStep(r);
-        }
-        if (s.recover) {
-          const steps = "single" in s.recover ? [s.recover.single] : s.recover.block;
-          const rb = new Set<string>();
-          rb.add(s.recover.bindings.failure);
-          for (const r of steps) validateRuleStep(r);
-        }
-        return;
-      }
-      if (s.type === "fail") {
-        validateFailString(s.message, ast.filePath, s.loc.line, s.loc.col, { tripleQuoted: s.tripleQuoted });
-        const failInner = semanticQuotedOrchestrationInner(s.message, s.tripleQuoted === true);
-        validateRuleStringCaptures(failInner, s.loc);
-        validateSimpleInterpolationIdentifiers(
-          failInner,
-          ast.filePath,
-          s.loc.line,
-          s.loc.col,
-          "fail",
-          ruleKnownVars,
-          "rule",
-          undefined,
-          undefined,
-          localScripts,
+          `duplicate import alias "${imp.alias}"`,
         );
-        return;
       }
-      if (s.type === "log") {
-        if (s.managed?.kind === "run_inline_script") return; // inline script — no ref to validate
-        validateLogString(s.message, ast.filePath, s.loc.line, s.loc.col, "log", { tripleQuoted: s.tripleQuoted });
-        const logRuleInner = s.tripleQuoted ? dedentCommonLeadingWhitespace(s.message) : s.message;
-        validateRuleStringCaptures(logRuleInner, s.loc);
-        validateSimpleInterpolationIdentifiers(
-          logRuleInner,
+      const resolved = node?.imports.get(imp.alias);
+      if (!resolved) {
+        diag.error(
           ast.filePath,
-          s.loc.line,
-          s.loc.col,
-          "log",
-          ruleKnownVars,
-          "rule",
-          undefined,
-          undefined,
-          localScripts,
+          imp.loc.line,
+          imp.loc.col,
+          "E_IMPORT_NOT_FOUND",
+          `import "${imp.alias}" could not be resolved`,
         );
-        return;
       }
-      if (s.type === "logerr") {
-        if (s.managed?.kind === "run_inline_script") return; // inline script — no ref to validate
-        validateLogString(s.message, ast.filePath, s.loc.line, s.loc.col, "logerr", {
-          tripleQuoted: s.tripleQuoted,
-        });
-        const logerrRuleInner = s.tripleQuoted ? dedentCommonLeadingWhitespace(s.message) : s.message;
-        validateRuleStringCaptures(logerrRuleInner, s.loc);
-        validateSimpleInterpolationIdentifiers(
-          logerrRuleInner,
+      importsByAlias.set(imp.alias, resolved);
+      const importedAst = graph.modules.get(resolved)?.ast;
+      if (!importedAst) {
+        diag.error(
           ast.filePath,
-          s.loc.line,
-          s.loc.col,
-          "logerr",
-          ruleKnownVars,
-          "rule",
-          undefined,
-          undefined,
-          localScripts,
+          imp.loc.line,
+          imp.loc.col,
+          "E_IMPORT_NOT_FOUND",
+          `import "${imp.alias}" resolves to missing file "${resolved}"`,
         );
-        return;
-      }
-      if (s.type === "return") {
-        if (s.managed) {
-          if (s.managed.kind === "run") {
-            validateNoShellRedirection(ast.filePath, s.managed.ref.loc, "run", s.managed.args);
-            validateNestedManagedCallArgs(ast.filePath, s.managed.ref.loc, s.managed.args);
-            validateRef(s.managed.ref, ast, refCtx, expectRunInRuleRef);
-            validateArity(ast.filePath, s.managed.ref.loc, s.managed.ref.value, s.managed.args, "workflow", ast, refCtx);
-
-            validateBareIdentifierArgs(ast.filePath, s.managed.ref.loc, s.managed.bareIdentifierArgs, ruleKnownVars);
-          } else if (s.managed.kind === "ensure") {
-            validateNoShellRedirection(ast.filePath, s.managed.ref.loc, "ensure", s.managed.args);
-            validateNestedManagedCallArgs(ast.filePath, s.managed.ref.loc, s.managed.args);
-            validateRef(s.managed.ref, ast, refCtx, expectRuleRef);
-            validateArity(ast.filePath, s.managed.ref.loc, s.managed.ref.value, s.managed.args, "rule", ast, refCtx);
-
-            validateBareIdentifierArgs(ast.filePath, s.managed.ref.loc, s.managed.bareIdentifierArgs, ruleKnownVars);
-          } else if (s.managed.kind === "match") {
-            validateMatchExpr(ast.filePath, s.managed.match, ruleKnownVars);
-          }
-          // run_inline_script — no ref to validate
-        } else {
-          validateReturnString(s.value, ast.filePath, s.loc.line, s.loc.col, { tripleQuoted: s.tripleQuoted });
-          if (s.value.startsWith('"')) {
-            const retRuleInner = semanticQuotedOrchestrationInner(s.value, s.tripleQuoted === true);
-            validateRuleStringCaptures(retRuleInner, s.loc);
-            validateSimpleInterpolationIdentifiers(
-              retRuleInner,
-              ast.filePath,
-              s.loc.line,
-              s.loc.col,
-              "return",
-              ruleKnownVars,
-              "rule",
-              undefined,
-              undefined,
-              localScripts,
-            );
-          }
-        }
-        return;
       }
-      if (s.type === "const") {
-        const v = s.value;
-        if (v.kind === "run_capture") {
-          validateNoShellRedirection(ast.filePath, v.ref.loc, "run", v.args);
-          validateNestedManagedCallArgs(ast.filePath, v.ref.loc, v.args);
-          if (!v.ref.value.includes(".") && ruleKnownVars.has(v.ref.value) && !localScripts.has(v.ref.value)) {
-            throw jaiphError(ast.filePath, v.ref.loc.line, v.ref.loc.col, "E_VALIDATE", `strings are not executable; "${v.ref.value}" is a string — use a script instead`);
-          }
-          validateRef(v.ref, ast, refCtx, expectRunInRuleRef);
-          validateArity(ast.filePath, v.ref.loc, v.ref.value, v.args, "workflow", ast, refCtx);
+      importedAstCache.set(resolved, importedAst);
+    });
+  }
 
-          validateBareIdentifierArgs(ast.filePath, v.ref.loc, v.bareIdentifierArgs, ruleKnownVars);
-        } else if (v.kind === "ensure_capture") {
-          validateNoShellRedirection(ast.filePath, v.ref.loc, "ensure", v.args);
-          validateNestedManagedCallArgs(ast.filePath, v.ref.loc, v.args);
-          validateRef(v.ref, ast, refCtx, expectRuleRef);
-          validateArity(ast.filePath, v.ref.loc, v.ref.value, v.args, "rule", ast, refCtx);
+  const refCtx = {
+    importsByAlias,
+    importedAstCache,
+    localRules,
+    localWorkflows,
+    localScripts,
+  };
 
-          validateBareIdentifierArgs(ast.filePath, v.ref.loc, v.bareIdentifierArgs, ruleKnownVars);
-        } else if (v.kind === "prompt_capture") {
-          throw jaiphError(ast.filePath, s.loc.line, s.loc.col, "E_VALIDATE", "const ... = prompt is not allowed in rules");
-        } else if (v.kind === "run_inline_script_capture") {
-          // inline script capture — no ref to validate
-        } else if (v.kind === "match_expr") {
-          validateMatchExpr(ast.filePath, v.match, ruleKnownVars);
-        } else if (v.kind === "expr") {
-          const scriptName = extractConstScriptName(v.bashRhs);
-          if (scriptName && localScripts.has(scriptName)) {
-            throw jaiphError(ast.filePath, s.loc.line, s.loc.col, "E_VALIDATE", `scripts are not values; "${scriptName}" is a script definition`);
-          }
-          validateRuleStringCaptures(stripDQ(v.bashRhs), s.loc);
-          validateSimpleInterpolationIdentifiers(
-            stripDQ(v.bashRhs),
-            ast.filePath,
-            s.loc.line,
-            s.loc.col,
-            "const",
-            ruleKnownVars,
-            "rule",
-            undefined,
-            undefined,
-            localScripts,
-          );
-        }
-        return;
-      }
-      if (s.type === "match") {
-        validateMatchExpr(ast.filePath, s.expr, ruleKnownVars);
-        return;
-      }
-      if (s.type === "if") {
-        if (s.operand.kind === "regex") {
-          try { new RegExp(s.operand.source); } catch {
-            throw jaiphError(ast.filePath, s.loc.line, s.loc.col, "E_VALIDATE", `invalid regex in if condition: /${s.operand.source}/`);
-          }
-        }
-        for (const bodyStep of s.body) validateRuleStep(bodyStep);
-        return;
-      }
-      if (s.type === "for_lines") {
-        if (!ruleKnownVars.has(s.sourceVar)) {
-          throw jaiphError(
-            ast.filePath,
-            s.loc.line,
-            s.loc.col,
-            "E_VALIDATE",
-            `for ... in <name>: "${s.sourceVar}" is not a known variable in this scope`,
-          );
-        }
-        for (const bodyStep of s.body) validateRuleStep(bodyStep);
-        return;
-      }
-      if (s.type === "run_inline_script") {
-        return;
-      }
-      if (s.type === "shell") {
-        throw jaiphError(
-          ast.filePath,
-          s.loc.line,
-          s.loc.col,
-          "E_VALIDATE",
-          "inline shell steps are forbidden in rules; use explicit script blocks",
-        );
-      }
-      const _never: never = s;
-      return _never;
-    };
-    for (const st of rule.steps) {
-      validateRuleStep(st);
-    }
-  }
+  const baseCtx = {
+    diag,
+    ast,
+    refCtx,
+    localChannels,
+    localScripts,
+    localWorkflows,
+    importsByAlias,
+    importedAstCache,
+  } as const;
 
-  const validateChannelRef = (
-    channel: string,
-    loc: { line: number; col: number },
-  ): void => {
-    const parts = channel.split(".");
-    if (parts.length === 1) {
-      if (!localChannels.has(channel)) {
-        throw jaiphError(
-          ast.filePath,
-          loc.line,
-          loc.col,
-          "E_VALIDATE",
-          `Channel "${channel}" is not defined`,
-        );
-      }
-      return;
-    }
-    if (parts.length !== 2) {
-      throw jaiphError(
-        ast.filePath,
-        loc.line,
-        loc.col,
-        "E_VALIDATE",
-        `Channel "${channel}" is not defined`,
-      );
-    }
-    const [alias, importedChannel] = parts;
-    const importedFile = importsByAlias.get(alias);
-    if (!importedFile) {
-      throw jaiphError(
-        ast.filePath,
-        loc.line,
-        loc.col,
-        "E_VALIDATE",
-        `Channel "${channel}" is not defined`,
-      );
-    }
-    const importedAst = importedAstCache.get(importedFile)!;
-    const importedChannels = new Set(importedAst.channels.map((c) => c.name));
-    if (!importedChannels.has(importedChannel)) {
-      throw jaiphError(
+  for (const rule of ast.rules) {
+    let ruleWalk: StepTreeWalk | undefined;
+    diag.capture(() => {
+      ruleWalk = walkStepTree(
+        diag,
         ast.filePath,
-        loc.line,
-        loc.col,
-        "E_VALIDATE",
-        `Channel "${channel}" is not defined`,
+        rule.steps,
+        ast.envDecls,
+        rule.params,
+        rule.loc,
+        localScripts,
+        { withPromptSchemas: false },
       );
+    });
+    if (!ruleWalk) continue;
+    const ctx: ValidatorCtx = {
+      ...baseCtx,
+      scope: RULE_SCOPE,
+      knownVars: ruleWalk.knownVars,
+      promptSchemas: ruleWalk.promptSchemas,
+      recoverBindings: undefined,
+    };
+    for (const entry of ruleWalk.flat) {
+      diag.capture(() => validateStep(entry.step, { ...ctx, recoverBindings: entry.recoverBindings }));
     }
-  };
+  }
 
-  // Validate channel-level route declarations.
   for (const ch of ast.channels) {
-    if (ch.routes) {
-      for (const wfRef of ch.routes) {
-        validateRef(wfRef, ast, refCtx, expectWorkflowRef);
+    if (!ch.routes) continue;
+    for (const wfRef of ch.routes) {
+      diag.capture(() => {
+        validateRef(wfRef, ast, refCtx, { mode: "expect", expect: ROUTE_REF_EXPECT });
         const targetParams = resolveRouteTargetParams(wfRef.value, ast, refCtx);
         if (targetParams !== undefined && targetParams !== 3) {
-          throw jaiphError(
+          diag.error(
             ast.filePath,
             wfRef.loc.line,
             wfRef.loc.col,
@@ -998,444 +333,122 @@ export function validateReferences(ast: jaiphModule, ctx: ValidateContext): void
             `inbox route target "${wfRef.value}" must declare exactly 3 parameters (message, channel, sender), but declares ${targetParams}`,
           );
         }
-      }
+      });
     }
   }
 
   for (const workflow of ast.workflows) {
-    validateImmutableBindings(ast.filePath, workflow.steps, workflow.params, workflow.loc, ast.envDecls, localScripts);
-    const promptSchemas = collectPromptSchemas(workflow.steps);
-    const wfKnownVars = collectKnownVars(workflow.steps, ast.envDecls, workflow.params);
-    // Named params are validated via knownVars; positional argN access was removed.
-
-    const validateStep = (s: WorkflowStepDef, recoverBindings?: Set<string>): void => {
-      if (s.type === "comment" || s.type === "blank_line") {
-        return;
-      }
-      if (s.type === "send") {
-        validateChannelRef(s.channel, s.loc);
-        if (s.rhs.kind === "run") {
-          validateNoShellRedirection(ast.filePath, s.rhs.ref.loc, "run", s.rhs.args);
-          validateNestedManagedCallArgs(ast.filePath, s.rhs.ref.loc, s.rhs.args);
-          validateRef(s.rhs.ref, ast, refCtx, expectRunTargetRef);
-          validateArity(ast.filePath, s.rhs.ref.loc, s.rhs.ref.value, s.rhs.args, "workflow", ast, refCtx);
-
-          validateBareIdentifierArgs(ast.filePath, s.rhs.ref.loc, s.rhs.bareIdentifierArgs, wfKnownVars, recoverBindings);
-        } else if (s.rhs.kind === "literal") {
-          const inner = s.rhs.token.startsWith('"') && s.rhs.token.endsWith('"')
-            ? s.rhs.token.slice(1, -1) : s.rhs.token;
-          validateJaiphStringContent(inner, ast.filePath, s.loc.line, s.loc.col, "send");
-          validateWorkflowStringCaptures(inner, s.loc);
-          validateDotFieldRefs(inner, s.loc, promptSchemas);
-          validateSimpleInterpolationIdentifiers(
-            inner,
-            ast.filePath,
-            s.loc.line,
-            s.loc.col,
-            "send",
-            wfKnownVars,
-            "workflow",
-            promptSchemas,
-            recoverBindings,
-            localScripts,
-          );
-        } else if (s.rhs.kind === "bare_ref") {
-          validateRef(s.rhs.ref, ast, refCtx, bareSendRefSpec);
-        } else if (s.rhs.kind === "shell") {
-          validateManagedWorkflowShell(
-            s.rhs.command,
-            makeSubEnv({ line: s.rhs.loc.line, col: s.rhs.loc.col }),
-          );
-        }
-        return;
-      }
-      if (s.type === "ensure") {
-        validateNoShellRedirection(ast.filePath, s.ref.loc, "ensure", s.args);
-        validateNestedManagedCallArgs(ast.filePath, s.ref.loc, s.args);
-        validateRef(s.ref, ast, refCtx, expectRuleRef);
-        validateArity(ast.filePath, s.ref.loc, s.ref.value, s.args, "rule", ast, refCtx);
+    let wfWalk: StepTreeWalk | undefined;
+    diag.capture(() => {
+      wfWalk = walkStepTree(
+        diag,
+        ast.filePath,
+        workflow.steps,
+        ast.envDecls,
+        workflow.params,
+        workflow.loc,
+        localScripts,
+        { withPromptSchemas: true },
+      );
+    });
+    if (!wfWalk) continue;
+    const ctx: ValidatorCtx = {
+      ...baseCtx,
+      scope: WORKFLOW_SCOPE,
+      knownVars: wfWalk.knownVars,
+      promptSchemas: wfWalk.promptSchemas,
+      recoverBindings: undefined,
+    };
+    for (const entry of wfWalk.flat) {
+      diag.capture(() => validateStep(entry.step, { ...ctx, recoverBindings: entry.recoverBindings }));
+    }
+  }
 
-        validateBareIdentifierArgs(ast.filePath, s.ref.loc, s.bareIdentifierArgs, wfKnownVars, recoverBindings);
-        if (s.catch) {
-          const steps = "single" in s.catch ? [s.catch.single] : s.catch.block;
-          const rb = new Set<string>();
-          rb.add(s.catch.bindings.failure);
-          for (const r of steps) validateStep(r, rb);
-        }
-        return;
-      }
-      if (s.type === "run") {
-        validateNoShellRedirection(ast.filePath, s.workflow.loc, "run", s.args);
-        validateNestedManagedCallArgs(ast.filePath, s.workflow.loc, s.args);
-        if (!s.workflow.value.includes(".") && wfKnownVars.has(s.workflow.value) && !localScripts.has(s.workflow.value) && !localWorkflows.has(s.workflow.value)) {
-          throw jaiphError(ast.filePath, s.workflow.loc.line, s.workflow.loc.col, "E_VALIDATE", `strings are not executable; "${s.workflow.value}" is a string — use a script instead`);
-        }
-        validateRef(s.workflow, ast, refCtx, expectRunTargetRef);
-        validateArity(ast.filePath, s.workflow.loc, s.workflow.value, s.args, "workflow", ast, refCtx);
+  if (ast.tests && ast.tests.length > 0) {
+    validateTestBlocks(diag, ast, ast.tests);
+  }
+}
 
-        validateBareIdentifierArgs(ast.filePath, s.workflow.loc, s.bareIdentifierArgs, wfKnownVars, recoverBindings);
-        if (s.catch) {
-          const steps = "single" in s.catch ? [s.catch.single] : s.catch.block;
-          const rb = new Set<string>();
-          rb.add(s.catch.bindings.failure);
-          for (const r of steps) validateStep(r, rb);
-        }
-        if (s.recover) {
-          const steps = "single" in s.recover ? [s.recover.single] : s.recover.block;
-          const rb = new Set<string>();
-          rb.add(s.recover.bindings.failure);
-          for (const r of steps) validateStep(r, rb);
-        }
-        return;
-      }
-      if (s.type === "prompt") {
-        if (s.bodyKind === "identifier" && s.bodyIdentifier && localScripts.has(s.bodyIdentifier)) {
-          throw jaiphError(ast.filePath, s.loc.line, s.loc.col, "E_VALIDATE", `scripts are not promptable; "${s.bodyIdentifier}" is a script — use a string const instead`);
-        }
-        validatePromptString(s.raw, ast.filePath, s.loc.line, s.loc.col, {
-          tripleQuoted: s.bodyKind === "triple_quoted",
-        });
-        validatePromptStepReturns(s, ast.filePath);
-        const promptInner = semanticQuotedOrchestrationInner(s.raw, s.bodyKind === "triple_quoted");
-        validateWorkflowStringCaptures(promptInner, s.loc);
-        validateDotFieldRefs(promptInner, s.loc, promptSchemas);
-        validateSimpleInterpolationIdentifiers(
-          promptInner,
-          ast.filePath,
-          s.loc.line,
-          s.loc.col,
-          "prompt",
-          wfKnownVars,
-          "workflow",
-          promptSchemas,
-          recoverBindings,
-          localScripts,
-        );
-        return;
-      }
-      if (s.type === "log") {
-        if (s.managed?.kind === "run_inline_script") return; // inline script — no ref to validate
-        validateLogString(s.message, ast.filePath, s.loc.line, s.loc.col, "log", {
-          tripleQuoted: s.tripleQuoted,
-        });
-        const logInner = s.tripleQuoted ? dedentCommonLeadingWhitespace(s.message) : s.message;
-        validateWorkflowStringCaptures(logInner, s.loc);
-        validateDotFieldRefs(logInner, s.loc, promptSchemas);
-        validateSimpleInterpolationIdentifiers(
-          logInner,
-          ast.filePath,
-          s.loc.line,
-          s.loc.col,
-          "log",
-          wfKnownVars,
-          "workflow",
-          promptSchemas,
-          recoverBindings,
-          localScripts,
-        );
-        return;
-      }
-      if (s.type === "logerr") {
-        if (s.managed?.kind === "run_inline_script") return; // inline script — no ref to validate
-        validateLogString(s.message, ast.filePath, s.loc.line, s.loc.col, "logerr", {
-          tripleQuoted: s.tripleQuoted,
-        });
-        const logerrInner = s.tripleQuoted ? dedentCommonLeadingWhitespace(s.message) : s.message;
-        validateWorkflowStringCaptures(logerrInner, s.loc);
-        validateDotFieldRefs(logerrInner, s.loc, promptSchemas);
-        validateSimpleInterpolationIdentifiers(
-          logerrInner,
+function validateTestBlocks(
+  diag: Diagnostics,
+  ast: jaiphModule,
+  tests: import("../types").TestBlockDef[],
+): void {
+  for (const tb of tests) {
+    // Reject mixing `mock prompt { … }` with queued `mock prompt "…"` /
+    // `mock prompt <const>` in one test block — previously the queue entries
+    // were silently ignored when a block was present, so authored mocks
+    // could mask bugs by going unused.
+    diag.capture(() => {
+      let blockStep: { loc: { line: number; col: number } } | undefined;
+      let queueStep: { loc: { line: number; col: number } } | undefined;
+      for (const step of tb.steps) {
+        if (step.type === "test_mock_prompt_block" && !blockStep) blockStep = step;
+        if (step.type === "test_mock_prompt" && !queueStep) queueStep = step;
+        if (blockStep && queueStep) break;
+      }
+      if (blockStep && queueStep) {
+        const loc = blockStep.loc.line > queueStep.loc.line ? blockStep.loc : queueStep.loc;
+        diag.error(
           ast.filePath,
-          s.loc.line,
-          s.loc.col,
-          "logerr",
-          wfKnownVars,
-          "workflow",
-          promptSchemas,
-          recoverBindings,
-          localScripts,
+          loc.line,
+          loc.col,
+          "E_VALIDATE",
+          'cannot mix "mock prompt { … }" with queued "mock prompt …" in one test block; choose one style',
         );
-        return;
       }
-      if (s.type === "return") {
-        if (s.managed) {
-          if (s.managed.kind === "run") {
-            validateNoShellRedirection(ast.filePath, s.managed.ref.loc, "run", s.managed.args);
-            validateNestedManagedCallArgs(ast.filePath, s.managed.ref.loc, s.managed.args);
-            validateRef(s.managed.ref, ast, refCtx, expectRunTargetRef);
-            validateArity(ast.filePath, s.managed.ref.loc, s.managed.ref.value, s.managed.args, "workflow", ast, refCtx);
+    });
 
-            validateBareIdentifierArgs(ast.filePath, s.managed.ref.loc, s.managed.bareIdentifierArgs, wfKnownVars, recoverBindings);
-          } else if (s.managed.kind === "ensure") {
-            validateNoShellRedirection(ast.filePath, s.managed.ref.loc, "ensure", s.managed.args);
-            validateNestedManagedCallArgs(ast.filePath, s.managed.ref.loc, s.managed.args);
-            validateRef(s.managed.ref, ast, refCtx, expectRuleRef);
-            validateArity(ast.filePath, s.managed.ref.loc, s.managed.ref.value, s.managed.args, "rule", ast, refCtx);
-
-            validateBareIdentifierArgs(ast.filePath, s.managed.ref.loc, s.managed.bareIdentifierArgs, wfKnownVars, recoverBindings);
-          } else if (s.managed.kind === "match") {
-            validateMatchExpr(ast.filePath, s.managed.match, wfKnownVars);
-          }
+    const inScope = new Set<string>();
+    for (const step of tb.steps) {
+      diag.capture(() => {
+        if (step.type === "test_const") {
+          inScope.add(step.name);
           return;
         }
-        validateReturnString(s.value, ast.filePath, s.loc.line, s.loc.col, { tripleQuoted: s.tripleQuoted });
-        if (s.value.startsWith('"')) {
-          const retInner = semanticQuotedOrchestrationInner(s.value, s.tripleQuoted === true);
-          validateWorkflowStringCaptures(retInner, s.loc);
-          validateDotFieldRefs(retInner, s.loc, promptSchemas);
-          validateSimpleInterpolationIdentifiers(
-            retInner,
-            ast.filePath,
-            s.loc.line,
-            s.loc.col,
-            "return",
-            wfKnownVars,
-            "workflow",
-            promptSchemas,
-            recoverBindings,
-            localScripts,
-          );
+        if (step.type === "test_run_workflow") {
+          if (step.captureName) inScope.add(step.captureName);
+          return;
         }
-        return;
-      }
-      if (s.type === "fail") {
-        validateFailString(s.message, ast.filePath, s.loc.line, s.loc.col, { tripleQuoted: s.tripleQuoted });
-        const failWfInner = semanticQuotedOrchestrationInner(s.message, s.tripleQuoted === true);
-        validateWorkflowStringCaptures(failWfInner, s.loc);
-        validateDotFieldRefs(failWfInner, s.loc, promptSchemas);
-        validateSimpleInterpolationIdentifiers(
-          failWfInner,
-          ast.filePath,
-          s.loc.line,
-          s.loc.col,
-          "fail",
-          wfKnownVars,
-          "workflow",
-          promptSchemas,
-          recoverBindings,
-          localScripts,
-        );
-        return;
-      }
-      if (s.type === "const") {
-        const v = s.value;
-        if (v.kind === "run_capture") {
-          validateNoShellRedirection(ast.filePath, v.ref.loc, "run", v.args);
-          validateNestedManagedCallArgs(ast.filePath, v.ref.loc, v.args);
-          if (!v.ref.value.includes(".") && wfKnownVars.has(v.ref.value) && !localScripts.has(v.ref.value) && !localWorkflows.has(v.ref.value)) {
-            throw jaiphError(ast.filePath, v.ref.loc.line, v.ref.loc.col, "E_VALIDATE", `strings are not executable; "${v.ref.value}" is a string — use a script instead`);
-          }
-          validateRef(v.ref, ast, refCtx, expectRunTargetRef);
-          validateArity(ast.filePath, v.ref.loc, v.ref.value, v.args, "workflow", ast, refCtx);
-
-          validateBareIdentifierArgs(ast.filePath, v.ref.loc, v.bareIdentifierArgs, wfKnownVars, recoverBindings);
-        } else if (v.kind === "ensure_capture") {
-          validateNoShellRedirection(ast.filePath, v.ref.loc, "ensure", v.args);
-          validateNestedManagedCallArgs(ast.filePath, v.ref.loc, v.args);
-          validateRef(v.ref, ast, refCtx, expectRuleRef);
-          validateArity(ast.filePath, v.ref.loc, v.ref.value, v.args, "rule", ast, refCtx);
-
-          validateBareIdentifierArgs(ast.filePath, v.ref.loc, v.bareIdentifierArgs, wfKnownVars, recoverBindings);
-        } else if (v.kind === "prompt_capture") {
-          if (v.bodyKind === "identifier" && v.bodyIdentifier && localScripts.has(v.bodyIdentifier)) {
-            throw jaiphError(ast.filePath, s.loc.line, s.loc.col, "E_VALIDATE", `scripts are not promptable; "${v.bodyIdentifier}" is a script — use a string const instead`);
-          }
-          validatePromptString(v.raw, ast.filePath, s.loc.line, s.loc.col, {
-            tripleQuoted: v.bodyKind === "triple_quoted",
-          });
-          if (v.returns !== undefined) {
-            validatePromptReturnsSchema(v.returns, ast.filePath, s.loc.line, s.loc.col);
-          }
-          const pcInner = semanticQuotedOrchestrationInner(v.raw, v.bodyKind === "triple_quoted");
-          validateWorkflowStringCaptures(pcInner, s.loc);
-          validateDotFieldRefs(pcInner, s.loc, promptSchemas);
-          validateSimpleInterpolationIdentifiers(
-            pcInner,
-            ast.filePath,
-            s.loc.line,
-            s.loc.col,
-            "prompt",
-            wfKnownVars,
-            "workflow",
-            promptSchemas,
-            recoverBindings,
-            localScripts,
-          );
-        } else if (v.kind === "run_inline_script_capture") {
-          // inline script capture — no ref to validate
-        } else if (v.kind === "match_expr") {
-          validateMatchExpr(ast.filePath, v.match, wfKnownVars);
-        } else if (v.kind === "expr") {
-          const scriptName = extractConstScriptName(v.bashRhs);
-          if (scriptName && localScripts.has(scriptName)) {
-            throw jaiphError(ast.filePath, s.loc.line, s.loc.col, "E_VALIDATE", `scripts are not values; "${scriptName}" is a script definition`);
+        if (step.type === "test_mock_prompt" && step.responseVar) {
+          if (!inScope.has(step.responseVar)) {
+            diag.error(
+              ast.filePath,
+              step.loc.line,
+              step.loc.col,
+              "E_VALIDATE",
+              `mock prompt: undefined name "${step.responseVar}" (declare it earlier with: const ${step.responseVar} = "…")`,
+            );
           }
-          const exprInner = semanticQuotedOrchestrationInner(v.bashRhs, v.tripleQuoted === true);
-          validateWorkflowStringCaptures(exprInner, s.loc);
-          validateDotFieldRefs(exprInner, s.loc, promptSchemas);
-          validateSimpleInterpolationIdentifiers(
-            exprInner,
-            ast.filePath,
-            s.loc.line,
-            s.loc.col,
-            "const",
-            wfKnownVars,
-            "workflow",
-            promptSchemas,
-            recoverBindings,
-            localScripts,
-          );
+          return;
         }
-        return;
-      }
-      if (s.type === "match") {
-        validateMatchExpr(ast.filePath, s.expr, wfKnownVars);
-        return;
-      }
-      if (s.type === "if") {
-        if (s.operand.kind === "regex") {
-          try { new RegExp(s.operand.source); } catch {
-            throw jaiphError(ast.filePath, s.loc.line, s.loc.col, "E_VALIDATE", `invalid regex in if condition: /${s.operand.source}/`);
+        if (
+          step.type === "test_expect_contain" ||
+          step.type === "test_expect_not_contain" ||
+          step.type === "test_expect_equal"
+        ) {
+          if (!inScope.has(step.variable)) {
+            diag.error(
+              ast.filePath,
+              step.loc.line,
+              step.loc.col,
+              "E_VALIDATE",
+              `${step.type.replace("test_", "")}: undefined name "${step.variable}" (capture it first with: const ${step.variable} = run …)`,
+            );
           }
-        }
-        for (const bodyStep of s.body) validateStep(bodyStep, recoverBindings);
-        return;
-      }
-      if (s.type === "for_lines") {
-        if (!wfKnownVars.has(s.sourceVar)) {
-          throw jaiphError(
-            ast.filePath,
-            s.loc.line,
-            s.loc.col,
-            "E_VALIDATE",
-            `for ... in <name>: "${s.sourceVar}" is not a known variable in this scope`,
-          );
-        }
-        for (const bodyStep of s.body) validateStep(bodyStep, recoverBindings);
-        return;
-      }
-      if (s.type === "run_inline_script") {
-        return;
-      }
-      if (s.type === "shell") {
-        if (hasUnquotedSendArrow(s.command) && matchSendOperator(s.command) === null) {
-          throw jaiphError(
-            ast.filePath,
-            s.loc.line,
-            s.loc.col,
-            "E_VALIDATE",
-            "invalid send: channel must be a single name or `alias.name` (at most one dot in the channel part)",
-          );
-        }
-        const t = s.command.trim();
-        if (/^(?:[A-Za-z_][A-Za-z0-9_]*)(?:\.[A-Za-z_][A-Za-z0-9_]*)*$/.test(t)) {
-          if (!t.includes(".")) {
-            if (localScripts.has(t) || localWorkflows.has(t)) {
-              throw jaiphError(
-                ast.filePath,
-                s.loc.line,
-                s.loc.col,
-                "E_VALIDATE",
-                `use run ${t}() — a bare name that refers to a script or workflow must use a managed run step`,
-              );
-            }
-          } else {
-            validateRef({ value: t, loc: s.loc }, ast, refCtx, expectRunTargetRef);
-            throw jaiphError(
+          const refName =
+            step.type === "test_expect_equal" ? step.expectedVar : step.substringVar;
+          if (refName !== undefined && !inScope.has(refName)) {
+            diag.error(
               ast.filePath,
-              s.loc.line,
-              s.loc.col,
+              step.loc.line,
+              step.loc.col,
               "E_VALIDATE",
-              `use run ${t}() — "${t}" is a valid script or workflow reference; use a managed run step`,
+              `${step.type.replace("test_", "")}: undefined name "${refName}" (declare it earlier with: const ${refName} = "…")`,
             );
           }
         }
-        return;
-      }
-      const _never: never = s;
-      return _never;
-    };
-
-
-    for (const step of workflow.steps) {
-      validateStep(step);
+      });
     }
   }
-
-  if (ast.tests && ast.tests.length > 0) {
-    validateTestBlocks(ast, ast.tests);
-  }
 }
-
-/**
- * Validate variable references inside `test` blocks. The only names in scope are
- * those introduced by `const NAME = …` (literal or `run … capture`) earlier in
- * the same block. There is no implicit `response`: an `expect_*` step that
- * references an undeclared name is a compile-time error.
- *
- * Errors raised:
- * - `mock prompt <ident>` where `<ident>` was not declared earlier
- * - `expect_*` LHS variable not declared earlier
- * - `expect_* var <ident>` RHS where `<ident>` was not declared earlier
- */
-function validateTestBlocks(ast: jaiphModule, tests: import("../types").TestBlockDef[]): void {
-  for (const tb of tests) {
-    const inScope = new Set<string>();
-    for (const step of tb.steps) {
-      if (step.type === "test_const") {
-        inScope.add(step.name);
-        continue;
-      }
-      if (step.type === "test_run_workflow") {
-        if (step.captureName) inScope.add(step.captureName);
-        continue;
-      }
-      if (step.type === "test_mock_prompt" && step.responseVar) {
-        if (!inScope.has(step.responseVar)) {
-          throw jaiphError(
-            ast.filePath,
-            step.loc.line,
-            step.loc.col,
-            "E_VALIDATE",
-            `mock prompt: undefined name "${step.responseVar}" (declare it earlier with: const ${step.responseVar} = "…")`,
-          );
-        }
-        continue;
-      }
-      if (
-        step.type === "test_expect_contain" ||
-        step.type === "test_expect_not_contain" ||
-        step.type === "test_expect_equal"
-      ) {
-        if (!inScope.has(step.variable)) {
-          throw jaiphError(
-            ast.filePath,
-            step.loc.line,
-            step.loc.col,
-            "E_VALIDATE",
-            `${step.type.replace("test_", "")}: undefined name "${step.variable}" (capture it first with: const ${step.variable} = run …)`,
-          );
-        }
-        const refName =
-          step.type === "test_expect_equal"
-            ? step.expectedVar
-            : step.substringVar;
-        if (refName !== undefined && !inScope.has(refName)) {
-          throw jaiphError(
-            ast.filePath,
-            step.loc.line,
-            step.loc.col,
-            "E_VALIDATE",
-            `${step.type.replace("test_", "")}: undefined name "${refName}" (declare it earlier with: const ${refName} = "…")`,
-          );
-        }
-        continue;
-      }
-      // Other step types (mock_workflow/rule/script bodies, blank_line, comment) are
-      // out of scope for this pass: their bodies are validated as workflow/rule steps
-      // by the regular path when materialized, and they do not contribute to the
-      // test-level `vars` map.
-    }
-  }
-}
-
diff --git a/src/transpiler.ts b/src/transpiler.ts
index 86ab5141..d6ceba0b 100644
--- a/src/transpiler.ts
+++ b/src/transpiler.ts
@@ -1,47 +1,52 @@
-import { existsSync, readFileSync } from "node:fs";
-import { dirname } from "node:path";
-import { parsejaiph } from "./parser";
-import { buildScripts as buildScriptsImpl, walkTestFiles } from "./transpile/build";
-import { buildScriptFiles, type ScriptArtifact } from "./transpile/emit-script";
-import { resolveImportPath, workflowSymbolForFile } from "./transpile/resolve";
-import { resolveScriptImportPath, validateReferences } from "./transpile/validate";
+import type { ModuleGraph } from "./transpile/module-graph";
+import { loadModuleGraph } from "./transpile/module-graph";
+import { buildScripts as buildScriptsImpl, buildScriptsFromGraph as buildScriptsFromGraphImpl, walkTestFiles } from "./transpile/build";
+import { emitScriptsForModuleFromGraph } from "./transpile/emit-from-graph";
+import type { ScriptArtifact } from "./transpile/emit-script";
 
 export { resolveImportPath, workflowSymbolForFile } from "./transpile/resolve";
 export type { ScriptArtifact } from "./transpile/emit-script";
+export type { ModuleGraph, ModuleNode } from "./transpile/module-graph";
+export { loadModuleGraph } from "./transpile/module-graph";
+export { emitScriptsForModuleFromGraph } from "./transpile/emit-from-graph";
 
 /**
- * Parse, validate, and extract per-`script` bash files for one module (no workflow bash emission).
+ * Path-based wrapper for callers that don't already have a graph (tests and
+ * legacy entry points). Loads a single-entry graph and emits scripts for the
+ * entry module. Imported modules are validated transitively as part of the
+ * shared graph but their script bodies are not emitted from this call.
  */
-export function emitScriptsForModule(inputFile: string, rootDir: string, workspaceRoot?: string): ScriptArtifact[] {
-  const ast = parsejaiph(readFileSync(inputFile, "utf8"), inputFile);
-  validateReferences(ast, {
-    resolveImportPath,
-    existsSync,
-    readFile: (path: string) => readFileSync(path, "utf8"),
-    parse: parsejaiph,
-    workspaceRoot,
-  });
-  const workflowSymbol = workflowSymbolForFile(inputFile, rootDir);
-  const importedWorkflowSymbols = new Map<string, string>();
-  for (const imp of ast.imports) {
-    const importedFile = resolveImportPath(ast.filePath, imp.path, workspaceRoot);
-    importedWorkflowSymbols.set(imp.alias, workflowSymbolForFile(importedFile, rootDir));
-  }
-  // Resolve script imports: read external script files so they are emitted as artifacts.
-  let resolvedScriptImports: Map<string, string> | undefined;
-  if (ast.scriptImports && ast.scriptImports.length > 0) {
-    resolvedScriptImports = new Map();
-    for (const si of ast.scriptImports) {
-      const resolved = resolveScriptImportPath(ast.filePath, si.path);
-      resolvedScriptImports.set(si.alias, readFileSync(resolved, "utf8"));
-    }
-  }
-  return buildScriptFiles(ast, importedWorkflowSymbols, workflowSymbol, resolvedScriptImports);
+export function emitScriptsForModule(
+  inputFile: string,
+  rootDir: string,
+  workspaceRoot?: string,
+): ScriptArtifact[] {
+  const graph = loadModuleGraph(inputFile, workspaceRoot);
+  return emitScriptsForModuleFromGraph(graph, graph.entryFile, rootDir);
 }
 
 export { walkTestFiles };
 
-export function buildScripts(inputPath: string, targetDir?: string, workspaceRoot?: string): { scriptsDir: string } {
-  const emitFn = (file: string, root: string) => emitScriptsForModule(file, root, workspaceRoot);
-  return buildScriptsImpl(inputPath, targetDir, emitFn, workspaceRoot);
+/**
+ * Path-based wrapper. Loads the module graph and emits per-script bash files
+ * for every reachable module (file entry) or every non-test `.jh` under the
+ * directory (directory entry). Kept for tests and the `jaiph test` path.
+ */
+export function buildScripts(
+  inputPath: string,
+  targetDir?: string,
+  workspaceRoot?: string,
+): { scriptsDir: string } {
+  return buildScriptsImpl(inputPath, targetDir, workspaceRoot);
+}
+
+/**
+ * Graph-based entry point. Used by `jaiph run` where the parent CLI already
+ * built the graph and wants to skip a second discovery walk.
+ */
+export function buildScriptsFromGraph(
+  graph: ModuleGraph,
+  targetDir: string,
+): { scriptsDir: string } {
+  return buildScriptsFromGraphImpl(graph, targetDir);
 }
diff --git a/src/types-shape.test.ts b/src/types-shape.test.ts
new file mode 100644
index 00000000..ad2045e6
--- /dev/null
+++ b/src/types-shape.test.ts
@@ -0,0 +1,160 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { readdirSync, readFileSync, statSync } from "node:fs";
+import { join, resolve } from "node:path";
+import type { Expr, WorkflowStepDef } from "./types";
+import * as TypesModule from "./types";
+
+// Tests run from dist/src/, so source files live two levels up under src/.
+const repoRoot = resolve(__dirname, "../..");
+const srcRoot = join(repoRoot, "src");
+
+/**
+ * AC1 — Placeholder strings deleted from the AST.
+ *
+ * After collapsing the three managed-call encodings into `Expr`, no source
+ * file under `src/` should ever produce the legacy sentinel values that
+ * existed only so the formatter could print something while the real
+ * payload sat in a `managed:` sidecar.
+ *
+ * If anyone reintroduces one of these strings as a placeholder, this test
+ * fails with the offending file:line.
+ */
+const PLACEHOLDER_STRINGS = ['"__match__"', '"run inline_script"', '"__JAIPH_MANAGED__"'];
+
+function listSourceFiles(dir: string, acc: string[]): void {
+  for (const entry of readdirSync(dir)) {
+    const full = join(dir, entry);
+    const st = statSync(full);
+    if (st.isDirectory()) {
+      // Skip the test file itself so it's allowed to mention the strings.
+      listSourceFiles(full, acc);
+      continue;
+    }
+    if (!entry.endsWith(".ts")) continue;
+    if (entry.endsWith(".test.ts")) continue; // tests may reference strings in assertions
+    if (full.endsWith("types-shape.test.ts")) continue;
+    acc.push(full);
+  }
+}
+
+test("AC1: no AST placeholder strings linger in src/", () => {
+  const files: string[] = [];
+  listSourceFiles(srcRoot, files);
+  const offenders: string[] = [];
+  for (const file of files) {
+    const text = readFileSync(file, "utf8");
+    for (const placeholder of PLACEHOLDER_STRINGS) {
+      if (text.includes(placeholder)) {
+        offenders.push(`${file} contains ${placeholder}`);
+      }
+    }
+  }
+  assert.deepEqual(offenders, [], `Placeholder strings reappeared in src/:\n${offenders.join("\n")}`);
+});
+
+/**
+ * AC2 — `WorkflowStepDef` has at most 8 variants. The exhaustive switch
+ * below fails to compile if a new variant is silently added (the `never`
+ * fallback widens), and the runtime tuple lookup pins the count to 8.
+ */
+type StepType = WorkflowStepDef["type"];
+type AllStepTypes = readonly ["exec", "const", "return", "send", "say", "if", "for_lines", "trivia"];
+type _StepTypesCoverAllVariants = StepType extends AllStepTypes[number]
+  ? AllStepTypes[number] extends StepType
+    ? true
+    : never
+  : never;
+const _stepTypesAtMost8: _StepTypesCoverAllVariants = true;
+
+function _exhaustiveStepSwitch(s: WorkflowStepDef): void {
+  switch (s.type) {
+    case "exec":
+    case "const":
+    case "return":
+    case "send":
+    case "say":
+    case "if":
+    case "for_lines":
+    case "trivia":
+      return;
+    default: {
+      const _never: never = s;
+      return _never;
+    }
+  }
+}
+
+test("AC2: WorkflowStepDef has exactly 8 variants", () => {
+  const declaredTypes: AllStepTypes = ["exec", "const", "return", "send", "say", "if", "for_lines", "trivia"];
+  assert.equal(declaredTypes.length, 8);
+  assert.equal(_stepTypesAtMost8, true);
+  // Reference the exhaustive switch so the unused-symbol check is happy and
+  // the dead-code eliminator can't drop the type-level assertion.
+  void _exhaustiveStepSwitch;
+});
+
+/**
+ * AC2 (companion) — `Expr` is exhaustive too. The Refactor 3 design carries
+ * 7 base kinds from the task spec; this implementation adds `shell` and
+ * `bare_ref` for send-RHS shapes that the validator either rejects or
+ * specializes. If a kind is added or removed without updating both the
+ * declared list and the exhaustive switch, this fails to compile.
+ */
+type ExprKind = Expr["kind"];
+type AllExprKinds = readonly ["literal", "call", "ensure_call", "inline_script", "prompt", "match", "shell", "bare_ref"];
+type _ExprKindsExhaustive = ExprKind extends AllExprKinds[number]
+  ? AllExprKinds[number] extends ExprKind
+    ? true
+    : never
+  : never;
+const _exprExhaustive: _ExprKindsExhaustive = true;
+
+function _exhaustiveExprSwitch(e: Expr): void {
+  switch (e.kind) {
+    case "literal":
+    case "call":
+    case "ensure_call":
+    case "inline_script":
+    case "prompt":
+    case "match":
+    case "shell":
+    case "bare_ref":
+      return;
+    default: {
+      const _never: never = e;
+      return _never;
+    }
+  }
+}
+
+test("AC2: Expr has exactly 8 kinds (literal/call/ensure_call/inline_script/prompt/match/shell/bare_ref)", () => {
+  const declaredKinds: AllExprKinds = ["literal", "call", "ensure_call", "inline_script", "prompt", "match", "shell", "bare_ref"];
+  assert.equal(declaredKinds.length, 8);
+  assert.equal(_exprExhaustive, true);
+  void _exhaustiveExprSwitch;
+});
+
+/**
+ * AC3 — `ConstRhs` and `SendRhsDef` are deleted as separate exported
+ * symbols; their fields now live inside `Expr`.
+ */
+test("AC3: ConstRhs and SendRhsDef are not exported from src/types.ts", () => {
+  const exported = Object.keys(TypesModule);
+  // Both symbol names should be absent from the module's export surface.
+  assert.ok(!exported.includes("ConstRhs"), `ConstRhs should not be exported`);
+  assert.ok(!exported.includes("SendRhsDef"), `SendRhsDef should not be exported`);
+
+  // Belt-and-suspenders: re-check the source file. (Pure types don't show up
+  // in runtime exports, so the textual check is what catches them.)
+  const typesPath = join(srcRoot, "types.ts");
+  const typesText = readFileSync(typesPath, "utf8");
+  assert.ok(
+    !/export\s+type\s+ConstRhs\b/.test(typesText),
+    "src/types.ts must not export ConstRhs",
+  );
+  assert.ok(
+    !/export\s+type\s+SendRhsDef\b/.test(typesText),
+    "src/types.ts must not export SendRhsDef",
+  );
+});
diff --git a/src/types.ts b/src/types.ts
index 61e6abff..6f7c0b02 100644
--- a/src/types.ts
+++ b/src/types.ts
@@ -7,8 +7,6 @@ export interface ImportDef {
   path: string;
   alias: string;
   loc: SourceLoc;
-  /** Top-level `#` lines immediately before this import (formatter). */
-  leadingComments?: string[];
 }
 
 /** `import script "<path>" as <name>` — binds an external script file as a local script symbol. */
@@ -18,8 +16,6 @@ export interface ScriptImportDef {
   /** Bound script name. */
   alias: string;
   loc: SourceLoc;
-  /** Top-level `#` lines immediately before this import (formatter). */
-  leadingComments?: string[];
 }
 
 export interface RuleRefDef {
@@ -51,32 +47,58 @@ export interface MatchExprDef {
   loc: SourceLoc;
 }
 
-export type ConstRhs =
-  | { kind: "expr"; bashRhs: string; /** `const x = """..."""` — runtime dedents margin. */ tripleQuoted?: boolean }
-  | { kind: "run_capture"; ref: WorkflowRefDef; args?: string; bareIdentifierArgs?: string[]; async?: boolean }
-  | { kind: "ensure_capture"; ref: RuleRefDef; args?: string; bareIdentifierArgs?: string[] }
-  | {
-      kind: "prompt_capture";
-      raw: string;
-      /** Body source: "string" (quoted literal), "identifier" (bare var ref), "triple_quoted" (""" block). */
-      bodyKind?: "string" | "identifier" | "triple_quoted";
-      /** Original identifier name when bodyKind is "identifier". */
-      bodyIdentifier?: string;
-      loc: SourceLoc;
-      returns?: string;
-    }
-  | { kind: "run_inline_script_capture"; body: string; lang?: string; args?: string; bareIdentifierArgs?: string[] }
-  | { kind: "match_expr"; match: MatchExprDef };
+/**
+ * Single call argument, classified at parse time.
+ *
+ * - `var`: a bare identifier reference (e.g. `foo(task)` → `{ kind: "var", name: "task" }`).
+ *   The validator checks `name` against in-scope bindings; the runtime sees `${name}`.
+ * - `literal`: any other form (quoted string, `${…}` interpolation, nested `run …` /
+ *   `ensure …` / inline-script call). Stored verbatim as authored, between the surrounding commas.
+ */
+export type Arg =
+  | { kind: "literal"; raw: string }
+  | { kind: "var"; name: string };
 
-/** RHS of `channel <- …` */
-export type SendRhsDef =
-  | { kind: "literal"; token: string; /** `channel <- """..."""` — runtime dedents margin. */ tripleQuoted?: boolean }
-  | { kind: "var"; bash: string }
-  | { kind: "run"; ref: WorkflowRefDef; args?: string; bareIdentifierArgs?: string[] }
-  /** Parsed then rejected in validation (use `run ref` to capture a return value). */
-  | { kind: "bare_ref"; ref: WorkflowRefDef }
-  /** Shell fragment emitted as `"$(...)"` for inbox send. */
-  | { kind: "shell"; command: string; loc: SourceLoc };
+/**
+ * One expression — used wherever a value can appear:
+ * - `const name = <Expr>`
+ * - `return <Expr>`
+ * - `send channel <- <Expr>`
+ * - `log <Expr>` / `logerr <Expr>` / `fail <Expr>`
+ * - body of an `exec` step (managed call statement form, where the value is consumed
+ *   for its side effects + optional capture)
+ *
+ * Replaces the prior `ConstRhs` / `SendRhsDef` unions and the placeholder-string
+ * `managed:` sidecar on `return` / `log` / `logerr`.
+ *
+ * Kinds:
+ * - `literal`: a string or `$var` / `${var}` form — the raw text as it appears in source
+ *   (post-dedent for triple-quoted bodies; the formatter consults trivia for surface form).
+ * - `call`: a managed workflow/script call `ref(args)`. `async` is set when the source said
+ *   `run async ref(...)` in capture position.
+ * - `ensure_call`: a managed rule call `ref(args)`.
+ * - `inline_script`: an inline-script call (`` `body`(args) `` or fenced).
+ * - `prompt`: a prompt body. `raw` carries the JSON-quoted prompt text (or `"${identifier}"`
+ *   sugar). `returns` carries an optional flat returns schema.
+ * - `match`: a `match <subject> { ... }` expression evaluated for its value.
+ * - `shell`: a raw shell fragment used as a managed substitution on the send RHS.
+ * - `bare_ref`: a bare symbol on a send RHS (e.g. `channel <- foo`). Always rejected by the
+ *   validator; preserved so the error message can name the symbol.
+ */
+export type Expr =
+  | { kind: "literal"; raw: string }
+  | { kind: "call"; callee: WorkflowRefDef; args?: Arg[]; async?: boolean }
+  | { kind: "ensure_call"; callee: RuleRefDef; args?: Arg[] }
+  | { kind: "inline_script"; lang?: string; body: string; args?: Arg[] }
+  | { kind: "prompt"; raw: string; loc: SourceLoc; returns?: string }
+  | { kind: "match"; match: MatchExprDef }
+  | { kind: "shell"; command: string; loc: SourceLoc }
+  | { kind: "bare_ref"; ref: WorkflowRefDef };
+
+/** Body attached to a `catch` or `recover` clause on an exec step. */
+export type CatchBody =
+  | { single: WorkflowStepDef; bindings: { failure: string } }
+  | { block: WorkflowStepDef[]; bindings: { failure: string } };
 
 export interface RuleDef {
   name: string;
@@ -92,8 +114,6 @@ export interface ChannelDef {
   name: string;
   routes?: WorkflowRefDef[];
   loc: SourceLoc;
-  /** Top-level `#` lines immediately before this channel (formatter). */
-  leadingComments?: string[];
 }
 
 export interface WorkflowDef {
@@ -114,135 +134,58 @@ export interface ScriptDef {
   body: string;
   /** Fence language tag (e.g. "python3", "node"). Maps to `#!/usr/bin/env <lang>`. */
   lang?: string;
-  /** How the body was provided: "backtick" (single `), "fenced" (``` block). */
-  bodyKind: "backtick" | "fenced";
   loc: SourceLoc;
 }
 
+/**
+ * Eight workflow-step variants — all values that flow through a step live in `Expr`.
+ *
+ * - `exec`: side-effecting managed call statement (was: `run` / `ensure` /
+ *   `run_inline_script` / `prompt` / `shell` step / standalone `match`). The
+ *   discriminator now lives inside `body.kind`; `captureName` / `async` /
+ *   `catch` / `recover` are step-level attributes.
+ * - `const` / `return` / `send`: bind, propagate, or emit an `Expr` value.
+ * - `say`: was `log` / `logerr` / `fail`. `level: "fail"` aborts the workflow
+ *   with the message; otherwise the message is written to the corresponding
+ *   stream.
+ * - `if` / `for_lines`: control flow (unchanged shape).
+ * - `trivia`: formatter-only `comment` / `blank_line` slots — they have no
+ *   execution semantics and are skipped by the runtime / validator.
+ */
 export type WorkflowStepDef =
   | {
-      type: "ensure";
-      ref: RuleRefDef;
-      args?: string;
-      bareIdentifierArgs?: string[];
-      /** When set, capture step stdout into this variable name. */
+      type: "exec";
+      body: Expr;
+      /** When set, capture the result into this variable name. */
       captureName?: string;
       /** When set, catch failure and run recovery body once. */
-      catch?:
-        | { single: WorkflowStepDef; bindings: { failure: string } }
-        | { block: WorkflowStepDef[]; bindings: { failure: string } };
-    }
-  | {
-      type: "run";
-      workflow: WorkflowRefDef;
-      args?: string;
-      bareIdentifierArgs?: string[];
-      /** When set, capture step stdout into this variable name. */
-      captureName?: string;
-      /** When set, execute asynchronously with implicit join before workflow completes. */
-      async?: boolean;
-      /** When set, catch failure and run recovery body once. */
-      catch?:
-        | { single: WorkflowStepDef; bindings: { failure: string } }
-        | { block: WorkflowStepDef[]; bindings: { failure: string } };
+      catch?: CatchBody;
       /** When set, retry with repair loop semantics (try → fail → recover body → retry). */
-      recover?:
-        | { single: WorkflowStepDef; bindings: { failure: string } }
-        | { block: WorkflowStepDef[]; bindings: { failure: string } };
-    }
-  | {
-      type: "prompt";
-      raw: string;
-      /** Body source: "string" (quoted literal), "identifier" (bare var ref), "triple_quoted" (""" block). */
-      bodyKind?: "string" | "identifier" | "triple_quoted";
-      /** Original identifier name when bodyKind is "identifier". */
-      bodyIdentifier?: string;
-      loc: SourceLoc;
-      /** When set, capture prompt stdout into this variable name. */
-      captureName?: string;
-      /** When set, validate response JSON against this flat schema (field: string|number|boolean). */
-      returns?: string;
-    }
-  | {
-      type: "comment";
-      text: string;
-      loc: SourceLoc;
-    }
-  | {
-      type: "fail";
-      message: string;
-      /** Set when `fail """..."""`; runtime dedents margin. */
-      tripleQuoted?: boolean;
+      recover?: CatchBody;
       loc: SourceLoc;
     }
   | {
       type: "const";
       name: string;
-      value: ConstRhs;
+      value: Expr;
       loc: SourceLoc;
     }
   | {
-      type: "log";
-      message: string;
-      /** Set when `log """..."""`; runtime dedents margin. */
-      tripleQuoted?: boolean;
-      loc: SourceLoc;
-      /** When set, log message comes from a managed inline-script call. */
-      managed?: { kind: "run_inline_script"; body: string; lang?: string; args?: string; bareIdentifierArgs?: string[] };
-    }
-  | {
-      type: "logerr";
-      message: string;
-      /** Set when `logerr """..."""`; runtime dedents margin. */
-      tripleQuoted?: boolean;
+      type: "return";
+      value: Expr;
       loc: SourceLoc;
-      /** When set, logerr message comes from a managed inline-script call. */
-      managed?: { kind: "run_inline_script"; body: string; lang?: string; args?: string; bareIdentifierArgs?: string[] };
     }
   | {
       type: "send";
       channel: string;
-      rhs: SendRhsDef;
-      loc: SourceLoc;
-    }
-  | {
-      type: "return";
-      value: string;
-      /** Set when `return """..."""`; runtime dedents margin. */
-      tripleQuoted?: boolean;
-      /**
-       * Original source expression when `return <expr>` was bare-identifier
-       * sugar (`return response` → value `"${response}"`). Preserved so the
-       * formatter can emit the bare form authored by the user.
-       */
-      bareSource?: string;
+      value: Expr;
       loc: SourceLoc;
-      /** When set, return value comes from a managed run/ensure/match instead of the literal `value`. */
-      managed?:
-        | { kind: "run"; ref: WorkflowRefDef; args?: string; bareIdentifierArgs?: string[] }
-        | { kind: "ensure"; ref: RuleRefDef; args?: string; bareIdentifierArgs?: string[] }
-        | { kind: "match"; match: MatchExprDef }
-        | { kind: "run_inline_script"; body: string; lang?: string; args?: string; bareIdentifierArgs?: string[] };
     }
   | {
-      type: "run_inline_script";
-      body: string;
-      /** Fence language tag (e.g. "node", "python3"). Maps to `#!/usr/bin/env <lang>`. */
-      lang?: string;
-      args?: string;
-      bareIdentifierArgs?: string[];
-      captureName?: string;
-      loc: SourceLoc;
-    }
-  | {
-      type: "shell";
-      command: string;
+      type: "say";
+      level: "log" | "logerr" | "fail";
+      message: Expr;
       loc: SourceLoc;
-      captureName?: string;
-    }
-  | {
-      type: "match";
-      expr: MatchExprDef;
     }
   | {
       type: "if";
@@ -250,6 +193,8 @@ export type WorkflowStepDef =
       operator: "==" | "!=" | "=~" | "!~";
       operand: { kind: "string_literal"; value: string } | { kind: "regex"; source: string };
       body: WorkflowStepDef[];
+      /** Optional `else { ... }` branch on `} else {`. */
+      elseBody?: WorkflowStepDef[];
       loc: SourceLoc;
     }
   | {
@@ -261,8 +206,11 @@ export type WorkflowStepDef =
       loc: SourceLoc;
     }
   | {
-      /** Preserved intentional blank line between steps (formatter only). */
-      type: "blank_line";
+      /** Formatter-only: `# comment` line or preserved blank line between steps. */
+      type: "trivia";
+      kind: "comment" | "blank_line";
+      text?: string;
+      loc?: SourceLoc;
     };
 
 export interface EnvDeclDef {
@@ -270,6 +218,8 @@ export interface EnvDeclDef {
   value: string;
   loc: SourceLoc;
   comments?: string[];
+  /** True when the source value was written as a double-quoted string (single-line `"..."` or triple-quoted `"""..."""`). False/undefined for bare tokens. The formatter preserves this distinction so a quoted value stays quoted. */
+  wasQuoted?: boolean;
 }
 
 /** Source order of definitions below imports / config / channels (formatter and round-trip). */
@@ -284,8 +234,6 @@ export interface jaiphModule {
   filePath: string;
   /** Optional in-file workflow metadata (agent model, command, run options). */
   metadata?: WorkflowMetadata;
-  /** Top-level `#` lines immediately before `config {` (formatter). */
-  configLeadingComments?: string[];
   imports: ImportDef[];
   /** `import script "<path>" as <name>` declarations. */
   scriptImports?: ScriptImportDef[];
@@ -298,10 +246,6 @@ export interface jaiphModule {
   envDecls?: EnvDeclDef[];
   /** Present only when parsing a *.test.jh file. */
   tests?: TestBlockDef[];
-  /** Encounter order of rule / script / workflow / env / test (excludes imports, config, channels). */
-  topLevelOrder?: TopLevelEmitOrder[];
-  /** Top-level `#` lines after the last declaration (formatter). */
-  trailingTopLevelComments?: string[];
 }
 
 /** Docker sandbox runtime configuration. */
@@ -311,11 +255,6 @@ export interface RuntimeConfig {
   dockerTimeoutSeconds?: number;
 }
 
-/** One line inside `config { }`: comment or assignment (formatter round-trip order). */
-export type ConfigBodyPart =
-  | { kind: "comment"; text: string }
-  | { kind: "assign"; key: string };
-
 /** In-file workflow metadata (replaces config file for V1). */
 export interface WorkflowMetadata {
   agent?: {
@@ -329,8 +268,6 @@ export interface WorkflowMetadata {
   run?: { debug?: boolean; logsDir?: string; recoverLimit?: number };
   runtime?: RuntimeConfig;
   module?: { name?: string; version?: string; description?: string };
-  /** Preserves `#` lines and assignment order inside `config { }` (formatter). */
-  configBodySequence?: ConfigBodyPart[];
 }
 
 /** Step inside a test block. Only present when module is a test file (*.test.jh). */
@@ -397,8 +334,6 @@ export interface TestBlockDef {
   description: string;
   steps: TestStepDef[];
   loc: SourceLoc;
-  /** Top-level `#` lines immediately before this `test` block (formatter). */
-  leadingComments?: string[];
 }
 
 export interface JaiphTestModule {
diff --git a/test-fixtures/compiler-txtar/parse-errors-snapshot.json b/test-fixtures/compiler-txtar/parse-errors-snapshot.json
new file mode 100644
index 00000000..008f300b
--- /dev/null
+++ b/test-fixtures/compiler-txtar/parse-errors-snapshot.json
@@ -0,0 +1,1997 @@
+{
+  "unterminated workflow block": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated block, expected \"}\""
+  },
+  "invalid script declaration": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "invalid script declaration"
+  },
+  "invalid rule declaration": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "invalid rule declaration"
+  },
+  "invalid workflow declaration": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "invalid workflow declaration"
+  },
+  "duplicate config block": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "duplicate config block (only one allowed per file)"
+  },
+  "unknown config key": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unknown config key: invalid.key. Allowed: agent.default_model, agent.command, agent.backend, agent.trusted_workspace, agent.cursor_flags, agent.claude_flags, run.logs_dir, run.debug, run.recover_limit, runtime.docker_image, runtime.docker_network, runtime.docker_timeout_seconds, module.name, module.version, module.description"
+  },
+  "single-quoted import path": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "single-quoted strings are not supported; use double quotes (\"...\") instead"
+  },
+  "import missing alias": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "import must match: import \"<path>\" as <alias>"
+  },
+  "command substitution in prompt": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "rule without braces": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "rule declarations require parentheses: rule foo() { … } or rule foo(params) { … }"
+  },
+  "rule with parentheses (unterminated)": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated rule block: foo"
+  },
+  "rule with colon instead of braces": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "rule declarations require parentheses: rule foo() { … } or rule foo(params) { … }"
+  },
+  "export rule without braces": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "rule declarations require parentheses: rule bar() { … } or rule bar(params) { … }"
+  },
+  "rule with parentheses but no brace": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "rule declarations require braces: rule gate() { … } or rule gate(params) { … }"
+  },
+  "script without braces": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "script definitions require = after the name: script greet = `...`"
+  },
+  "script with parentheses": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "definitions must not use parentheses: script greet = `...`"
+  },
+  "script with parens but no braces": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "definitions must not use parentheses: script greet = `...`"
+  },
+  "workflow without braces": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "workflow declarations require parentheses: workflow default() { … } or workflow default(params) { … }"
+  },
+  "workflow with parentheses (unterminated)": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated block, expected \"}\""
+  },
+  "export workflow without braces": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "workflow declarations require parentheses: workflow main() { … } or workflow main(params) { … }"
+  },
+  "workflow with parentheses but no brace": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "workflow declarations require braces: workflow main() { … } or workflow main(params) { … }"
+  },
+  "duplicate config in same workflow": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "duplicate config block inside workflow (only one allowed per workflow)"
+  },
+  "config after steps in workflow": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "config block inside workflow must appear before any steps"
+  },
+  "runtime keys in workflow config": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "runtime.* keys are not allowed in workflow-level config (only agent.* and run.* keys)"
+  },
+  "script tag with manual shebang conflict": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "fence tag \"node\" already sets the shebang — remove the manual \"#!\" line"
+  },
+  "script tag with parentheses": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unsupported top-level statement: script:node transform() {"
+  },
+  "script tag without braces": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unsupported top-level statement: script:node transform"
+  },
+  "capture with run async rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "assignment without \"const\" is no longer supported; use \"const x = run async some_wf()\""
+  },
+  "run async with inline script rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "run async is not supported with inline scripts"
+  },
+  "old inline script syntax rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "inline script syntax has changed: use run `body`(args) instead of run script(args) \"body\""
+  },
+  "invalid agent.backend value": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "agent.backend must be \"cursor\", \"claude\", or \"codex\""
+  },
+  "invalid config value not quoted": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "config value must be a quoted string or true/false: yes"
+  },
+  "config integer key rejects string value": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "runtime.docker_timeout_seconds must be an integer"
+  },
+  "config array key rejects runtime.workspace (no longer supported)": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unknown config key: runtime.workspace. Allowed: agent.default_model, agent.command, agent.backend, agent.trusted_workspace, agent.cursor_flags, agent.claude_flags, run.logs_dir, run.debug, run.recover_limit, runtime.docker_image, runtime.docker_network, runtime.docker_timeout_seconds, module.name, module.version, module.description"
+  },
+  "config rejects runtime.docker_enabled (no longer supported)": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unknown config key: runtime.docker_enabled. Allowed: agent.default_model, agent.command, agent.backend, agent.trusted_workspace, agent.cursor_flags, agent.claude_flags, run.logs_dir, run.debug, run.recover_limit, runtime.docker_image, runtime.docker_network, runtime.docker_timeout_seconds, module.name, module.version, module.description"
+  },
+  "unknown runtime config key": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unknown config key: runtime.unknown_key. Allowed: agent.default_model, agent.command, agent.backend, agent.trusted_workspace, agent.cursor_flags, agent.claude_flags, run.logs_dir, run.debug, run.recover_limit, runtime.docker_image, runtime.docker_network, runtime.docker_timeout_seconds, module.name, module.version, module.description"
+  },
+  "if keyword with old syntax produces error": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "invalid if syntax; expected: if <identifier> <op> <operand> { ... } where op is ==, !=, =~, or !~ and operand is \"string\" or /regex/"
+  },
+  "channel declaration must be single per line": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "invalid channel declaration; expected: channel <name> or channel <name> -> <workflow>"
+  },
+  "capture and send cannot be combined": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "top-level local keyword is rejected": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unsupported top-level statement: local greeting = \"hello world\""
+  },
+  "top-level const name collision with rule": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "duplicate name \"foo\" — variable name collides with rule of the same name"
+  },
+  "top-level const name collision with workflow": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "duplicate name \"default\" — variable name collides with workflow of the same name"
+  },
+  "top-level const name collision with script": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "duplicate name \"helper\" — variable name collides with script of the same name"
+  },
+  "const rejects bare call-like rhs without run": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "Script calls in const assignments must use run. Use: const x = run some_script(\"${arg}\")"
+  },
+  "unterminated rule block": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated rule block: bad"
+  },
+  "unsupported top-level statement": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unsupported top-level statement: echo \"not allowed at top level\""
+  },
+  "multiline prompt string rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "multiline prompt strings are no longer supported; use a triple-quoted block instead: prompt \"\"\"...\"\"\"\""
+  },
+  "if keyword with not produces error": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "invalid if syntax; expected: if <identifier> <op> <operand> { ... } where op is ==, !=, =~, or !~ and operand is \"string\" or /regex/"
+  },
+  "invalid workflow reference shape with extra dots": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "run must target a valid reference: run ref() or run ref(args) — parentheses are required"
+  },
+  "prompt with returns without capture name": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "ensure catch with args after catch": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 22,
+    "code": "E_PARSE",
+    "message": "catch requires explicit bindings: catch (<name>) { ... }"
+  },
+  "ensure catch with multiple args after catch": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 25,
+    "code": "E_PARSE",
+    "message": "catch requires explicit bindings: catch (<name>) { ... }"
+  },
+  "ensure catch without block": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 33,
+    "code": "E_PARSE",
+    "message": "catch requires explicit bindings and a body: catch (<name>) { ... }"
+  },
+  "ensure catch without bindings (bare catch block)": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 18,
+    "code": "E_PARSE",
+    "message": "catch requires explicit bindings: catch (<name>) { ... }"
+  },
+  "capture and send combined alt form": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject bare $name in log message": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject bare $name in prompt": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject bare $1 in log message": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject braced numeric ${1} in log message": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject bare $name in fail message": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject bare $name in return string": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject shell fallback ${var:-fallback} in log": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject shell fallback ${var:-fallback} in fail": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject shell fallback ${var:-fallback} in prompt": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject shell fallback ${var:-fallback} in const RHS": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "shell fallback syntax (e.g. ${var:-default}) is not supported; use conditional logic or named params instead"
+  },
+  "reject shell expansion ${var:+alt} in log": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject command substitution in log": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject command substitution in logerr": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "reject shell fallback in rule log": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "nested inline capture rejected": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "invalid inline run reference bad identifier": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "match: unterminated string in pattern": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated string in match pattern"
+  },
+  "match: unterminated regex in pattern": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated regex in match pattern"
+  },
+  "match: empty regex in pattern": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "empty regex in match pattern"
+  },
+  "match: invalid regex in pattern": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "invalid regex in match pattern: /[invalid/"
+  },
+  "match: empty arm body": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "match arm body cannot be empty"
+  },
+  "match: unterminated string in arm body": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated string in match arm body"
+  },
+  "match: single-quoted pattern": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "single-quoted strings are not supported; use double quotes (\"...\") instead"
+  },
+  "match: single-quoted arm body": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "single-quoted strings are not supported; use double quotes (\"...\") instead"
+  },
+  "match: missing arrow after pattern": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "expected \"=>\" after match pattern"
+  },
+  "run async without parentheses requires parens": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "run async must target a valid reference: run async ref() or run async ref(args) — parentheses are required"
+  },
+  "log format not double-quoted": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "log must match: log \"<message>\" or log <identifier>"
+  },
+  "unterminated log string": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "multiline strings use triple quotes: log \"\"\"...\"\"\""
+  },
+  "logerr format not double-quoted": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "logerr must match: logerr \"<message>\" or logerr <identifier>"
+  },
+  "unterminated logerr string": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "multiline strings use triple quotes: logerr \"\"\"...\"\"\""
+  },
+  "invalid workflow reference in channel route": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "invalid workflow reference in channel route: \"123bad\""
+  },
+  "route inside workflow body is parse error": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "route declarations belong at the top level: channel findings -> analyst"
+  },
+  "if keyword in workflow with args produces error": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "invalid if syntax; expected: if <identifier> <op> <operand> { ... } where op is ==, !=, =~, or !~ and operand is \"string\" or /regex/"
+  },
+  "brace-if: wait in rules": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "\"wait\" has been removed from the language"
+  },
+  "brace-if: prompt in rules": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "prompt is not allowed in rules"
+  },
+  "brace-if: send in rules": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "send operator is not allowed in rules"
+  },
+  "if keyword with else branch produces error": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "invalid if syntax; expected: if <identifier> <op> <operand> { ... } where op is ==, !=, =~, or !~ and operand is \"string\" or /regex/"
+  },
+  "brace-if: const prompt in rules": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "const ... = prompt is not allowed in rules"
+  },
+  "unterminated script block": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated fenced block: no closing ``` before end of file"
+  },
+  "metadata: runtime.workspace array rejected (single-quoted element)": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unknown config key: runtime.workspace. Allowed: agent.default_model, agent.command, agent.backend, agent.trusted_workspace, agent.cursor_flags, agent.claude_flags, run.logs_dir, run.debug, run.recover_limit, runtime.docker_image, runtime.docker_network, runtime.docker_timeout_seconds, module.name, module.version, module.description"
+  },
+  "metadata: runtime.workspace array rejected (unquoted element)": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unknown config key: runtime.workspace. Allowed: agent.default_model, agent.command, agent.backend, agent.trusted_workspace, agent.cursor_flags, agent.claude_flags, run.logs_dir, run.debug, run.recover_limit, runtime.docker_image, runtime.docker_network, runtime.docker_timeout_seconds, module.name, module.version, module.description"
+  },
+  "metadata: runtime.workspace array rejected (unclosed)": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unknown config key: runtime.workspace. Allowed: agent.default_model, agent.command, agent.backend, agent.trusted_workspace, agent.cursor_flags, agent.claude_flags, run.logs_dir, run.debug, run.recover_limit, runtime.docker_image, runtime.docker_network, runtime.docker_timeout_seconds, module.name, module.version, module.description"
+  },
+  "unterminated test block": {
+    "file": "input.test.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated test block: broken test"
+  },
+  "mock function deprecated": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "\"mock function\" is no longer supported; use \"mock script\""
+  },
+  "send rhs: unterminated braced interpolation": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 12,
+    "code": "E_PARSE",
+    "message": "unterminated ${...} in send right-hand side"
+  },
+  "send rhs: command substitution inside braced interpolation": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 12,
+    "code": "E_PARSE",
+    "message": "send right-hand side must be a quoted string (\"...\"), a variable ($name or ${...}), or \"run <ref> [args]\" — not raw shell; use a script or use const"
+  },
+  "inline script: unexpected content after": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unexpected content after anonymous inline script: 'extra_stuff'"
+  },
+  "inline script: unterminated parentheses": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "run must target a valid reference: run ref() or run ref(args) — parentheses are required"
+  },
+  "inline script without parentheses": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "run must target a valid reference: run ref() or run ref(args) — parentheses are required"
+  },
+  "old inline script empty body rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "inline script syntax has changed: use run `body`(args) instead of run script(args) \"body\""
+  },
+  "inline script unterminated backtick": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unterminated inline script backtick — missing closing `"
+  },
+  "match: invalid pattern type": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "match pattern must be a string literal (\"...\"), regex (/…/), or wildcard (_)"
+  },
+  "match: unterminated match block": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated match block"
+  },
+  "match: empty match block": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "match must have at least one arm"
+  },
+  "catch: fail without double quote": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "fail must match: fail \"<reason>\" or fail \"\"\"...\"\"\""
+  },
+  "catch: unterminated fail string": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "multiline strings use triple quotes: fail \"\"\"...\"\"\""
+  },
+  "catch: log without double quote": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "log must match: log \"<message>\" or log <identifier>"
+  },
+  "catch: unterminated log string": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "multiline strings use triple quotes: log \"\"\"...\"\"\""
+  },
+  "catch: logerr without double quote": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "logerr must match: logerr \"<message>\" or logerr <identifier>"
+  },
+  "catch: unterminated logerr string": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "multiline strings use triple quotes: logerr \"\"\"...\"\"\""
+  },
+  "test: empty mock prompt block": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "mock prompt block must have at least one arm"
+  },
+  "test: unterminated mock block": {
+    "file": "input.test.jh",
+    "line": 5,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated mock block"
+  },
+  "test: mock prompt invalid format": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 2,
+    "code": "E_PARSE",
+    "message": "mock prompt must be: mock prompt \"<response>\", mock prompt <const_name>, or mock prompt { \"pattern\" => \"response\", _ => \"default\" }"
+  },
+  "test: mock workflow with invalid ref (no parens)": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unrecognized test step: mock workflow a.b.c {"
+  },
+  "test: mock rule with invalid ref (no parens)": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unrecognized test step: mock rule a.b.c {"
+  },
+  "test: mock script with invalid ref (no parens)": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unrecognized test step: mock script a.b.c {"
+  },
+  "run async without parens in workflow requires parens": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "run async must target a valid reference: run async ref() or run async ref(args) — parentheses are required"
+  },
+  "config block with content on same line as opening": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "config block must be exactly 'config {' on its own line"
+  },
+  "unterminated string in top-level const": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "multiline strings use triple quotes: const name = \"\"\"...\"\"\"\""
+  },
+  "top-level const with trailing content after quote": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after closing quote in const declaration"
+  },
+  "top-level const single-quoted string": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "single-quoted strings are not supported; use double quotes (\"...\") instead"
+  },
+  "workflow const with command substitution": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "const value cannot use command substitution \"$(...)\"; use a script and const name = run ref"
+  },
+  "workflow const with bash percent expansion": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "const value cannot use ${var%%...} expansion; use a script"
+  },
+  "workflow const with bash replace expansion": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "const value cannot use ${var//...} expansion; use a script"
+  },
+  "workflow const with bash length expansion": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "const value cannot use ${#var}; use a script"
+  },
+  "workflow const with shell fallback": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "shell fallback syntax (e.g. ${var:-default}) is not supported; use conditional logic or named params instead"
+  },
+  "run without parentheses in workflow requires parens": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "run must target a valid reference: run ref() or run ref(args) — parentheses are required"
+  },
+  "return with single-quoted string": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "single-quoted strings are not supported; use double quotes (\"...\") instead"
+  },
+  "capture and send combined in workflow body": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "if keyword at top of workflow produces error": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "invalid if syntax; expected: if <identifier> <op> <operand> { ... } where op is ==, !=, =~, or !~ and operand is \"string\" or /regex/"
+  },
+  "capture run without parentheses requires const": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "assignment without \"const\" is no longer supported; use \"const x = run helper\""
+  },
+  "const run without parentheses requires parens": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "const ... = run must target a valid reference"
+  },
+  "const ensure without parentheses requires parens": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "const ... = ensure must target a valid reference"
+  },
+  "triple-backtick prompt is rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "prompt blocks use triple quotes: prompt \"\"\"...\"\"\"; triple backticks are for scripts"
+  },
+  "unterminated triple-quoted prompt block": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated triple-quoted block: no closing \"\"\" before end of file"
+  },
+  "script with returns on closing fence rejected": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after closing fence: 'returns \"{ x: string }\"'"
+  },
+  "script with double-quoted body rejected": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "script bodies use backticks: script broken = `...`"
+  },
+  "script body with Jaiph interpolation rejected": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "script bodies cannot contain Jaiph interpolation (${name}); use $1, $2 positional arguments instead"
+  },
+  "script with brace-style body rejected": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "brace-style script bodies are no longer supported; use: script name = `...` or script name = ```...```"
+  },
+  "script body with bare identifier rejected": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "script bodies must be backtick or fenced block: script broken = `...` or script broken = ```...```"
+  },
+  "script body with trailing content after backtick": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after script body backtick: 'extra'"
+  },
+  "inline script fenced without argument list": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "anonymous inline script requires argument list after closing fence: ```(args) or ```()"
+  },
+  "inline script fenced with shebang and lang tag conflict": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "fence tag \"node\" already sets the shebang — remove the manual \"#!\" line"
+  },
+  "inline script fenced unterminated in workflow": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated fenced block: no closing ``` before end of file"
+  },
+  "inline script single backtick without argument list": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "anonymous inline script requires argument list after closing backtick: `body`(args) or `body`()"
+  },
+  "inline script fenced with invalid lang token": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "invalid opening fence: only a single lang token is allowed after ```"
+  },
+  "config block unterminated": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "config block not closed with '}'"
+  },
+  "config block with trailing content after close brace": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "config block must be exactly 'config {' on its own line"
+  },
+  "match subject with dollar prefix rejected": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "match subject should be a bare identifier: match varName { ... }"
+  },
+  "match subject with invalid identifier": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "match subject must be a valid identifier, got: 123"
+  },
+  "const run with invalid reference": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "const ... = run must target a valid reference"
+  },
+  "const ensure with invalid reference": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "const ... = ensure must target a valid reference"
+  },
+  "const ensure cannot use catch": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "const ... = ensure cannot use catch"
+  },
+  "run with invalid reference in workflow": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "run must target a valid reference: run ref() or run ref(args) — parentheses are required"
+  },
+  "run async with invalid reference in workflow": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "run async must target a valid reference: run async ref() or run async ref(args) — parentheses are required"
+  },
+  "empty parameter name in parameter list": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "empty parameter name in parameter list"
+  },
+  "invalid parameter name in workflow": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "invalid parameter name \"123bad\"; must be an identifier"
+  },
+  "duplicate parameter name in workflow": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "duplicate parameter name \"a\""
+  },
+  "send with unterminated string": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 12,
+    "code": "E_PARSE",
+    "message": "multiline strings use triple quotes: channel <- \"\"\"...\"\"\""
+  },
+  "triple-quote opening with content on same line": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "opening \"\"\" must not have content on the same line"
+  },
+  "log with trailing content after string": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unexpected content after log string: 'extra'"
+  },
+  "logerr with trailing content after string": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unexpected content after logerr string: 'extra'"
+  },
+  "catch: prompt capture without const": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "use \"const name = prompt ...\" to capture the prompt result (e.g. const answer = prompt \"...\" )"
+  },
+  "top-level const triple-quote with trailing content after close": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after closing \"\"\" in const declaration"
+  },
+  "unterminated return string in workflow": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "multiline strings use triple quotes: return \"\"\"...\"\"\""
+  },
+  "unterminated fail string in workflow": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "multiline strings use triple quotes: fail \"\"\"...\"\"\""
+  },
+  "if keyword after other steps produces error": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "invalid if syntax; expected: if <identifier> <op> <operand> { ... } where op is ==, !=, =~, or !~ and operand is \"string\" or /regex/"
+  },
+  "prompt assign without const in workflow": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "use \"const name = prompt ...\" to capture the prompt result (e.g. const answer = prompt \"...\" )"
+  },
+  "fail without double quote in workflow body": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "fail must match: fail \"<reason>\" or fail \"\"\"...\"\"\""
+  },
+  "unterminated multiline catch block": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 18,
+    "code": "E_PARSE",
+    "message": "unterminated catch block, expected \"}\""
+  },
+  "duplicate name: rule and workflow": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "duplicate name \"foo\" — channels, rules, workflows, and scripts share a single namespace (already declared as rule)"
+  },
+  "duplicate name: script and workflow": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "duplicate name \"helper\" — channels, rules, workflows, and scripts share a single namespace (already declared as script)"
+  },
+  "duplicate name: rule and script": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "duplicate name \"foo\" — channels, rules, workflows, and scripts share a single namespace (already declared as rule)"
+  },
+  "channel route with no target after arrow": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "channel route requires at least one target workflow after ->"
+  },
+  "empty multiline catch block": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 18,
+    "code": "E_PARSE",
+    "message": "catch block must contain at least one statement"
+  },
+  "ensure with invalid reference": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "ensure must target a valid reference: ensure ref() or ensure ref(args) — parentheses are required"
+  },
+  "config line without equals sign": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "config line must be key = value: agent.backend"
+  },
+  "prompt with trailing non-returns content": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "after prompt string expected keyword \"returns\" with quoted schema (e.g. returns \"{ type: string }\") or end of line"
+  },
+  "prompt returns with single-quoted schema": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "single-quoted strings are not supported; use double quotes (\"...\") instead"
+  },
+  "unterminated returns schema string": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated returns schema string"
+  },
+  "test block without opening brace": {
+    "file": "input.test.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "test block must match: test \"description\" {"
+  },
+  "send with trailing content after string": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 12,
+    "code": "E_PARSE",
+    "message": "send right-hand side must be a quoted string (\"...\"), a variable ($name or ${...}), or \"run <ref> [args]\" — not raw shell; use a script or use const"
+  },
+  "capture run with invalid reference in workflow": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "assignment without \"const\" is no longer supported; use \"const x = run 123bad\""
+  },
+  "fenced script with shell parameter expansion is valid": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "empty inline catch block": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 18,
+    "code": "E_PARSE",
+    "message": "catch block must contain at least one statement"
+  },
+  "test: old camelCase expectContain rejected": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "camelCase assertions are no longer supported; use \"expect_contain\""
+  },
+  "test: old camelCase expectNotContain rejected": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "camelCase assertions are no longer supported; use \"expect_not_contain\""
+  },
+  "test: old camelCase expectEqual rejected": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "camelCase assertions are no longer supported; use \"expect_equal\""
+  },
+  "test: bare assignment without const/run rejected": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "use \"const out = run lib.default(…)\" to capture workflow output"
+  },
+  "test: bare workflow call without run rejected": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "use \"run lib.default(…)\" to call a workflow in tests"
+  },
+  "test: mock workflow without parens rejected": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "mock workflow requires parentheses: mock workflow lib.default() { … }"
+  },
+  "test: mock rule without parens rejected": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "mock rule requires parentheses: mock rule lib.check() { … }"
+  },
+  "test: mock script without parens rejected": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "mock script requires parentheses: mock script lib.helper() { … }"
+  },
+  "test: unrecognized line is E_PARSE": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unrecognized test step: echo \"not valid\""
+  },
+  "ensure catch with unterminated bindings paren": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 18,
+    "code": "E_PARSE",
+    "message": "unterminated catch bindings: expected \")\""
+  },
+  "ensure catch with empty bindings": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 18,
+    "code": "E_PARSE",
+    "message": "catch requires exactly one binding: catch (<name>) { ... }"
+  },
+  "ensure catch with invalid binding name": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 18,
+    "code": "E_PARSE",
+    "message": "invalid catch binding name: \"123bad\" — must be a valid identifier"
+  },
+  "ensure catch with no body after bindings": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 18,
+    "code": "E_PARSE",
+    "message": "catch requires a body after bindings"
+  },
+  "run catch with unterminated bindings paren": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 16,
+    "code": "E_PARSE",
+    "message": "unterminated catch bindings: expected \")\""
+  },
+  "run catch with empty bindings": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 16,
+    "code": "E_PARSE",
+    "message": "catch requires exactly one binding: catch (<name>) { ... }"
+  },
+  "run catch with invalid binding name": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 16,
+    "code": "E_PARSE",
+    "message": "invalid catch binding name: \"123bad\" — must be a valid identifier"
+  },
+  "run catch with no body after bindings": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 16,
+    "code": "E_PARSE",
+    "message": "catch requires a body after bindings"
+  },
+  "ensure catch with multiple bindings rejected": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 18,
+    "code": "E_PARSE",
+    "message": "catch accepts exactly one binding: catch (<name>) — the second binding (attempt) has been removed"
+  },
+  "run catch with multiple bindings rejected": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 16,
+    "code": "E_PARSE",
+    "message": "catch accepts exactly one binding: catch (<name>) — the second binding (attempt) has been removed"
+  },
+  "inline catch fail without double quote": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "fail must match: fail \"<reason>\" or fail \"\"\"...\"\"\""
+  },
+  "inline catch unterminated fail string": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "multiline strings use triple quotes: fail \"\"\"...\"\"\""
+  },
+  "inline config block missing equals sign": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "config block must be exactly 'config {' on its own line"
+  },
+  "inline config block with unknown key": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "config block must be exactly 'config {' on its own line"
+  },
+  "inline config block rejects runtime.workspace (array opening)": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "config block must be exactly 'config {' on its own line"
+  },
+  "inline config block rejects runtime.workspace (non-empty array)": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "config block must be exactly 'config {' on its own line"
+  },
+  "config block header not exactly config brace": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "config block must be exactly 'config {' on its own line"
+  },
+  "config value with single-quoted string": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "single-quoted strings are not supported; use double quotes (\"...\") instead"
+  },
+  "workflow body content after brace without closing on same line": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "expected newline after '{'"
+  },
+  "runtime keys in inline workflow config": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "expected newline after '{'"
+  },
+  "rule body content after brace without closing on same line": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "expected newline after '{'"
+  },
+  "prompt triple-quote closing with invalid trailing content": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "closing \"\"\" must be alone, or followed by returns \"{ ... }\" (same line)"
+  },
+  "prompt identifier body with single-quoted returns": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "single-quoted strings are not supported; use double quotes (\"...\") instead"
+  },
+  "prompt identifier body with non-returns trailing content": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "after prompt body expected keyword \"returns\" with quoted schema (e.g. returns \"{ type: string }\") or end of line"
+  },
+  "prompt identifier body with unterminated returns schema": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated returns schema string"
+  },
+  "script body with invalid rhs character": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "script body must be a backtick or fenced block: script broken = `...` or script broken = ```...```"
+  },
+  "match triple-quote arm closing with trailing content": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "closing \"\"\" in match arm must not have content on the same line"
+  },
+  "match: opening triple-quote in arm with content on same line": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "opening \"\"\" in match arm must not have content on the same line"
+  },
+  "match: unterminated triple-quoted block in arm": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated triple-quoted block in match arm: no closing \"\"\" before end of match"
+  },
+  "send with empty payload rejected": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 12,
+    "code": "E_PARSE",
+    "message": "send requires an explicit payload: channel <- \"message\" — bare forward syntax (channel <-) has been removed"
+  },
+  "config after semicolon-separated steps in workflow": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "unexpected content after log string: '; config { agent.backend = \"claude\" }'"
+  },
+  "mock prompt single-quoted string rejected": {
+    "file": "input.test.jh",
+    "line": 4,
+    "col": 2,
+    "code": "E_PARSE",
+    "message": "single-quoted strings are not supported; use double quotes (\"...\") instead"
+  },
+  "wait in catch block rejected": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "\"wait\" has been removed from the language"
+  },
+  "reserved keyword as parameter name": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "parameter name \"run\" is a reserved keyword"
+  },
+  "log triple-quote with trailing content": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after closing \"\"\""
+  },
+  "logerr triple-quote with trailing content": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after closing \"\"\""
+  },
+  "fail triple-quote with trailing content": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after closing \"\"\""
+  },
+  "return triple-quote with trailing content": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after closing \"\"\""
+  },
+  "send triple-quote with trailing content": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after closing \"\"\""
+  },
+  "wait in inline catch statement": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "\"wait\" has been removed from the language"
+  },
+  "catch block: assignment without const rejected": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "assignment without \"const\" is no longer supported; use \"const x = run helper()\""
+  },
+  "catch block: prompt assign without const": {
+    "file": "input.jh",
+    "line": 6,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "use \"const name = prompt ...\" to capture the prompt result (e.g. const answer = prompt \"...\" )"
+  },
+  "const run with old inline script syntax": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "inline script syntax has changed: use const name = run `body`(args) instead of run script(args) \"body\""
+  },
+  "top-level const with invalid name": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unsupported top-level statement: const 123bad = \"hello\""
+  },
+  "wait in workflow body rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "\"wait\" has been removed from the language"
+  },
+  "wait in workflow body after other steps rejected": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "\"wait\" has been removed from the language"
+  },
+  "shell redirection after const run call rejected": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after run call: '| grep ok'; shell redirection (>, |, &) is not supported — use a script block"
+  },
+  "shell redirection after send run call rejected": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after run call: '> output.txt'; shell redirection (>, |, &) is not supported — use a script block"
+  },
+  "prompt body must be string or identifier not number": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "prompt body must be a quoted string, identifier, or triple-quoted block: const name = prompt \"text\" | prompt myVar | prompt \"\"\" ... \"\"\""
+  },
+  "send rhs trailing content after braced var": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 12,
+    "code": "E_PARSE",
+    "message": "send right-hand side must be a quoted string (\"...\"), a variable ($name or ${...}), or \"run <ref> [args]\" — not raw shell; use a script or use const"
+  },
+  "config string key with boolean value": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "agent.default_model must be a string"
+  },
+  "config boolean key with string value": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "run.debug must be true or false"
+  },
+  "config keyword alone on a line": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unsupported top-level statement: config"
+  },
+  "send multiline string without triple quotes": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "multiline strings use triple quotes: channel <- \"\"\"...\"\"\""
+  },
+  "send triple-quoted payload valid": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "top-level script single backtick unterminated": {
+    "file": "input.jh",
+    "line": 1,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated inline script backtick — missing closing `"
+  },
+  "inline catch return without value": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 18,
+    "code": "E_PARSE",
+    "message": "catch requires explicit bindings: catch (<name>) { ... }"
+  },
+  "run catch unterminated multiline block": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 16,
+    "code": "E_PARSE",
+    "message": "unterminated catch block, expected \"}\""
+  },
+  "ensure catch unterminated multiline block": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 18,
+    "code": "E_PARSE",
+    "message": "unterminated catch block, expected \"}\""
+  },
+  "inline script fenced unterminated in rule body": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated fenced block: no closing ``` before end of file"
+  },
+  "fail triple-quote opening with content on same line": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "opening \"\"\" must not have content on the same line"
+  },
+  "return triple-quote opening with content on same line": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "opening \"\"\" must not have content on the same line"
+  },
+  "logerr triple-quote opening with content on same line": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "opening \"\"\" must not have content on the same line"
+  },
+  "unterminated triple-quoted send block": {
+    "file": "input.jh",
+    "line": 3,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated triple-quoted block: no closing \"\"\" before end of file"
+  },
+  "run catch without bindings bare catch block": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 16,
+    "code": "E_PARSE",
+    "message": "catch requires explicit bindings: catch (<name>) { ... }"
+  },
+  "log triple-quote opening with content on same line": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "opening \"\"\" must not have content on the same line"
+  },
+  "const triple-quote opening with content on same line": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "opening \"\"\" must not have content on the same line"
+  },
+  "unterminated triple-quoted log block": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated triple-quoted block: no closing \"\"\" before end of file"
+  },
+  "unterminated triple-quoted fail block": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated triple-quoted block: no closing \"\"\" before end of file"
+  },
+  "unterminated triple-quoted return block": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated triple-quoted block: no closing \"\"\" before end of file"
+  },
+  "unterminated triple-quoted const block": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unterminated triple-quoted block: no closing \"\"\" before end of file"
+  },
+  "inline run catch with single fail statement": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "send rhs with run to workflow": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "send rhs with run to script": {
+    "file": "<no-error>",
+    "line": 0,
+    "col": 0,
+    "code": "OK",
+    "message": "compilation succeeded but fixture expected a parse error"
+  },
+  "return with bash exit code rejected in workflow": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "bash exit codes are only valid in scripts; use return \"...\" for a workflow value"
+  },
+  "return with bash dollar-question rejected in workflow": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "bash exit codes are only valid in scripts; use return \"...\" for a workflow value"
+  },
+  "if equality operator with regex operand rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "operator \"==\" requires a string operand (\"...\"), not a regex"
+  },
+  "if inequality operator with regex operand rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "operator \"!=\" requires a string operand (\"...\"), not a regex"
+  },
+  "if regex-match operator with string operand rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "operator \"=~\" requires a regex operand (/pattern/), not a string"
+  },
+  "if negative regex-match operator with string operand rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "operator \"!~\" requires a regex operand (/pattern/), not a string"
+  },
+  "const run async with inline script rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "run async is not supported with inline scripts"
+  },
+  "const run async with invalid reference": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 13,
+    "code": "E_PARSE",
+    "message": "const ... = run async must target a valid reference"
+  },
+  "if/else on its own line without preceding closing brace": {
+    "file": "input.jh",
+    "line": 5,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "\"else\" must appear on the same line as the closing \"}\" of an \"if\" block (e.g., \"} else {\")"
+  },
+  "if/else without preceding if": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 3,
+    "code": "E_PARSE",
+    "message": "\"else\" must appear on the same line as the closing \"}\" of an \"if\" block (e.g., \"} else {\")"
+  },
+  "if/else if chaining not supported": {
+    "file": "input.jh",
+    "line": 4,
+    "col": 5,
+    "code": "E_PARSE",
+    "message": "\"else if\" chaining is not supported; nest an \"if\" inside the \"else\" block, or use \"match\" for multi-way branching"
+  },
+  "inline script recover and catch on same step rejected": {
+    "file": "input.jh",
+    "line": 2,
+    "col": 1,
+    "code": "E_PARSE",
+    "message": "unexpected content after log string: '} catch (e) { log \"c\"'"
+  }
+}
diff --git a/test-fixtures/compiler-txtar/parse-errors.txt b/test-fixtures/compiler-txtar/parse-errors.txt
index 35f01712..77a3b9a0 100644
--- a/test-fixtures/compiler-txtar/parse-errors.txt
+++ b/test-fixtures/compiler-txtar/parse-errors.txt
@@ -919,7 +919,9 @@ workflow default() {
 }
 
 === catch: fail without double quote
-# @expect error E_PARSE "fail must match" @5:1
+# Body parsing unified with parseBlockStatement (Refactor 2). Error now points
+# to the inner statement's actual line/col.
+# @expect error E_PARSE "fail must match" @6:5
 --- input.jh
 rule check() {
   return "ok"
@@ -931,7 +933,7 @@ workflow default() {
 }
 
 === catch: unterminated fail string
-# @expect error E_PARSE "unterminated fail string" @5:1
+# @expect error E_PARSE "multiline strings use triple quotes: fail" @6:5
 --- input.jh
 rule check() {
   return "ok"
@@ -943,7 +945,7 @@ workflow default() {
 }
 
 === catch: log without double quote
-# @expect error E_PARSE "log must match" @5:1
+# @expect error E_PARSE "log must match" @6:5
 --- input.jh
 rule check() {
   return "ok"
@@ -955,7 +957,7 @@ workflow default() {
 }
 
 === catch: unterminated log string
-# @expect error E_PARSE "unterminated log string" @5:1
+# @expect error E_PARSE "multiline strings use triple quotes: log" @6:5
 --- input.jh
 rule check() {
   return "ok"
@@ -967,7 +969,7 @@ workflow default() {
 }
 
 === catch: logerr without double quote
-# @expect error E_PARSE "logerr must match" @5:1
+# @expect error E_PARSE "logerr must match" @6:5
 --- input.jh
 rule check() {
   return "ok"
@@ -979,7 +981,7 @@ workflow default() {
 }
 
 === catch: unterminated logerr string
-# @expect error E_PARSE "unterminated logerr string" @5:1
+# @expect error E_PARSE "multiline strings use triple quotes: logerr" @6:5
 --- input.jh
 rule check() {
   return "ok"
@@ -1439,7 +1441,7 @@ workflow default() {
 }
 
 === catch: prompt capture without const
-# @expect error E_PARSE "const name = prompt" @5:1
+# @expect error E_PARSE "const name = prompt" @6:5
 --- input.jh
 rule check() {
   return "ok"
@@ -1899,7 +1901,7 @@ workflow default() {
 }
 
 === inline catch unterminated fail string
-# @expect error E_PARSE "unterminated fail string"
+# @expect error E_PARSE "multiline strings use triple quotes: fail"
 --- input.jh
 rule check() {
   return "ok"
@@ -2522,3 +2524,44 @@ workflow default() {
   const x = run async 123bad()
 }
 
+=== if/else on its own line without preceding closing brace
+# @expect error E_PARSE "must appear on the same line as the closing" @5:3
+--- input.jh
+workflow default(x) {
+  if x == "y" {
+    log "yes"
+  }
+  else {
+    log "no"
+  }
+}
+
+=== if/else without preceding if
+# @expect error E_PARSE "must appear on the same line as the closing" @2:3
+--- input.jh
+workflow default() {
+  else {
+    log "no"
+  }
+}
+
+=== if/else if chaining not supported
+# @expect error E_PARSE "chaining is not supported" @4:5
+--- input.jh
+workflow default(x) {
+  if x == "a" {
+    log "a"
+  } else if x == "b" {
+    log "b"
+  } else {
+    log "c"
+  }
+}
+
+
+=== inline script recover and catch on same step rejected
+# @expect error E_PARSE "unexpected content after log string"
+--- input.jh
+workflow default() {
+  run `false`() recover(e) { log "r" } catch (e) { log "c" }
+}
diff --git a/test-fixtures/compiler-txtar/valid.txt b/test-fixtures/compiler-txtar/valid.txt
index 06dedd39..d9699a41 100644
--- a/test-fixtures/compiler-txtar/valid.txt
+++ b/test-fixtures/compiler-txtar/valid.txt
@@ -288,7 +288,7 @@ workflow other_wf(a, b) {
   log "ok"
 }
 workflow default() {
-  run async other_wf("hello" "$x")
+  run async other_wf("hello", "$x")
 }
 
 === run async with qualified ref
@@ -1172,3 +1172,162 @@ workflow default() {
 workflow default(name) {
   return name
 }
+
+=== if/else in workflow
+# @expect ok
+--- input.jh
+workflow default(status) {
+  if status == "ok" {
+    log "healthy"
+  } else {
+    logerr "unhealthy: ${status}"
+  }
+}
+
+=== if/else in rule
+# @expect ok
+--- input.jh
+rule check(value) {
+  if value == "" {
+    fail "value required"
+  } else {
+    log "value: ${value}"
+  }
+}
+
+workflow default(value) {
+  ensure check(value)
+}
+
+=== if/else nested if in else block
+# @expect ok
+--- input.jh
+workflow default(mode) {
+  if mode == "fast" {
+    log "fast path"
+  } else {
+    if mode == "slow" {
+      log "slow path"
+    } else {
+      log "default path"
+    }
+  }
+}
+
+=== inline script catch in workflow
+# @expect ok
+--- input.jh
+workflow default() {
+  run `false`() catch (err) {
+    log "caught: ${err}"
+  }
+}
+
+=== inline script recover in workflow
+# @expect ok
+--- input.jh
+workflow default() {
+  run `test -f .gate`() recover(err) {
+    run `touch .gate`()
+  }
+}
+
+=== inline script catch in rule
+# @expect ok
+--- input.jh
+script noop = `true`
+rule check() {
+  run `false`() catch (err) {
+    run noop()
+  }
+}
+workflow default() {
+  ensure check()
+}
+
+=== inline script recover in rule
+# @expect ok
+--- input.jh
+script noop = `true`
+rule check() {
+  run `test -f .gate`() recover(err) {
+    run noop()
+  }
+}
+workflow default() {
+  ensure check()
+}
+
+=== fenced inline script catch in workflow
+# @expect ok
+--- input.jh
+workflow default() {
+  run ```
+exit 1
+```() catch (err) {
+    log "fenced caught: ${err}"
+  }
+}
+
+=== inline script with args and catch
+# @expect ok
+--- input.jh
+workflow default() {
+  run `false $1`("x") catch (err) {
+    log "caught: ${err}"
+  }
+}
+
+=== inline script catch single-statement body
+# @expect ok
+--- input.jh
+workflow default() {
+  run `false`() catch (err) log "recovered: ${err}"
+}
+
+=== if with dot-notation subject on typed prompt capture
+# @expect ok
+--- input.jh
+workflow default() {
+  const r = prompt "Classify" returns "{ verdict: string }"
+  if r.verdict == "ok" {
+    log "approved"
+  }
+}
+
+=== match with dot-notation subject on typed prompt capture
+# @expect ok
+--- input.jh
+workflow default() {
+  const r = prompt "Classify" returns "{ verdict: string }"
+  const x = match r.verdict {
+    "ok" => "approved"
+    _ => "rejected"
+  }
+  log "${x}"
+}
+
+=== test file: mock prompt block and queued mock prompt in separate test blocks
+# @expect ok
+--- input.test.jh
+import "lib.jh" as m
+
+test "uses pattern-dispatch mock" {
+  mock prompt {
+    /hi/ => "hello"
+    _ => "default"
+  }
+  const response = run m.ask()
+  expect_contain response "hello"
+}
+
+test "uses queue-style mock" {
+  mock prompt "queued"
+  const response = run m.ask()
+  expect_contain response "queued"
+}
+--- lib.jh
+workflow ask() {
+  const r = prompt "say hi"
+  return r
+}
diff --git a/test-fixtures/compiler-txtar/validate-diagnostics-snapshot.json b/test-fixtures/compiler-txtar/validate-diagnostics-snapshot.json
new file mode 100644
index 00000000..7a534620
--- /dev/null
+++ b/test-fixtures/compiler-txtar/validate-diagnostics-snapshot.json
@@ -0,0 +1,1053 @@
+{
+  "validate-errors.txt > unknown local rule reference": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown local rule reference \"missing_rule\""
+    }
+  ],
+  "validate-errors.txt > unknown local workflow or script reference in run": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown local workflow or script reference \"missing_workflow\""
+    }
+  ],
+  "validate-errors.txt > unknown local channel in send": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 1,
+      "code": "E_VALIDATE",
+      "message": "Channel \"typo\" is not defined"
+    }
+  ],
+  "validate-errors.txt > rule with inline brace group fails shell-step ban": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "inline shell steps are forbidden in rules; use explicit script blocks"
+    }
+  ],
+  "validate-errors.txt > rule with multi-line brace group fails shell-step ban": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "inline shell steps are forbidden in rules; use explicit script blocks"
+    }
+  ],
+  "validate-errors.txt > unsupported type in returns schema": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_SCHEMA",
+      "message": "unsupported type in returns schema: \"array\" (only string, number, boolean allowed)"
+    }
+  ],
+  "validate-errors.txt > workflow raw shell that names a script must use run": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "use run f() — a bare name that refers to a script or workflow must use a managed run step"
+    }
+  ],
+  "validate-errors.txt > workflow raw shell that names a workflow must use run": [
+    {
+      "file": "input.jh",
+      "line": 6,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "use run w() — a bare name that refers to a script or workflow must use a managed run step"
+    }
+  ],
+  "validate-errors.txt > send RHS cannot invoke workflow via shell": [
+    {
+      "file": "input.jh",
+      "line": 7,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "workflow \"w\" must be called with run"
+    }
+  ],
+  "validate-errors.txt > bare identifier arg unknown name fails": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown identifier \"unknown_var\" used as bare argument; declare it with \"const\", use a capture, or add a workflow/rule parameter"
+    }
+  ],
+  "validate-errors.txt > run async is rejected in rules": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "run async is not allowed in rules; use it in workflows only"
+    }
+  ],
+  "validate-errors.txt > route with unknown workflow": [
+    {
+      "file": "input.jh",
+      "line": 1,
+      "col": 21,
+      "code": "E_VALIDATE",
+      "message": "unknown local workflow reference \"missing_wf\""
+    }
+  ],
+  "validate-errors.txt > route with rule ref": [
+    {
+      "file": "input.jh",
+      "line": 1,
+      "col": 21,
+      "code": "E_VALIDATE",
+      "message": "rule \"check\" must be called with ensure"
+    }
+  ],
+  "validate-errors.txt > route inside workflow body is parse error": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 1,
+      "code": "E_PARSE",
+      "message": "route declarations belong at the top level: channel findings -> analyst"
+    }
+  ],
+  "validate-errors.txt > inline run ref with unknown script": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown local workflow or script reference \"nonexistent\""
+    }
+  ],
+  "validate-errors.txt > dot field ref where var has no schema": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "${x.field}: \"x\" is not a typed prompt capture; dot notation requires a prompt with \"returns\" schema"
+    }
+  ],
+  "validate-errors.txt > dot field ref with nonexistent field in schema": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "${result.bogus}: field \"bogus\" is not defined in the returns schema for \"result\"; available fields: type, risk"
+    }
+  ],
+  "validate-errors.txt > unknown import alias in rule reference": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown import alias \"ghost\" for rule reference \"ghost.guard\""
+    }
+  ],
+  "validate-errors.txt > match: missing wildcard arm": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "match must have exactly one wildcard (_) arm"
+    }
+  ],
+  "validate-errors.txt > match: multiple wildcard arms": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "match must have exactly one wildcard (_) arm, found multiple"
+    }
+  ],
+  "validate-errors.txt > shell redirection in ensure args rejected": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 1,
+      "code": "E_PARSE",
+      "message": "unexpected content after ensure call: '| grep ok'; shell redirection (>, |, &) is not supported — use a script block"
+    }
+  ],
+  "validate-errors.txt > run in workflow targeting a rule is rejected": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "rule \"check\" must be called with ensure, not run"
+    }
+  ],
+  "validate-errors.txt > run in rule targeting a rule is rejected": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "rule \"other_rule\" must be called with ensure, not run"
+    }
+  ],
+  "validate-errors.txt > ensure rejects local script reference": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "script \"my_script\" cannot be called with ensure"
+    }
+  ],
+  "validate-errors.txt > const prompt in rules (caught at parse time)": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 13,
+      "code": "E_PARSE",
+      "message": "const ... = prompt is not allowed in rules"
+    }
+  ],
+  "validate-errors.txt > returns schema cannot be empty": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_SCHEMA",
+      "message": "returns schema cannot be empty"
+    }
+  ],
+  "validate-errors.txt > returns schema rejects array types": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_SCHEMA",
+      "message": "returns schema must be flat (no arrays or union types); only string, number, boolean allowed"
+    }
+  ],
+  "validate-errors.txt > returns schema rejects union types": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_SCHEMA",
+      "message": "returns schema must be flat (no arrays or union types); only string, number, boolean allowed"
+    }
+  ],
+  "validate-errors.txt > returns schema rejects malformed entry": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_SCHEMA",
+      "message": "invalid returns schema entry: expected \"fieldName: type\" (got badentry...)"
+    }
+  ],
+  "validate-errors.txt > returns schema rejects unsupported type": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_SCHEMA",
+      "message": "unsupported type in returns schema: \"array\" (only string, number, boolean allowed)"
+    }
+  ],
+  "validate-errors.txt > run in workflow targeting a rule via import": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "rule \"lib.check\" must be called with ensure, not run"
+    }
+  ],
+  "validate-errors.txt > ensure imported workflow requires run": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "workflow \"lib.deploy\" must be called with run"
+    }
+  ],
+  "validate-errors.txt > ensure rejects imported script": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "script \"lib.helper\" cannot be called with ensure"
+    }
+  ],
+  "validate-errors.txt > run inside rule must target script not imported workflow": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "run inside a rule must target a script, not workflow \"lib.deploy\""
+    }
+  ],
+  "validate-errors.txt > route with imported rule ref rejected": [
+    {
+      "file": "main.jh",
+      "line": 2,
+      "col": 21,
+      "code": "E_VALIDATE",
+      "message": "rule \"lib.check\" must be called with ensure"
+    }
+  ],
+  "validate-errors.txt > arity mismatch: too few args to workflow": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "workflow \"helper\" expects 2 argument(s) (a, b), but got 1"
+    }
+  ],
+  "validate-errors.txt > arity mismatch: too many args to workflow": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "workflow \"helper\" expects 1 argument(s) (a), but got 2"
+    }
+  ],
+  "validate-errors.txt > arity mismatch: zero args to workflow expecting two": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "workflow \"helper\" expects 2 argument(s) (a, b), but got 0"
+    }
+  ],
+  "validate-errors.txt > arity mismatch: too few args to rule": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "rule \"check\" expects 1 argument(s) (x), but got 0"
+    }
+  ],
+  "validate-errors.txt > route target with wrong parameter count": [
+    {
+      "file": "input.jh",
+      "line": 1,
+      "col": 21,
+      "code": "E_VALIDATE",
+      "message": "inbox route target \"handler\" must declare exactly 3 parameters (message, channel, sender), but declares 1"
+    }
+  ],
+  "validate-errors.txt > route target with zero parameters": [
+    {
+      "file": "input.jh",
+      "line": 1,
+      "col": 21,
+      "code": "E_VALIDATE",
+      "message": "inbox route target \"handler\" must declare exactly 3 parameters (message, channel, sender), but declares 0"
+    }
+  ],
+  "validate-errors.txt > inline run ref with unknown rule": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown local workflow or script reference \"nonexistent\""
+    }
+  ],
+  "validate-errors.txt > match: missing wildcard arm with single pattern": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "match must have exactly one wildcard (_) arm"
+    }
+  ],
+  "validate-errors.txt > send RHS with local rule bare ref": [
+    {
+      "file": "input.jh",
+      "line": 6,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "rule \"check\" must be called with ensure"
+    }
+  ],
+  "validate-errors.txt > shell redirection in run args rejected in rule": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 1,
+      "code": "E_PARSE",
+      "message": "unexpected content after run call: '| grep ok'; shell redirection (>, |, &) is not supported — use a script block"
+    }
+  ],
+  "validate-errors.txt > shell redirection in run args rejected in workflow": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 1,
+      "code": "E_PARSE",
+      "message": "unexpected content after run call: '> /tmp/out'; shell redirection (>, |, &) is not supported — use a script block"
+    }
+  ],
+  "validate-errors.txt > shell redirection in ensure args rejected in workflow": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 1,
+      "code": "E_PARSE",
+      "message": "unexpected content after ensure call: '| grep ok'; shell redirection (>, |, &) is not supported — use a script block"
+    }
+  ],
+  "validate-errors.txt > channel ref with unknown import alias": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 1,
+      "code": "E_VALIDATE",
+      "message": "Channel \"ghost.mychan\" is not defined"
+    }
+  ],
+  "validate-errors.txt > imported route target with wrong parameter count": [
+    {
+      "file": "main.jh",
+      "line": 2,
+      "col": 21,
+      "code": "E_VALIDATE",
+      "message": "inbox route target \"lib.handler\" must declare exactly 3 parameters (message, channel, sender), but declares 1"
+    }
+  ],
+  "validate-errors.txt > const run of string variable in rule rejected": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 13,
+      "code": "E_VALIDATE",
+      "message": "strings are not executable; \"name\" is a string — use a script instead"
+    }
+  ],
+  "validate-errors.txt > channel reference with three dot parts is rejected": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "invalid send: channel must be a single name or `alias.name` (at most one dot in the channel part)"
+    }
+  ],
+  "validate-errors.txt > command substitution invokes workflow in send shell RHS": [
+    {
+      "file": "input.jh",
+      "line": 6,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "command substitution cannot invoke workflow \"helper\"; use run helper ... in a workflow step"
+    }
+  ],
+  "validate-errors.txt > command substitution invokes script in send shell RHS": [
+    {
+      "file": "input.jh",
+      "line": 4,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "command substitution cannot invoke script \"helper\"; use run helper ... for managed calls (or use pure shell inside $(...))"
+    }
+  ],
+  "validate-errors.txt > scripts are not values in rule const": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "scripts are not values; \"helper\" is a script definition"
+    }
+  ],
+  "validate-errors.txt > scripts are not values in workflow const": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "scripts are not values; \"helper\" is a script definition"
+    }
+  ],
+  "validate-errors.txt > scripts are not promptable in workflow": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "scripts are not promptable; \"helper\" is a script — use a string const instead"
+    }
+  ],
+  "validate-errors.txt > scripts cannot be interpolated in log": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "scripts cannot be interpolated; \"helper\" is a script definition"
+    }
+  ],
+  "validate-errors.txt > match arm body cannot start with return": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "match arm body must not start with \"return\"; the match expression itself produces the value — use the expression directly after =>"
+    }
+  ],
+  "validate-errors.txt > inline script in match arm body rejected": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "inline scripts are not allowed in match arm bodies; use a named script with \"run script_name(…)\" instead"
+    }
+  ],
+  "validate-errors.txt > strings are not executable in workflow run": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "strings are not executable; \"name\" is a string — use a script instead"
+    }
+  ],
+  "validate-errors.txt > match arm body cannot start with return in const context": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 13,
+      "code": "E_VALIDATE",
+      "message": "match arm body must not start with \"return\"; the match expression itself produces the value — use the expression directly after =>"
+    }
+  ],
+  "validate-errors.txt > unknown identifier in fail string": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown identifier \"ghost\" in fail; declare it with `const`, use a capture, or add a workflow parameter"
+    }
+  ],
+  "validate-errors.txt > unknown identifier in rule log string": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown identifier \"ghost\" in log; declare it with `const`, use a capture, or add a rule parameter"
+    }
+  ],
+  "validate-errors.txt > unknown identifier in send literal": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 1,
+      "code": "E_VALIDATE",
+      "message": "unknown identifier \"ghost\" in send; declare it with `const`, use a capture, or add a workflow parameter"
+    }
+  ],
+  "validate-errors.txt > send RHS with local script bare ref requires run": [
+    {
+      "file": "input.jh",
+      "line": 4,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "script \"helper\" must be called with run"
+    }
+  ],
+  "validate-errors.txt > unknown identifier in workflow logerr string": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown identifier \"ghost\" in logerr; declare it with `const`, use a capture, or add a workflow parameter"
+    }
+  ],
+  "validate-errors.txt > unknown identifier in workflow return string": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown identifier \"ghost\" in return; declare it with `const`, use a capture, or add a workflow parameter"
+    }
+  ],
+  "validate-errors.txt > scripts cannot be interpolated in logerr": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "scripts cannot be interpolated; \"helper\" is a script definition"
+    }
+  ],
+  "validate-errors.txt > scripts cannot be interpolated in fail": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "scripts cannot be interpolated; \"helper\" is a script definition"
+    }
+  ],
+  "validate-errors.txt > scripts cannot be interpolated in return": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "scripts cannot be interpolated; \"helper\" is a script definition"
+    }
+  ],
+  "validate-errors.txt > strings are not executable in workflow const run": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 13,
+      "code": "E_VALIDATE",
+      "message": "strings are not executable; \"name\" is a string — use a script instead"
+    }
+  ],
+  "validate-errors.txt > ensure rejects local workflow reference": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "workflow \"helper\" must be called with run"
+    }
+  ],
+  "validate-errors.txt > run async is rejected in rules with imported workflow": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "run async is not allowed in rules; use it in workflows only"
+    }
+  ],
+  "validate-errors.txt > scripts cannot be interpolated in send literal": [
+    {
+      "file": "input.jh",
+      "line": 4,
+      "col": 1,
+      "code": "E_VALIDATE",
+      "message": "scripts cannot be interpolated; \"helper\" is a script definition"
+    }
+  ],
+  "validate-errors.txt > unknown identifier in inline run capture in log": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown local workflow or script reference \"nonexistent_script\""
+    }
+  ],
+  "validate-errors.txt > strings are not executable in rule run": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 13,
+      "code": "E_VALIDATE",
+      "message": "strings are not executable; \"greeting\" is a string — use a script instead"
+    }
+  ],
+  "validate-errors.txt > unknown identifier in workflow log string": [
+    {
+      "file": "input.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown identifier \"ghost\" in log; declare it with `const`, use a capture, or add a workflow parameter"
+    }
+  ],
+  "validate-errors.txt > match arm body with ensure arm in const context": [],
+  "validate-errors.txt > return bare unknown identifier": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown identifier \"missing_name\" in return; declare it with `const`, use a capture, or add a workflow parameter"
+    }
+  ],
+  "validate-errors.txt > test block: expect_equal LHS variable not captured (no implicit `response`)": [
+    {
+      "file": "input.test.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "expect_equal: undefined name \"response\" (capture it first with: const response = run …)"
+    }
+  ],
+  "validate-errors.txt > test block: expect_equal RHS const reference not declared": [
+    {
+      "file": "input.test.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "expect_equal: undefined name \"expected\" (declare it earlier with: const expected = \"…\")"
+    }
+  ],
+  "validate-errors.txt > test block: mock prompt <ident> references undeclared const": [
+    {
+      "file": "input.test.jh",
+      "line": 4,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "mock prompt: undefined name \"reply\" (declare it earlier with: const reply = \"…\")"
+    }
+  ],
+  "validate-errors.txt > test block: explicit capture + const reference is valid": [],
+  "validate-errors.txt > invalid regex in if condition in workflow": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "invalid regex in if condition: /[bad(/"
+    }
+  ],
+  "validate-errors.txt > invalid regex in if condition in rule": [
+    {
+      "file": "input.jh",
+      "line": 4,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "invalid regex in if condition: /[bad(/"
+    }
+  ],
+  "validate-errors.txt > import script resolves to missing file": [
+    {
+      "file": "input.jh",
+      "line": 1,
+      "col": 1,
+      "code": "E_IMPORT_NOT_FOUND",
+      "message": "import script \"queue\" resolves to missing file \"<TMP>/missing.py\""
+    },
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown local workflow or script reference \"queue\""
+    }
+  ],
+  "validate-errors.txt > bare imported workflow as shell line must use run": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "use run lib.deploy() — \"lib.deploy\" is a valid script or workflow reference; use a managed run step"
+    }
+  ],
+  "validate-errors.txt > bare imported script as shell line must use run": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "use run lib.helper() — \"lib.helper\" is a valid script or workflow reference; use a managed run step"
+    }
+  ],
+  "validate-errors.txt > command substitution invokes rule in send shell RHS": [
+    {
+      "file": "input.jh",
+      "line": 6,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "command substitution cannot invoke rule \"check\"; use ensure check ... in a workflow step"
+    }
+  ],
+  "validate-errors.txt > command substitution contains channel send": [
+    {
+      "file": "input.jh",
+      "line": 4,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "command substitution cannot contain channel send (<-); use a workflow send step instead"
+    }
+  ],
+  "validate-errors.txt > prompt inside else block in rule": [
+    {
+      "file": "input.jh",
+      "line": 5,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "const ... = prompt is not allowed in rules"
+    }
+  ],
+  "validate-errors.txt > if dot subject where var is not a typed prompt capture": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "${r.verdict}: \"r\" is not a typed prompt capture; dot notation requires a prompt with \"returns\" schema"
+    }
+  ],
+  "validate-errors.txt > if dot subject with unknown field": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "${r.bogus}: field \"bogus\" is not defined in the returns schema for \"r\"; available fields: verdict"
+    }
+  ],
+  "validate-errors.txt > match dot subject where var is not a typed prompt capture": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 13,
+      "code": "E_VALIDATE",
+      "message": "${r.verdict}: \"r\" is not a typed prompt capture; dot notation requires a prompt with \"returns\" schema"
+    }
+  ],
+  "validate-errors.txt > match dot subject with unknown field": [
+    {
+      "file": "input.jh",
+      "line": 3,
+      "col": 13,
+      "code": "E_VALIDATE",
+      "message": "${r.bogus}: field \"bogus\" is not defined in the returns schema for \"r\"; available fields: verdict"
+    }
+  ],
+  "validate-errors.txt > test block: mix mock prompt block with queued mock prompt (block first)": [
+    {
+      "file": "input.test.jh",
+      "line": 8,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "cannot mix \"mock prompt { … }\" with queued \"mock prompt …\" in one test block; choose one style"
+    }
+  ],
+  "validate-errors.txt > test block: mix mock prompt block with queued mock prompt (queue first)": [
+    {
+      "file": "input.test.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "cannot mix \"mock prompt { … }\" with queued \"mock prompt …\" in one test block; choose one style"
+    }
+  ],
+  "validate-errors-multi-module.txt > duplicate import alias": [
+    {
+      "file": "main.jh",
+      "line": 2,
+      "col": 1,
+      "code": "E_VALIDATE",
+      "message": "duplicate import alias \"mod\""
+    },
+    {
+      "file": "main.jh",
+      "line": 5,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "imported rule \"mod.one\" does not exist"
+    }
+  ],
+  "validate-errors-multi-module.txt > imported workflow missing": [
+    {
+      "file": "main.jh",
+      "line": 4,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "imported workflow or script \"lib.missing\" does not exist"
+    }
+  ],
+  "validate-errors-multi-module.txt > send RHS with unknown imported symbol": [
+    {
+      "file": "main.jh",
+      "line": 4,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "unknown symbol \"lib.nonexistent\" in send right-hand side"
+    }
+  ],
+  "validate-errors-multi-module.txt > missing channel import fails": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 1,
+      "code": "E_VALIDATE",
+      "message": "Channel \"shared.typo\" is not defined"
+    }
+  ],
+  "validate-errors-multi-module.txt > unknown import alias in run reference": [
+    {
+      "file": "main.jh",
+      "line": 2,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "unknown import alias \"ghost\" for run target \"ghost.deploy\""
+    }
+  ],
+  "validate-errors-multi-module.txt > imported script does not exist": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "imported workflow or script \"lib.nonexistent\" does not exist"
+    }
+  ],
+  "validate-errors-multi-module.txt > run in rule targeting imported rule rejected": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "rule \"lib.other_rule\" must be called with ensure, not run"
+    }
+  ],
+  "validate-errors-multi-module.txt > import resolves to missing file": [
+    {
+      "file": "main.jh",
+      "line": 1,
+      "col": 1,
+      "code": "E_IMPORT_NOT_FOUND",
+      "message": "import \"lib\" resolves to missing file \"<TMP>/nonexistent.jh\""
+    }
+  ],
+  "validate-errors-multi-module.txt > arity mismatch on imported workflow": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "workflow \"lib.helper\" expects 2 argument(s) (a, b), but got 1"
+    }
+  ],
+  "validate-errors-multi-module.txt > send RHS with imported script bare ref": [
+    {
+      "file": "main.jh",
+      "line": 4,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "script \"lib.helper\" must be called with run"
+    }
+  ],
+  "validate-errors-multi-module.txt > send RHS with imported rule bare ref": [
+    {
+      "file": "main.jh",
+      "line": 4,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "rule \"lib.check\" must be called with ensure"
+    }
+  ],
+  "validate-errors-multi-module.txt > imported channel name not found": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 1,
+      "code": "E_VALIDATE",
+      "message": "Channel \"lib.nonexistent_chan\" is not defined"
+    }
+  ],
+  "validate-errors-multi-module.txt > ensure non-exported rule from module with exports": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "\"private_check\" is not exported from module \"lib\""
+    }
+  ],
+  "validate-errors-multi-module.txt > run non-exported workflow from module with exports": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "\"private_wf\" is not exported from module \"lib\""
+    }
+  ],
+  "validate-errors-multi-module.txt > shell line with unknown imported symbol in workflow": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "imported workflow or script \"lib.nonexistent_thing\" does not exist"
+    }
+  ],
+  "validate-errors-multi-module.txt > run non-exported script from module with exports": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "\"private_script\" is not exported from module \"lib\""
+    }
+  ],
+  "validate-errors-multi-module.txt > send RHS with non-exported workflow bare ref": [
+    {
+      "file": "main.jh",
+      "line": 4,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "\"private_wf\" is not exported from module \"lib\""
+    }
+  ],
+  "validate-errors-multi-module.txt > arity mismatch on imported rule": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 3,
+      "code": "E_VALIDATE",
+      "message": "rule \"lib.check\" expects 2 argument(s) (a, b), but got 1"
+    }
+  ],
+  "validate-errors-multi-module.txt > send RHS with non-exported script bare ref": [
+    {
+      "file": "main.jh",
+      "line": 4,
+      "col": 5,
+      "code": "E_VALIDATE",
+      "message": "\"private_script\" is not exported from module \"lib\""
+    }
+  ],
+  "validate-errors-multi-module.txt > const ensure on imported workflow rejected": [
+    {
+      "file": "main.jh",
+      "line": 3,
+      "col": 13,
+      "code": "E_VALIDATE",
+      "message": "workflow \"lib.deploy\" must be called with run"
+    }
+  ]
+}
diff --git a/test-fixtures/compiler-txtar/validate-errors.txt b/test-fixtures/compiler-txtar/validate-errors.txt
index 1fc4d9d8..b847d90e 100644
--- a/test-fixtures/compiler-txtar/validate-errors.txt
+++ b/test-fixtures/compiler-txtar/validate-errors.txt
@@ -919,3 +919,101 @@ workflow default() {
   c <- $(d <- "x")
 }
 
+=== prompt inside else block in rule
+# @expect error E_VALIDATE "const ... = prompt is not allowed in rules" @5:5
+--- input.jh
+rule check(value) {
+  if value == "" {
+    fail "value required"
+  } else {
+    const answer = prompt "what next?"
+  }
+}
+workflow default(value) {
+  ensure check(value)
+}
+
+=== if dot subject where var is not a typed prompt capture
+# @expect error E_VALIDATE "not a typed prompt capture" @3:3
+--- input.jh
+workflow default() {
+  const r = "plain"
+  if r.verdict == "ok" {
+    log "ok"
+  }
+}
+
+=== if dot subject with unknown field
+# @expect error E_VALIDATE "is not defined in the returns schema" @3:3
+--- input.jh
+workflow default() {
+  const r = prompt "Classify" returns "{ verdict: string }"
+  if r.bogus == "ok" {
+    log "ok"
+  }
+}
+
+=== match dot subject where var is not a typed prompt capture
+# @expect error E_VALIDATE "not a typed prompt capture"
+--- input.jh
+workflow default() {
+  const r = "plain"
+  const x = match r.verdict {
+    "ok" => "approved"
+    _ => "rejected"
+  }
+  log "${x}"
+}
+
+=== match dot subject with unknown field
+# @expect error E_VALIDATE "is not defined in the returns schema"
+--- input.jh
+workflow default() {
+  const r = prompt "Classify" returns "{ verdict: string }"
+  const x = match r.bogus {
+    "ok" => "approved"
+    _ => "rejected"
+  }
+  log "${x}"
+}
+
+=== test block: mix mock prompt block with queued mock prompt (block first)
+# @expect error E_VALIDATE "cannot mix "mock prompt { … }" with queued "mock prompt …" in one test block; choose one style"
+--- input.test.jh
+import "lib.jh" as m
+
+test "mixed mock prompt" {
+  mock prompt {
+    /hi/ => "hello"
+    _ => "default"
+  }
+  mock prompt "queued"
+  const response = run m.ask()
+  expect_contain response "hello"
+}
+--- lib.jh
+workflow ask() {
+  const r = prompt "say hi"
+  return r
+}
+
+=== test block: mix mock prompt block with queued mock prompt (queue first)
+# @expect error E_VALIDATE "cannot mix "mock prompt { … }" with queued "mock prompt …" in one test block; choose one style"
+--- input.test.jh
+import "lib.jh" as m
+
+test "mixed mock prompt" {
+  mock prompt "queued"
+  mock prompt {
+    /hi/ => "hello"
+    _ => "default"
+  }
+  const response = run m.ask()
+  expect_contain response "hello"
+}
+--- lib.jh
+workflow ask() {
+  const r = prompt "say hi"
+  return r
+}
+
diff --git a/test-fixtures/golden-ast/expected/brace-if.json b/test-fixtures/golden-ast/expected/brace-if.json
index 1da5f6a0..7adc1c95 100644
--- a/test-fixtures/golden-ast/expected/brace-if.json
+++ b/test-fixtures/golden-ast/expected/brace-if.json
@@ -9,10 +9,13 @@
       "params": [],
       "steps": [
         {
-          "type": "run",
-          "workflow": {
-            "value": "ok_impl"
-          }
+          "body": {
+            "callee": {
+              "value": "ok_impl"
+            },
+            "kind": "call"
+          },
+          "type": "exec"
         }
       ]
     }
@@ -20,35 +23,15 @@
   "scripts": [
     {
       "body": "true",
-      "bodyKind": "backtick",
       "comments": [],
       "name": "ok_impl"
     },
     {
       "body": "printf '%s' \"$1\" > \"$2\"",
-      "bodyKind": "backtick",
       "comments": [],
       "name": "save"
     }
   ],
-  "topLevelOrder": [
-    {
-      "index": 0,
-      "kind": "rule"
-    },
-    {
-      "index": 0,
-      "kind": "script"
-    },
-    {
-      "index": 1,
-      "kind": "script"
-    },
-    {
-      "index": 0,
-      "kind": "workflow"
-    }
-  ],
   "workflows": [
     {
       "comments": [],
@@ -56,27 +39,39 @@
       "params": [],
       "steps": [
         {
+          "body": {
+            "callee": {
+              "value": "ok"
+            },
+            "kind": "ensure_call"
+          },
           "catch": {
             "bindings": {
               "failure": "err"
             },
             "block": [
               {
-                "args": "${err} \"error.log\"",
-                "bareIdentifierArgs": [
-                  "err"
-                ],
-                "type": "run",
-                "workflow": {
-                  "value": "save"
-                }
+                "body": {
+                  "args": [
+                    {
+                      "kind": "var",
+                      "name": "err"
+                    },
+                    {
+                      "kind": "literal",
+                      "raw": "\"error.log\""
+                    }
+                  ],
+                  "callee": {
+                    "value": "save"
+                  },
+                  "kind": "call"
+                },
+                "type": "exec"
               }
             ]
           },
-          "ref": {
-            "value": "ok"
-          },
-          "type": "ensure"
+          "type": "exec"
         }
       ]
     }
diff --git a/test-fixtures/golden-ast/expected/if-dot-subject.json b/test-fixtures/golden-ast/expected/if-dot-subject.json
new file mode 100644
index 00000000..767cdd3c
--- /dev/null
+++ b/test-fixtures/golden-ast/expected/if-dot-subject.json
@@ -0,0 +1,54 @@
+{
+  "channels": [],
+  "exports": [],
+  "imports": [],
+  "rules": [],
+  "scripts": [],
+  "workflows": [
+    {
+      "comments": [],
+      "name": "default",
+      "params": [],
+      "steps": [
+        {
+          "name": "r",
+          "type": "const",
+          "value": {
+            "kind": "prompt",
+            "raw": "\"Classify\"",
+            "returns": "{ verdict: string }"
+          }
+        },
+        {
+          "body": [
+            {
+              "level": "log",
+              "message": {
+                "kind": "literal",
+                "raw": "approved"
+              },
+              "type": "say"
+            }
+          ],
+          "elseBody": [
+            {
+              "level": "log",
+              "message": {
+                "kind": "literal",
+                "raw": "rejected"
+              },
+              "type": "say"
+            }
+          ],
+          "operand": {
+            "kind": "string_literal",
+            "value": "ok"
+          },
+          "operator": "==",
+          "subject": "r.verdict",
+          "type": "if"
+        }
+      ]
+    }
+  ]
+}
diff --git a/test-fixtures/golden-ast/expected/if-else.json b/test-fixtures/golden-ast/expected/if-else.json
new file mode 100644
index 00000000..ad01cb7a
--- /dev/null
+++ b/test-fixtures/golden-ast/expected/if-else.json
@@ -0,0 +1,47 @@
+{
+  "channels": [],
+  "exports": [],
+  "imports": [],
+  "rules": [],
+  "scripts": [],
+  "workflows": [
+    {
+      "comments": [],
+      "name": "default",
+      "params": [
+        "status"
+      ],
+      "steps": [
+        {
+          "body": [
+            {
+              "level": "log",
+              "message": {
+                "kind": "literal",
+                "raw": "healthy"
+              },
+              "type": "say"
+            }
+          ],
+          "elseBody": [
+            {
+              "level": "logerr",
+              "message": {
+                "kind": "literal",
+                "raw": "unhealthy: ${status}"
+              },
+              "type": "say"
+            }
+          ],
+          "operand": {
+            "kind": "string_literal",
+            "value": "ok"
+          },
+          "operator": "==",
+          "subject": "status",
+          "type": "if"
+        }
+      ]
+    }
+  ]
+}
diff --git a/test-fixtures/golden-ast/expected/imports.json b/test-fixtures/golden-ast/expected/imports.json
index b6143de6..de8dfae2 100644
--- a/test-fixtures/golden-ast/expected/imports.json
+++ b/test-fixtures/golden-ast/expected/imports.json
@@ -9,12 +9,6 @@
   ],
   "rules": [],
   "scripts": [],
-  "topLevelOrder": [
-    {
-      "index": 0,
-      "kind": "workflow"
-    }
-  ],
   "workflows": [
     {
       "comments": [],
@@ -22,16 +16,22 @@
       "params": [],
       "steps": [
         {
-          "type": "run",
-          "workflow": {
-            "value": "lib.setup"
-          }
+          "body": {
+            "callee": {
+              "value": "lib.setup"
+            },
+            "kind": "call"
+          },
+          "type": "exec"
         },
         {
-          "ref": {
-            "value": "lib.check"
+          "body": {
+            "callee": {
+              "value": "lib.check"
+            },
+            "kind": "ensure_call"
           },
-          "type": "ensure"
+          "type": "exec"
         }
       ]
     }
diff --git a/test-fixtures/golden-ast/expected/log.json b/test-fixtures/golden-ast/expected/log.json
index 6e7ead45..d62d4398 100644
--- a/test-fixtures/golden-ast/expected/log.json
+++ b/test-fixtures/golden-ast/expected/log.json
@@ -4,12 +4,6 @@
   "imports": [],
   "rules": [],
   "scripts": [],
-  "topLevelOrder": [
-    {
-      "index": 0,
-      "kind": "workflow"
-    }
-  ],
   "workflows": [
     {
       "comments": [],
@@ -17,16 +11,28 @@
       "params": [],
       "steps": [
         {
-          "message": "hello world",
-          "type": "log"
+          "level": "log",
+          "message": {
+            "kind": "literal",
+            "raw": "hello world"
+          },
+          "type": "say"
         },
         {
-          "message": "${USER} logged in",
-          "type": "log"
+          "level": "log",
+          "message": {
+            "kind": "literal",
+            "raw": "${USER} logged in"
+          },
+          "type": "say"
         },
         {
-          "message": "something went wrong",
-          "type": "logerr"
+          "level": "logerr",
+          "message": {
+            "kind": "literal",
+            "raw": "something went wrong"
+          },
+          "type": "say"
         }
       ]
     }
diff --git a/test-fixtures/golden-ast/expected/match-multiline.json b/test-fixtures/golden-ast/expected/match-multiline.json
index b8bdc32a..0fa46581 100644
--- a/test-fixtures/golden-ast/expected/match-multiline.json
+++ b/test-fixtures/golden-ast/expected/match-multiline.json
@@ -4,12 +4,6 @@
   "imports": [],
   "rules": [],
   "scripts": [],
-  "topLevelOrder": [
-    {
-      "index": 0,
-      "kind": "workflow"
-    }
-  ],
   "workflows": [
     {
       "comments": [],
@@ -20,12 +14,13 @@
           "name": "input",
           "type": "const",
           "value": {
-            "bashRhs": "\"hello\"",
-            "kind": "expr"
+            "kind": "literal",
+            "raw": "\"hello\""
           }
         },
         {
-          "managed": {
+          "type": "return",
+          "value": {
             "kind": "match",
             "match": {
               "arms": [
@@ -46,9 +41,7 @@
               ],
               "subject": "input"
             }
-          },
-          "type": "return",
-          "value": "__match__"
+          }
         }
       ]
     }
diff --git a/test-fixtures/golden-ast/expected/match.json b/test-fixtures/golden-ast/expected/match.json
index 7d9ee26e..24853eab 100644
--- a/test-fixtures/golden-ast/expected/match.json
+++ b/test-fixtures/golden-ast/expected/match.json
@@ -4,12 +4,6 @@
   "imports": [],
   "rules": [],
   "scripts": [],
-  "topLevelOrder": [
-    {
-      "index": 0,
-      "kind": "workflow"
-    }
-  ],
   "workflows": [
     {
       "comments": [],
@@ -20,12 +14,13 @@
           "name": "input",
           "type": "const",
           "value": {
-            "bashRhs": "\"hello\"",
-            "kind": "expr"
+            "kind": "literal",
+            "raw": "\"hello\""
           }
         },
         {
-          "managed": {
+          "type": "return",
+          "value": {
             "kind": "match",
             "match": {
               "arms": [
@@ -52,9 +47,7 @@
               ],
               "subject": "input"
             }
-          },
-          "type": "return",
-          "value": "__match__"
+          }
         }
       ]
     }
diff --git a/test-fixtures/golden-ast/expected/params.json b/test-fixtures/golden-ast/expected/params.json
index 30b00be5..fdf0457f 100644
--- a/test-fixtures/golden-ast/expected/params.json
+++ b/test-fixtures/golden-ast/expected/params.json
@@ -11,10 +11,13 @@
       ],
       "steps": [
         {
-          "type": "run",
-          "workflow": {
-            "value": "checker"
-          }
+          "body": {
+            "callee": {
+              "value": "checker"
+            },
+            "kind": "call"
+          },
+          "type": "exec"
         }
       ]
     }
@@ -22,25 +25,10 @@
   "scripts": [
     {
       "body": "echo ok",
-      "bodyKind": "backtick",
       "comments": [],
       "name": "checker"
     }
   ],
-  "topLevelOrder": [
-    {
-      "index": 0,
-      "kind": "workflow"
-    },
-    {
-      "index": 0,
-      "kind": "rule"
-    },
-    {
-      "index": 0,
-      "kind": "script"
-    }
-  ],
   "workflows": [
     {
       "comments": [],
@@ -51,8 +39,12 @@
       ],
       "steps": [
         {
-          "message": "${greeting}, ${name}!",
-          "type": "log"
+          "level": "log",
+          "message": {
+            "kind": "literal",
+            "raw": "${greeting}, ${name}!"
+          },
+          "type": "say"
         }
       ]
     }
diff --git a/test-fixtures/golden-ast/expected/prompt-capture.json b/test-fixtures/golden-ast/expected/prompt-capture.json
index f853797a..56a7c61a 100644
--- a/test-fixtures/golden-ast/expected/prompt-capture.json
+++ b/test-fixtures/golden-ast/expected/prompt-capture.json
@@ -4,12 +4,6 @@
   "imports": [],
   "rules": [],
   "scripts": [],
-  "topLevelOrder": [
-    {
-      "index": 0,
-      "kind": "workflow"
-    }
-  ],
   "workflows": [
     {
       "comments": [],
@@ -20,14 +14,17 @@
           "name": "answer",
           "type": "const",
           "value": {
-            "bodyKind": "string",
-            "kind": "prompt_capture",
+            "kind": "prompt",
             "raw": "\"What is your name?\""
           }
         },
         {
-          "message": "${answer}",
-          "type": "log"
+          "level": "log",
+          "message": {
+            "kind": "literal",
+            "raw": "${answer}"
+          },
+          "type": "say"
         }
       ]
     }
diff --git a/test-fixtures/golden-ast/expected/run-ensure.json b/test-fixtures/golden-ast/expected/run-ensure.json
index 0c450c19..7bf91647 100644
--- a/test-fixtures/golden-ast/expected/run-ensure.json
+++ b/test-fixtures/golden-ast/expected/run-ensure.json
@@ -9,10 +9,13 @@
       "params": [],
       "steps": [
         {
-          "type": "run",
-          "workflow": {
-            "value": "validator"
-          }
+          "body": {
+            "callee": {
+              "value": "validator"
+            },
+            "kind": "call"
+          },
+          "type": "exec"
         }
       ]
     }
@@ -20,29 +23,10 @@
   "scripts": [
     {
       "body": "true",
-      "bodyKind": "backtick",
       "comments": [],
       "name": "validator"
     }
   ],
-  "topLevelOrder": [
-    {
-      "index": 0,
-      "kind": "rule"
-    },
-    {
-      "index": 0,
-      "kind": "script"
-    },
-    {
-      "index": 0,
-      "kind": "workflow"
-    },
-    {
-      "index": 1,
-      "kind": "workflow"
-    }
-  ],
   "workflows": [
     {
       "comments": [],
@@ -50,16 +34,22 @@
       "params": [],
       "steps": [
         {
-          "ref": {
-            "value": "check"
+          "body": {
+            "callee": {
+              "value": "check"
+            },
+            "kind": "ensure_call"
           },
-          "type": "ensure"
+          "type": "exec"
         },
         {
-          "type": "run",
-          "workflow": {
-            "value": "helper"
-          }
+          "body": {
+            "callee": {
+              "value": "helper"
+            },
+            "kind": "call"
+          },
+          "type": "exec"
         }
       ]
     },
@@ -69,8 +59,12 @@
       "params": [],
       "steps": [
         {
-          "message": "helping",
-          "type": "log"
+          "level": "log",
+          "message": {
+            "kind": "literal",
+            "raw": "helping"
+          },
+          "type": "say"
         }
       ]
     }
diff --git a/test-fixtures/golden-ast/expected/script-defs.json b/test-fixtures/golden-ast/expected/script-defs.json
index b72757d1..dca2963f 100644
--- a/test-fixtures/golden-ast/expected/script-defs.json
+++ b/test-fixtures/golden-ast/expected/script-defs.json
@@ -6,41 +6,20 @@
   "scripts": [
     {
       "body": "echo hello",
-      "bodyKind": "backtick",
       "comments": [],
       "name": "greet"
     },
     {
       "body": "echo \"line 1\"\necho \"line 2\"",
-      "bodyKind": "fenced",
       "comments": [],
       "name": "multiline"
     },
     {
       "body": "echo \"Hello ${USER}\"\necho \"${PATH:-/usr/bin}\"",
-      "bodyKind": "fenced",
       "comments": [],
       "name": "with_shell_expansion"
     }
   ],
-  "topLevelOrder": [
-    {
-      "index": 0,
-      "kind": "script"
-    },
-    {
-      "index": 1,
-      "kind": "script"
-    },
-    {
-      "index": 2,
-      "kind": "script"
-    },
-    {
-      "index": 0,
-      "kind": "workflow"
-    }
-  ],
   "workflows": [
     {
       "comments": [],
@@ -48,16 +27,22 @@
       "params": [],
       "steps": [
         {
-          "type": "run",
-          "workflow": {
-            "value": "greet"
-          }
+          "body": {
+            "callee": {
+              "value": "greet"
+            },
+            "kind": "call"
+          },
+          "type": "exec"
         },
         {
-          "type": "run",
-          "workflow": {
-            "value": "multiline"
-          }
+          "body": {
+            "callee": {
+              "value": "multiline"
+            },
+            "kind": "call"
+          },
+          "type": "exec"
         }
       ]
     }
diff --git a/test-fixtures/golden-ast/fixtures/if-dot-subject.jh b/test-fixtures/golden-ast/fixtures/if-dot-subject.jh
new file mode 100644
index 00000000..d407acb0
--- /dev/null
+++ b/test-fixtures/golden-ast/fixtures/if-dot-subject.jh
@@ -0,0 +1,8 @@
+workflow default() {
+  const r = prompt "Classify" returns "{ verdict: string }"
+  if r.verdict == "ok" {
+    log "approved"
+  } else {
+    log "rejected"
+  }
+}
diff --git a/test-fixtures/golden-ast/fixtures/if-else.jh b/test-fixtures/golden-ast/fixtures/if-else.jh
new file mode 100644
index 00000000..68117c4e
--- /dev/null
+++ b/test-fixtures/golden-ast/fixtures/if-else.jh
@@ -0,0 +1,7 @@
+workflow default(status) {
+  if status == "ok" {
+    log "healthy"
+  } else {
+    logerr "unhealthy: ${status}"
+  }
+}
diff --git a/test-infra/compiler-test-runner.ts b/test-infra/compiler-test-runner.ts
index 7db6c0cd..8302b7fe 100644
--- a/test-infra/compiler-test-runner.ts
+++ b/test-infra/compiler-test-runner.ts
@@ -1,11 +1,10 @@
 import test from "node:test";
 import assert from "node:assert/strict";
-import { readFileSync, writeFileSync, mkdtempSync, rmSync, readdirSync, existsSync } from "node:fs";
+import { readFileSync, writeFileSync, mkdtempSync, rmSync, readdirSync } from "node:fs";
 import { join, resolve } from "node:path";
 import { tmpdir } from "node:os";
-import { parsejaiph } from "../src/parser";
+import { loadModuleGraph } from "../src/transpile/module-graph";
 import { validateReferences } from "../src/transpile/validate";
-import { resolveImportPath } from "../src/transpile/resolve";
 
 // --- txtar parser ---
 
@@ -119,13 +118,8 @@ function runTestCase(tc: TxtarTestCase): void {
 
     let caughtError: Error | undefined;
     try {
-      const ast = parsejaiph(readFileSync(entryPath, "utf8"), entryPath);
-      validateReferences(ast, {
-        resolveImportPath,
-        existsSync: (p: string) => existsSync(p),
-        readFile: (p: string) => readFileSync(p, "utf8"),
-        parse: parsejaiph,
-      });
+      const graph = loadModuleGraph(entryPath);
+      validateReferences(graph);
     } catch (err) {
       caughtError = err as Error;
     }
diff --git a/tools/embed-assets.js b/tools/embed-assets.js
new file mode 100644
index 00000000..e162501e
--- /dev/null
+++ b/tools/embed-assets.js
@@ -0,0 +1,65 @@
+#!/usr/bin/env node
+// Regenerates src/runtime/embedded-assets.ts from on-disk asset files so the
+// `jaiph` binary stays self-contained (no sibling files needed at runtime).
+// Also regenerates src/version.ts from package.json so `jaiph --version` has
+// a single source of truth (package.json) in both the tsc and bun --compile
+// build paths.
+//
+// Run automatically as the first step of `npm run build`. The generated files
+// are checked into git so a fresh checkout type-checks before the first build;
+// tests assert the encoded contents match the current sources, so a stale
+// checked-in copy fails CI rather than silently shipping outdated text.
+
+const { readFileSync, writeFileSync } = require("node:fs");
+const { join, resolve } = require("node:path");
+
+const ROOT = resolve(__dirname, "..");
+
+const ASSETS = [
+  { name: "OVERLAY_RUN_SH", path: "runtime/overlay-run.sh" },
+  { name: "JAIPH_SKILL_MD", path: "docs/jaiph-skill.md" },
+];
+
+const entries = ASSETS.map((asset) => {
+  const bytes = readFileSync(join(ROOT, asset.path));
+  return { ...asset, base64: bytes.toString("base64") };
+});
+
+const lines = [
+  "// AUTO-GENERATED by tools/embed-assets.js — do not edit by hand.",
+  "// Regenerated by `npm run build`. Sources:",
+  ...ASSETS.map((a) => `//   - ${a.path}`),
+  "//",
+  "// Base64-encoded so a bun --compile binary carries the bytes inside the",
+  "// executable; the embedded-assets test fails if these drift from disk.",
+  "",
+];
+
+for (const entry of entries) {
+  lines.push(`export const ${entry.name}_BASE64 =`);
+  lines.push(`  ${JSON.stringify(entry.base64)};`);
+  lines.push("");
+}
+
+lines.push(
+  "export function decodeEmbeddedAsset(base64: string): string {",
+  "  return Buffer.from(base64, \"base64\").toString(\"utf8\");",
+  "}",
+  "",
+);
+
+writeFileSync(join(ROOT, "src/runtime/embedded-assets.ts"), lines.join("\n"));
+
+const pkg = JSON.parse(readFileSync(join(ROOT, "package.json"), "utf8"));
+if (typeof pkg.version !== "string" || pkg.version.length === 0) {
+  throw new Error("embed-assets: package.json missing string version field");
+}
+const versionFile = [
+  "// AUTO-GENERATED by tools/embed-assets.js — do not edit by hand.",
+  "// Regenerated by `npm run build` from package.json's version field so the",
+  "// tsc and bun --compile builds both ship the same single-sourced literal.",
+  "",
+  `export const VERSION = ${JSON.stringify(pkg.version)};`,
+  "",
+].join("\n");
+writeFileSync(join(ROOT, "src/version.ts"), versionFile);