diff --git a/.dockerignore b/.dockerignore
index d39f81a13..38ce5cb2f 100644
--- a/.dockerignore
+++ b/.dockerignore
@@ -11,14 +11,15 @@
 **/*.deb
 
 build
+tests/build
+tests/fuzz/corpus
+tests/fuzz/corpus-config
+tests/fuzz/seed-corpus
 third-party/downloads
+third-party/riscv-arch-test/riscv-test-stats
 src/cartesi-jsonrpc-machine
 src/cartesi-hash-tree-hash
-
-doc/html
-doc/api.md
-doc/html/
-doc/xml/
+doc/
 
 .git
 .github
diff --git a/.gitattributes b/.gitattributes
index f77a34ea7..5fe573d75 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -1,2 +1,3 @@
 third-party/** linguist-vendored
 tests/** linguist-vendored
+doc/recipes/rootfs-docs.ext2 filter=lfs diff=lfs merge=lfs -text
diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index 10eb81674..8e91ac06b 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -685,9 +685,101 @@ jobs:
         run: |
           docker run --rm -t ${{ github.repository_owner }}/machine-emulator:sanitizer make sanitize=yes test-save-and-load test-machine test-lua test-jsonrpc test-c-api test-c-api-remote test-c-jsonrpc-api test-coverage-machine test-uarch-rv64ui test-uarch-interpreter test-coverage-uarch
 
+  docs:
+    name: Docs
+    needs: build
+    runs-on: ubuntu-latest-8-cores
+    steps:
+      - name: Checkout machine emulator source code
+        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2
+        with:
+          submodules: recursive
+          lfs: true
+
+      - name: Setup variables
+        run: echo MACHINE_EMULATOR_VERSION=`make version` >> $GITHUB_ENV
+
+      - name: Install e2tools
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y --no-install-recommends e2tools
+
+      - name: Check rootfs-docs.ext2 is up to date
+        run: make -C doc check-rootfs-docs
+
+      - name: Ensure doc/recipes/rootfs-docs.licenses.md is tracked
+        run: |
+          if ! git ls-files --error-unmatch doc/recipes/rootfs-docs.licenses.md >/dev/null 2>&1; then
+            echo "::error::doc/recipes/rootfs-docs.licenses.md is not tracked in git. The sync check requires a committed baseline to diff against. Generate it with 'make -C doc build-rootfs-docs-license' and commit the result."
+            exit 1
+          fi
+
+      - name: Build rootfs-docs license report
+        run: make -C doc build-rootfs-docs-license
+
+      - name: Check rootfs-docs.licenses.md matches committed version
+        run: |
+          if git diff --quiet doc/recipes/rootfs-docs.licenses.md; then
+            exit 0
+          fi
+          git --no-pager diff doc/recipes/rootfs-docs.licenses.md
+          echo "::error::doc/recipes/rootfs-docs.licenses.md is out of sync with the generator. The diff above is what 'make -C doc build-rootfs-docs-license' produces vs the committed file. Check if changes were intended and, if so, regenerate locally and commit the result."
+          exit 1
+
+      - name: Login to Docker Hub
+        uses: docker/login-action@4907a6ddec9925e35a0a9e82d7399ccc52663121 # v4.1.0
+        with:
+          username: ${{ secrets.DOCKER_USERNAME }}
+          password: ${{ secrets.DOCKER_PASSWORD }}
+
+      - name: Login to GitHub Container Registry
+        uses: docker/login-action@4907a6ddec9925e35a0a9e82d7399ccc52663121 # v4.1.0
+        with:
+          registry: ghcr.io
+          username: ${{ github.actor }}
+          password: ${{ secrets.GITHUB_TOKEN }}
+
+      - name: Set up Depot CLI
+        uses: depot/setup-action@15c09a5f77a0840ad4bce955686522a257853461 # v1.7.1
+
+      - name: Build machine-emulator docker image
+        uses: depot/build-push-action@5f3b3c2e5a00f0093de47f657aeaefcedff27d18 # v1.17.0
+        with:
+          file: Dockerfile
+          context: .
+          platforms: linux/amd64
+          tags: cartesi/machine-emulator:devel
+          push: false
+          load: true
+          build-args: |
+            DEBUG=${{ (startsWith(github.ref, 'refs/tags/v') && 'no' || 'yes') }}
+            GIT_COMMIT=${{ github.sha }}
+            MACHINE_EMULATOR_VERSION=${{ env.MACHINE_EMULATOR_VERSION }}
+          project: ${{ vars.DEPOT_PROJECT }}
+          token: ${{ secrets.DEPOT_TOKEN }}
+
+      - name: Ensure doc/README.md is tracked
+        run: |
+          if ! git ls-files --error-unmatch doc/README.md >/dev/null 2>&1; then
+            echo "::error::doc/README.md is not tracked in git. The sync check requires a committed baseline to diff against. Generate it with 'make -C doc README.md' and commit the result."
+            exit 1
+          fi
+
+      - name: Build documentation
+        run: make -C doc README.md
+
+      - name: Check README.md matches committed version
+        run: |
+          if git diff --quiet doc/README.md; then
+            exit 0
+          fi
+          git --no-pager diff doc/README.md
+          echo "::error::doc/README.md is out of sync with the generator. The diff above is what 'make -C doc README.md' produces vs the committed file. Check if changes were intended and, if so, regenerate locally and commit the result."
+          exit 1
+
   publish_artifacts:
     name: Publish artifacts
-    needs: [build, lint, coverage, sanitize, test_amd64, test_arm64, risc0]
+    needs: [build, lint, coverage, sanitize, test_amd64, test_arm64, risc0, docs]
     runs-on: ubuntu-latest
     steps:
       - name: Checkout emulator source code
@@ -862,7 +954,7 @@ jobs:
 
       - name: Install rzup
         run: |
-          cargo install --git https://github.com/risc0/risc0 rzup
+          cargo install --locked --git https://github.com/risc0/risc0 rzup
           rzup install cargo-risczero 3.0.5
           rzup install r0vm 3.0.5
           rzup install cpp 2024.1.5
diff --git a/.gitignore b/.gitignore
index e377ade0d..202e01405 100644
--- a/.gitignore
+++ b/.gitignore
@@ -18,10 +18,8 @@ src/cartesi-jsonrpc-machine
 src/cartesi-hash-tree-hash
 src/tests/test-machine-c-api
 
-doc/html
-doc/api.md
-doc/html/
-doc/xml/
+doc/doxygen/html
+doc/recipes/cache
 
 .clangd
 .venv
diff --git a/CHANGELOG.md b/CHANGELOG.md
index b01d548f3..a3f1bf836 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -6,16 +6,30 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 
 ## [Unreleased]
 ## Added
-- Added `--nvram` command line option and `nvram_configs` machine configuration for UIO-backed memory ranges, exposed to the guest via `generic-uio`
-- Added `label` field to flash drive and nvram configurations, propagated to the guest through DTB properties
-- Added optional directory argument to `--dump-memory-ranges` to support read-only install locations
+- Added a user manual under `doc/`, generated from a template by a docgen pipeline that executes and verifies every code snippet against the locally built emulator
+- Added `--nvram` command line option and `nvram` machine configuration for UIO-backed memory ranges, exposed to the guest as `/dev/uio*` via `generic-uio`
+- Added a `label` field to memory range configurations, exposed to the guest through a standard DTB `/aliases` node (`flashdriveN`, `nvramN`, and any user label)
+- Added recording of a revert root hash as a logged input of `send_cmio_response`, with `read_revert_root_hash`/`write_revert_root_hash` accessors across all API layers
+- Added reversion to the recorded revert root hash for rollup inputs that end rejected, when logging steps, logging uarch resets, verifying, and collecting root hashes
+- Added emission of per-output proofs from `--cmio-advance-state`
+- Added an optional user schema dictionary argument to `cartesi.tojson`/`cartesi.fromjson` to name binary and compound fields of caller-defined message types
+- Added a `cartesi.hash-tree` Lua module for hash-tree slice/splice verification and building the output-hashes frontier behind the output proofs
+- Added `get_address_name` to resolve a physical address to a descriptive name, across the C, Lua, and JSON-RPC APIs
+- Added the ability for `--initial-hash` and `--final-hash` to write the hash to a file
+- Added an optional directory argument to `--dump-memory-ranges` to support read-only install locations
 - Added decoding of RISC-V Zcb compressed instructions (required by kernels built with GCC 14)
 - Added fallback to `read_reg` in the GDB stub so `monitor reg <name>` works for any named register
-- Added `CM_FLASH_DRIVE_MAX`, `CM_NVRAM_MAX`, and `CM_MEMORY_RANGE_LABEL_MAX` constants to the public C API
+- Added `--bash-completion` to print a bash completion script for `cartesi-machine`
+- Added public C API constants `CM_FLASH_DRIVE_MAX`, `CM_NVRAM_MAX`, `CM_MEMORY_RANGE_LABEL_MAX`, `CM_RTC_FREQ_DIV`, and `CM_CMIO_LOG2_MAX_OUTPUT_COUNT`
+- Added the peripheral `CM_AR_*` address range constants, the `CM_PMA_*_DID` driver id constants, the HTIF device, command, shift, and mask constants, and the `CM_DTB_BOOTARGS_*` macros to the public C API
 - Added LuaCov-based coverage tracking for Lua code, integrated with the gcov report pipeline
+- Added a JSON-RPC C API coverage suite and converted `test-cm-cli` and `test-evmu` to the lester spec format
 - Added `spec-cm-cli.lua` covering every command-line option of `cartesi-machine.lua`
 
 ## Fixed
+- Fixed leaf size in `cartesi-hash-tree-hash`, which was 8 instead of 32
+- Fixed read-only flash drives not being mounted with `-o ro`, which trapped guest writes and panicked init
+- Fixed missing `#address-cells` on the per-CPU `interrupt-controller` node in the DTB, silencing a `dtc` interrupt-provider lint warning
 - Fixed firmware reserved region in the DTB being too small for OpenSBI built with GCC 14
 - Fixed missing validation of memory range labels and of `replace_memory_range` arguments
 - Fixed boolean merging in `merge_memory_range_opts` so options can be explicitly overridden to `false`
@@ -23,15 +37,32 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 - Fixed `dump_pmas()` still calling the removed `get_memory_ranges()` method
 - Fixed unanchored patterns matching `--quiet` and `--assert-rolling-template`
 - Fixed `help()` internally calling `os.exit()`
+- Fixed a typo in the `cartesi-machine.lua` cmio handling
 
 ## Changed
-- Renamed `--dump-memory-ranges` to `--dump-address-ranges` for consistency with `get_address_ranges()`
+- Renamed the yield constants in `cm.h` and the Lua API from `CM_CMIO_YIELD_*` to `CM_HTIF_YIELD_*` (and the command suffix from `COMMAND` to `CMD`)
+- Renamed the PMA "device id" to "driver id" across the public API (`CM_PMA_*_DID` constants, `driver_id` in `get_address_ranges`)
+- Changed `get_address_ranges` to report per-range attributes (`is_memory`, `is_device`, `is_readable`, `is_writeable`, `is_executable`, `is_read_idempotent`, `is_write_idempotent`, and `driver_id`)
+- Replaced the `--store-json-config`/`--load-json-config` options with a `format:<lua|json>` sub-option on `--store-config`/`--load-config`, defaulting to the format inferred from the filename extension
+- Changed `--initial-proof`/`--final-proof` to default to Lua tables and accept `format:<lua|json>` and `label:` sub-options, where before they were dumped only as JSON
+- Reworked command-line option parsing so compound options such as `--volume` and `--port-forward` take `key:value` sub-options, and short options take a space-separated value (`-u <name>` instead of `-u=<name>`)
+- Changed memory ranges with an unset start to be placed past the end of RAM, rounded up to a power of two and aligned to their length, with flash drives and nvrams drawn from a shared pool
+- Changed `log_send_cmio_response` and `verify_send_cmio_response` to treat invalid responses and advance-state responses delivered outside an rx-accepted manual yield as no-ops, while the live `send_cmio_response` still rejects them as errors
+- Changed the uarch state-access layer to align misaligned accesses down to their natural size instead of rejecting them
+- Changed JSON-RPC error logs to omit the Boost `source_location` suffix at non-debug levels
 - Renamed all C++ headers from `.h` to `.hpp`, and renamed `machine-c-api.{h,cpp}` to `cm.{h,cpp}`
-- Bumped machine configuration archive version from 6 to 7 (for the new `nvram_configs` and `label` fields)
+- Bumped machine configuration archive version from 6 to 7 (for the new `nvram` and `label` fields)
 - Moved the `/run/cartesi/memoryranges/` sysfs setup from the DTB init script into `cartesi-init`
 - Updated guest bootargs to bind `uio_pdrv_genirq` to generic-uio nodes
 - Bumped test `linux.bin` and `rootfs.ext2` images
 
+## Removed
+- Removed the `--store-json-config` and `--load-json-config` options (folded into the `format:` sub-option of `--store-config`/`--load-config`)
+- Removed the `--replace-flash-drive` option, subsumed by `--replace-memory-range`
+- Removed `CM_ERROR_REGEX_ERROR` (covered by `CM_ERROR_RUNTIME_ERROR`) and `CM_ERROR_SYSTEM_ERROR`, and renumbered the error enum
+- Removed `machine_reg_get_name` in favor of `get_address_name`
+- Removed `mark_dirty_page` from the uarch and state-access interfaces
+
 ## [0.20.0] - 2026-04-09
 ## Added
 - Added RISC0 zkVM integration for fraud proof verification, with C++, Rust, and Solidity implementations
diff --git a/Dockerfile b/Dockerfile
index 10cdd977a..bfb90eab0 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -1,4 +1,7 @@
-FROM debian:trixie-20250811 AS toolchain
+ARG BUILD_BASE=debian:trixie-20250811
+ARG RUNTIME_BASE=debian:trixie-20250811-slim
+
+FROM $BUILD_BASE AS toolchain
 
 RUN apt-get update && \
     DEBIAN_FRONTEND=noninteractive apt-get install --no-install-recommends -y \
@@ -56,15 +59,24 @@ FROM builder AS debian-packager
 RUN make install-uarch debian-package DESTDIR=$PWD/_install
 
 ####################################################################################################
-FROM debian:trixie-20250811-slim
+FROM $RUNTIME_BASE
 ARG TARGETARCH
+ARG RUNTIME_BASE
+LABEL io.cartesi.machine-emulator.base-image="$RUNTIME_BASE"
 
 COPY --from=debian-packager /usr/src/emulator/machine-emulator_${TARGETARCH}.deb machine-emulator.deb
+COPY tests/dependencies tests/dependencies.sha256 /usr/share/cartesi-machine/
 
 RUN apt-get update && \
-    apt-get install -y ./machine-emulator.deb && \
+    apt-get install -y gosu ./machine-emulator.deb && \
     rm -rf /var/lib/apt/lists/* /var/cache/apt/* machine-emulator.deb
 
+# Carried but dormant (no ENTRYPOINT set here, so production behavior is
+# unchanged): lets a derived dev image (e.g. doc/) opt into running as the host
+# user by pointing ENTRYPOINT at this script. Needs gosu, installed above.
+COPY tools/docker-entrypoint.sh /usr/local/bin/entrypoint.sh
+RUN chmod +x /usr/local/bin/entrypoint.sh
+
 RUN groupadd --system --gid 102 cartesi && \
     useradd --system --uid 102 --gid 102 --no-create-home --home /nonexistent --comment "cartesi user" --shell /bin/false cartesi
 
diff --git a/Makefile b/Makefile
index 389b5e91c..b19b4fe65 100644
--- a/Makefile
+++ b/Makefile
@@ -77,7 +77,7 @@ EMU_TO_BIN= src/cartesi-jsonrpc-machine src/cartesi-hash-tree-hash
 EMU_TO_LIB= src/$(LIBCARTESI_SO) src/$(LIBCARTESI_SO_JSONRPC)
 EMU_TO_LIB_A= src/libcartesi.a src/libcartesi_jsonrpc.a src/libluacartesi.a src/libluacartesi_jsonrpc.a
 EMU_LUA_TO_BIN= src/cartesi-machine.lua src/cartesi-machine-stored-hash.lua
-EMU_TO_LUA_PATH= src/cartesi/util.lua src/cartesi/gdbstub.lua src/cartesi/evmu.lua
+EMU_TO_LUA_PATH= src/cartesi/util.lua src/cartesi/gdbstub.lua src/cartesi/evmu.lua src/cartesi/bash.lua src/cartesi/hash-tree.lua
 EMU_TO_LUA_THIRD_PARTY_PATH= src/cartesi/third-party/bint.lua
 EMU_TO_LUA_CPATH= src/cartesi.so
 EMU_TO_LUA_CARTESI_CPATH= src/cartesi/jsonrpc.so
@@ -105,6 +105,12 @@ export UARCH_DEFS
 TAG ?= devel
 DEBIAN_IMG ?= cartesi/machine-emulator:$(TAG).deb
 
+# Base images for the emulator Dockerfile. Single source of truth: passed as
+# build-args and stamped into the image as a label so downstream images (e.g.
+# doc/) can reuse the exact same base without duplicating these values.
+BUILD_BASE ?= debian:trixie-20250811
+RUNTIME_BASE ?= debian:trixie-20250811-slim
+
 # Docker image platform
 BUILD_PLATFORM ?=
 
@@ -247,11 +253,14 @@ test% coverage% build-tests%:
 
 build-tests-misc-with-builder-image: build-emulator-builder-image
 
-lint check-format format check-format-lua check-lua format-lua:
+lint check-format format:
 	@$(MAKE) $@-src $@-tests
 
+check-format-lua check-lua format-lua:
+	@$(MAKE) $@-src $@-tests $@-doc
+
 lint-% check-format-% format-% check-format-lua-% check-lua-% format-lua-%:
-	@eval $$($(MAKE) -s --no-print-directory env); $(MAKE) -C $(if $(findstring -src,$@),src,tests) $(subst -src,,$(subst -tests,,$@))
+	@eval $$($(MAKE) -s --no-print-directory env); $(MAKE) -C $(if $(findstring -doc,$@),doc,$(if $(findstring -src,$@),src,tests)) $(subst -doc,,$(subst -src,,$(subst -tests,,$@)))
 
 source-default:
 	@eval $$($(MAKE) -s --no-print-directory env); $(MAKE) -C $(SRCDIR)
@@ -269,13 +278,13 @@ $(SRCDIR)/interpret-jump-table.hpp:
 	@eval $$($(MAKE) -s --no-print-directory env); $(MAKE) -C $(SRCDIR) interpret-jump-table.hpp
 
 build-emulator-builder-image:
-	docker build $(DOCKER_PLATFORM) --build-arg DEBUG=$(debug) --build-arg COVERAGE=$(coverage) --build-arg THREADS=$(threads) --build-arg SANITIZE=$(sanitize) --target builder -t cartesi/machine-emulator:builder -f Dockerfile .
+	docker build $(DOCKER_PLATFORM) --build-arg DEBUG=$(debug) --build-arg COVERAGE=$(coverage) --build-arg THREADS=$(threads) --build-arg SANITIZE=$(sanitize) --build-arg BUILD_BASE=$(BUILD_BASE) --target builder -t cartesi/machine-emulator:builder -f Dockerfile .
 
 build-emulator-toolchain-image build-toolchain:
-	docker build $(DOCKER_PLATFORM) --target toolchain -t cartesi/machine-emulator:toolchain -f Dockerfile .
+	docker build $(DOCKER_PLATFORM) --build-arg BUILD_BASE=$(BUILD_BASE) --target toolchain -t cartesi/machine-emulator:toolchain -f Dockerfile .
 
 build-emulator-image:
-	docker build $(DOCKER_PLATFORM) --build-arg DEBUG=$(debug) --build-arg COVERAGE=$(coverage) --build-arg THREADS=$(threads) --build-arg SANITIZE=$(sanitize) -t cartesi/machine-emulator:$(TAG) -f Dockerfile .
+	docker build $(DOCKER_PLATFORM) --build-arg DEBUG=$(debug) --build-arg COVERAGE=$(coverage) --build-arg THREADS=$(threads) --build-arg SANITIZE=$(sanitize) --build-arg BUILD_BASE=$(BUILD_BASE) --build-arg RUNTIME_BASE=$(RUNTIME_BASE) -t cartesi/machine-emulator:$(TAG) -f Dockerfile .
 
 build-emulator-tests-image: build-emulator-builder-image build-emulator-image
 	docker build $(DOCKER_PLATFORM) --build-arg DEBUG=$(debug) --build-arg COVERAGE=$(coverage) --build-arg THREADS=$(threads) --build-arg SANITIZE=$(sanitize) --build-arg TAG=$(TAG) -t cartesi/machine-emulator:tests -f tests/Dockerfile .
@@ -284,7 +293,7 @@ build-emulator-tests-builder-image: build-emulator-builder-image
 	docker build $(DOCKER_PLATFORM) --target tests-builder --build-arg DEBUG=$(debug) --build-arg COVERAGE=$(coverage) --build-arg THREADS=$(threads) --build-arg SANITIZE=$(sanitize) --build-arg TAG=$(TAG) -t cartesi/machine-emulator:tests-builder -f tests/Dockerfile .
 
 build-debian-package:
-	docker build $(DOCKER_PLATFORM) --target debian-packager --build-arg DEBUG=$(debug) --build-arg COVERAGE=$(coverage) --build-arg THREADS=$(threads) --build-arg SANITIZE=$(sanitize) -t $(DEBIAN_IMG) -f Dockerfile .
+	docker build $(DOCKER_PLATFORM) --target debian-packager --build-arg DEBUG=$(debug) --build-arg COVERAGE=$(coverage) --build-arg THREADS=$(threads) --build-arg SANITIZE=$(sanitize) --build-arg BUILD_BASE=$(BUILD_BASE) -t $(DEBIAN_IMG) -f Dockerfile .
 
 build-tests-debian-packages: build-emulator-builder-image
 	docker build $(DOCKER_PLATFORM) --target tests-debian-packager --build-arg TAG=$(TAG) -t cartesi/machine-emulator:tests-debian-packager -f tests/Dockerfile .
diff --git a/doc/.dockerignore b/doc/.dockerignore
new file mode 100644
index 000000000..ed6d64661
--- /dev/null
+++ b/doc/.dockerignore
@@ -0,0 +1,6 @@
+Makefile
+README.md.template
+doxygen
+recipes/cache
+recipes/*.ext2
+!recipes/rootfs-docs.ext2
diff --git a/doc/.gitignore b/doc/.gitignore
new file mode 100644
index 000000000..a2e2df65c
--- /dev/null
+++ b/doc/.gitignore
@@ -0,0 +1,2 @@
+recipes/rootfs-docs.inputs.sha256
+recipes/rootfs-docs.inputs.sha256-have
diff --git a/doc/.luacheckrc b/doc/.luacheckrc
new file mode 100644
index 000000000..1d2477882
--- /dev/null
+++ b/doc/.luacheckrc
@@ -0,0 +1,16 @@
+-- alerts.lua and replace.lua are pandoc Lua filters: pandoc runs them inside
+-- its own interpreter, which injects the `pandoc` module along with the
+-- FORMAT and PANDOC_SCRIPT_FILE globals, and invokes the filter callbacks
+-- (Div, Pandoc) that the filter defines at the top level. Declare that
+-- environment so luacheck does not report the pandoc API as undefined or
+-- non-standard globals.
+--
+-- The recipe scripts under recipes/ are ordinary lua5.4 programs and are left
+-- under luacheck's default configuration, so genuine stray globals there are
+-- still caught.
+local pandoc_filter = {
+    read_globals = { "FORMAT", "PANDOC_SCRIPT_FILE", "pandoc" },
+    globals = { "Div", "Pandoc" },
+}
+files["alerts.lua"] = pandoc_filter
+files["replace.lua"] = pandoc_filter
diff --git a/doc/Dockerfile b/doc/Dockerfile
new file mode 100644
index 000000000..4b4eb1955
--- /dev/null
+++ b/doc/Dockerfile
@@ -0,0 +1,76 @@
+ARG TAG=0.20.0
+ARG GUEST_TOOLS_VERSION=v0.18.0-test4
+ARG GENEXT2FS_VERSION=v1.5.6
+# Base for the host-tool builder stages below. These stages compile binaries
+# that are copied into the final emulator-based image, so the base must stay
+# ABI-compatible with cartesi/machine-emulator:$TAG. It deliberately does NOT
+# reference $TAG, so bumping the emulator image reuses the builders' cache.
+# The Makefile overrides this with the emulator image's own base, read from its
+# io.cartesi.machine-emulator.base-image label, so it tracks automatically if
+# the emulator rebases.
+ARG BUILDER_BASE=debian:trixie-20250811-slim
+
+FROM $BUILDER_BASE AS hex-builder
+ARG GUEST_TOOLS_VERSION
+USER root
+RUN apt-get update && \
+    DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends g++ wget ca-certificates && \
+    wget -qO- https://github.com/cartesi/machine-guest-tools/archive/refs/tags/$GUEST_TOOLS_VERSION.tar.gz \
+        | tar -xz -C /tmp --wildcards --strip-components=3 '*/sys-utils/hex/hex.cpp' && \
+    g++ -O2 -o /usr/local/bin/hex /tmp/hex.cpp
+
+FROM $BUILDER_BASE AS xgenext2fs-builder
+ARG GENEXT2FS_VERSION
+USER root
+RUN apt-get update && \
+    DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
+        automake autotools-dev build-essential libarchive-dev wget ca-certificates && \
+    wget -qO- https://github.com/cartesi/genext2fs/archive/refs/tags/$GENEXT2FS_VERSION.tar.gz \
+        | tar -xz -C /tmp && \
+    cd /tmp/genext2fs-* && \
+    ./autogen.sh && \
+    ./configure --enable-libarchive --prefix=/usr/local && \
+    make -j"$(nproc)" install
+
+FROM cartesi/machine-emulator:$TAG
+
+USER root
+
+RUN apt-get update && \
+    DEBIAN_FRONTEND=noninteractive apt-get install -y \
+        make pandoc \
+        bash-completion bc devio device-tree-compiler e2tools file graphviz jq libarchive13 lua-dkjson lua-socket net-tools wget && \
+    rm -rf /var/lib/apt/lists/*
+
+# Snapshot cartesi-machine's bash completion into the canonical dir, then enable
+# the framework loader by uncommenting the block Debian ships (disabled) in
+# /etc/bash.bashrc. The package's /etc/profile.d snippet only covers login
+# shells; the playground runs a non-login shell, which reads only bash.bashrc.
+# With the loader active, the file lazy-loads on first `cartesi-machine <TAB>`.
+RUN cartesi-machine --bash-completion > /usr/share/bash-completion/completions/cartesi-machine && \
+    sed -i '/^#if ! shopt -oq posix; then/,/^#fi$/ s/^#//' /etc/bash.bashrc
+
+COPY --from=hex-builder /usr/local/bin/hex /usr/local/bin/hex
+COPY --from=xgenext2fs-builder /usr/local/bin/xgenext2fs /usr/local/bin/xgenext2fs
+
+RUN mkdir -p /tmp/cartesi-images/build/images && \
+    cd /usr/share/cartesi-machine && \
+    wget -nc -i dependencies -P /tmp/cartesi-images/build/images && \
+    cd /tmp/cartesi-images && \
+    cp /usr/share/cartesi-machine/dependencies.sha256 . && \
+    sha256sum --check dependencies.sha256 && \
+    cd /usr/share/cartesi-machine/images && \
+    mv /tmp/cartesi-images/build/images/linux-*.bin . && \
+    ln -s "$(ls linux-*.bin)" linux.bin && \
+    rm -rf /tmp/cartesi-images
+
+COPY recipes/rootfs-docs.ext2 /usr/share/cartesi-machine/images/rootfs-docs.ext2
+RUN ln -s rootfs-docs.ext2 /usr/share/cartesi-machine/images/rootfs.ext2
+
+ENV DEV_ENV_HAS_DOCGEN=yes
+ENV PATH=/work/recipes:${PATH}
+
+# Run as the host user: the entrypoint (carried dormant by the emulator image)
+# reads the USER/UID/GID/GROUP env that run-docs-image / docs-image-exec pass
+# and gosu-drops to it, so files written under /work are owned by the host user.
+ENTRYPOINT ["/usr/local/bin/entrypoint.sh"]
diff --git a/doc/Makefile b/doc/Makefile
new file mode 100644
index 000000000..778bbaecb
--- /dev/null
+++ b/doc/Makefile
@@ -0,0 +1,236 @@
+# Docker image tag — must match the tag used by the root Makefile's
+# build-emulator-image target so the docs image layers on top of an
+# emulator built from the local source (kernel/rootfs images in
+# tests/dependencies are built against the unreleased branch and may
+# require emulator features not in any released base image).
+TAG ?= devel
+
+DOCS_IMAGE = cartesi/machine-emulator-docs
+
+# Docker image platform
+BUILD_PLATFORM ?=
+
+ifneq ($(BUILD_PLATFORM),)
+DOCKER_PLATFORM=--platform $(BUILD_PLATFORM)
+endif
+
+DEV_ENV_HAS_DOCGEN ?= no
+RECIPES_DIR ?= $(CURDIR)/recipes
+REPLACE_CACHE_DIR := $(RECIPES_DIR)/cache
+export RECIPES_DIR REPLACE_CACHE_DIR
+export LUA_PATH := $(CURDIR)/?.lua;$(RECIPES_DIR)/?.lua;$(LUA_PATH);;
+
+STYLUA=stylua
+STYLUA_FLAGS=--indent-type Spaces --respect-ignores
+
+.PHONY: build-docs-image check-docs-image docs-image-exec run-docs-image clean format-lua check-format-lua check-lua
+.DELETE_ON_ERROR:
+
+# Lua linting/formatting for the recipe snippets and pandoc filters. The
+# generated cache (REPLACE_CACHE_DIR) holds extracted block bodies that are
+# rewritten on every render, so it is excluded from both tools.
+format-lua:
+	@$(STYLUA) $(STYLUA_FLAGS) .
+
+check-format-lua:
+	@$(STYLUA) $(STYLUA_FLAGS) --check .
+
+check-lua:
+	luacheck . --exclude-files '$(REPLACE_CACHE_DIR)/**'
+
+ROOTFS_DOCS_INPUTS := \
+    $(RECIPES_DIR)/Dockerfile.rootfs-docs \
+    $(RECIPES_DIR)/build-rootfs-docs.sh \
+    $(RECIPES_DIR)/puppet.c \
+    $(wildcard $(RECIPES_DIR)/hello/*)
+
+ROOTFS_DOCS_EXT2 := $(RECIPES_DIR)/rootfs-docs.ext2
+ROOTFS_DOCS_KEY := $(RECIPES_DIR)/rootfs-docs.inputs.sha256
+
+# Fingerprint of the recipe inputs. Generated and gitignored, embedded into the
+# image at build time and re-derived here to spot a stale committed image
+# without rebuilding. Both sides use the same input list so they cannot drift.
+$(ROOTFS_DOCS_KEY): $(ROOTFS_DOCS_INPUTS)
+	cat $(sort $(ROOTFS_DOCS_INPUTS)) | sha256sum | head -c 64 > $@
+
+# Build the image. build-rootfs-docs.sh embeds $(ROOTFS_DOCS_KEY) into it.
+$(ROOTFS_DOCS_EXT2): $(ROOTFS_DOCS_INPUTS) $(ROOTFS_DOCS_KEY)
+	cd $(RECIPES_DIR) && ./build-rootfs-docs.sh
+
+# Convenience alias, since the real target is an absolute path.
+.PHONY: build-rootfs-docs
+build-rootfs-docs: $(ROOTFS_DOCS_EXT2)
+
+# Verify the committed image matches the current recipe inputs. No rebuild and no
+# network, so CI runs it after a git lfs pull. A missing or stale image is a hard
+# error. e2cp copies the embedded fingerprint out under a -have suffix to compare
+# against the freshly derived one.
+.PHONY: check-rootfs-docs
+check-rootfs-docs: $(ROOTFS_DOCS_KEY)
+	@test -s $(ROOTFS_DOCS_EXT2) || { \
+	    echo "ERROR: rootfs-docs.ext2 missing, run 'git lfs pull'"; exit 1; }
+	@e2cp $(ROOTFS_DOCS_EXT2):/var/log/rootfs-docs.inputs.sha256 $(ROOTFS_DOCS_KEY)-have
+	@cmp -s $(ROOTFS_DOCS_KEY) $(ROOTFS_DOCS_KEY)-have || { \
+	    echo "ERROR: rootfs-docs.ext2 is stale (recipe inputs changed)."; \
+	    echo "Run 'make -C doc build-rootfs-docs' and commit it."; \
+	    exit 1; \
+	}
+
+ROOTFS_DOCS_LICENSES := $(RECIPES_DIR)/rootfs-docs.licenses.md
+
+# Package and license report for the committed image. It is derived from the
+# ext2 itself rather than from a rebuild, and committed alongside it so a
+# checkout carries the license information with the binary. Like the targets
+# above, freshness is judged by content rather than timestamps, so this always
+# regenerates the report. CI then diffs it against the committed version, as
+# it does for README.md.
+.PHONY: build-rootfs-docs-license
+build-rootfs-docs-license: | ensure-rootfs-docs
+	cd $(RECIPES_DIR) && ./build-rootfs-docs-license.sh > $(ROOTFS_DOCS_LICENSES)
+
+# Local convenience used before the docs image is built. Fetch the image from
+# LFS if absent or still an unsmudged pointer, rebuild it locally if the embedded
+# fingerprint no longer matches the recipe inputs.
+.PHONY: ensure-rootfs-docs
+ensure-rootfs-docs:
+	@if [ ! -s $(ROOTFS_DOCS_EXT2) ] || \
+	    git lfs pointer --check --file $(ROOTFS_DOCS_EXT2) >/dev/null 2>&1; then \
+	    echo "rootfs-docs.ext2 not present, fetching from git lfs..."; \
+	    git lfs pull --include "$$(git ls-files --full-name -- $(ROOTFS_DOCS_EXT2))" || true; \
+	fi
+	@if $(MAKE) -s check-rootfs-docs >/dev/null 2>&1; then \
+	    echo "rootfs-docs.ext2 is up to date."; \
+	else \
+	    echo "rootfs-docs.ext2 missing or stale, rebuilding locally..."; \
+	    rm -f $(ROOTFS_DOCS_EXT2); \
+	    $(MAKE) $(ROOTFS_DOCS_EXT2); \
+	fi
+
+check-docs-image:
+	@if docker image inspect $(DOCS_IMAGE):$(TAG) >/dev/null 2>&1; then \
+		echo "Docker image $(DOCS_IMAGE):$(TAG) exists"; \
+	else \
+		echo "Docker image $(DOCS_IMAGE):$(TAG) does not exist. Creating:"; \
+		$(MAKE) build-docs-image; \
+	fi
+
+docs-image-exec: check-docs-image
+	docker run --hostname playground --rm \
+		-e USER=$$(id -u -n) \
+		-e GROUP=$$(id -g -n) \
+		-e UID=$$(id -u) \
+		-e GID=$$(id -g) \
+		-v $(CURDIR):/work \
+		-w /work \
+		$(DOCS_IMAGE):$(TAG) /bin/bash -c "$(CONTAINER_COMMAND)"
+
+run-docs-image: check-docs-image
+	docker run \
+		--rm \
+		-it \
+		--name playground \
+		--hostname playground \
+		-e USER=$$(id -u -n) \
+		-e UID=$$(id -u) \
+		-e GROUP=$$(id -g -n) \
+		-e GID=$$(id -g) \
+		-v $(CURDIR):/work \
+		-w /work \
+		$(DOCS_IMAGE):$(TAG) \
+		/bin/bash
+
+build-docs-image: | ensure-rootfs-docs
+	@if docker image inspect cartesi/machine-emulator:$(TAG) >/dev/null 2>&1; then \
+		echo "Docker image cartesi/machine-emulator:$(TAG) exists, reusing"; \
+	else \
+		$(MAKE) -C .. build-emulator-image TAG=$(TAG); \
+	fi
+	base=$$(docker image inspect --format '{{ index .Config.Labels "io.cartesi.machine-emulator.base-image" }}' cartesi/machine-emulator:$(TAG)); \
+	docker build $(DOCKER_PLATFORM) --build-arg TAG=$(TAG) $${base:+--build-arg BUILDER_BASE=$$base} -t $(DOCS_IMAGE):$(TAG) .
+
+$(REPLACE_CACHE_DIR):
+	mkdir -p $@
+
+ifeq ($(DEV_ENV_HAS_DOCGEN),yes)
+
+# Dry-run: scan the template, populate cache directories, and emit one make
+# rule per annotated block into template.d. The rendered output IS the .d
+# file (pandoc emits the RawBlock that replace.lua builds).
+template.d: README.md.template replace.lua | $(REPLACE_CACHE_DIR)
+	REPLACE_CACHE_DIR=$(REPLACE_CACHE_DIR) RECIPES_DIR=$(RECIPES_DIR) \
+	    pandoc -f markdown -t plain \
+	    -M write-user-dependencies=README.md \
+	    -M docs_image=$(DOCS_IMAGE):$(TAG) \
+	    --lua-filter replace.lua README.md.template -o $@
+
+ifeq (,$(filter clean,$(MAKECMDGOALS)))
+-include template.d
+endif
+
+# Diagrams rendered from committed sources under images/. The SVGs are generated
+# into the same dir and committed, like README.md itself, and are regenerated
+# only when a source changes. They are an order-only prereq of README.md below:
+# a render always brings them up to date, without forcing a re-render when only
+# the image bytes change (the template references the path, not the contents).
+# The SVGs have no background of their own, so they inherit the page.
+# state-tree's ink colors depend on the theme, so it is built in a light and a
+# dark variant that the template selects with a <picture>; outputs-tree reads on
+# both themes, so a single variant serves both.
+DOC_DIAGRAMS := \
+    images/outputs-tree.svg \
+    images/state-tree-light.svg images/state-tree-dark.svg
+
+# outputs-tree pins its node positions for a perfectly symmetric binary tree (dot's own
+# layout skews internal nodes), so it renders with neato -n, which uses the given positions
+# and runs no layout. Held nodes are filled and the unmaterialized interiors are transparent
+# outlines, so its colors read on both themes from one variant.
+images/outputs-tree.svg: images/outputs-tree.dot
+	neato -n -Tsvg $< -o $@
+
+# state-tree draws an actual machine's state hash-tree over the address space. It
+# instantiates a machine and reads its memory ranges, so it is a Lua program that emits the
+# SVG directly rather than a Graphviz source. Its first argument selects the palette.
+images/state-tree-light.svg: images/state-tree.lua
+	lua5.4 $< light > $@
+images/state-tree-dark.svg: images/state-tree.lua
+	lua5.4 $< dark > $@
+
+# Real run: render the document. template.d adds per-cache-file prereqs to
+# README.md, so editing a recipe propagates here naturally. check-rootfs-docs is
+# order-only so a recipe-input change that leaves the committed image stale fails
+# the render here (as in CI) without forcing a re-render on every invocation.
+README.md: README.md.template replace.lua alerts.lua github.template.md template.d | check-rootfs-docs $(DOC_DIAGRAMS)
+	REPLACE_CACHE_DIR=$(REPLACE_CACHE_DIR) RECIPES_DIR=$(RECIPES_DIR) \
+	    pandoc -f markdown -s -t gfm --toc \
+	    -M docs_image=$(DOCS_IMAGE):$(TAG) \
+	    --lua-filter replace.lua --lua-filter alerts.lua \
+	    --template=github.template.md \
+	    README.md.template -o $@
+
+README.html: README.md README.md.template replace.lua alerts.lua github.template.html template.d
+	REPLACE_CACHE_DIR=$(REPLACE_CACHE_DIR) RECIPES_DIR=$(RECIPES_DIR) \
+	    pandoc -f markdown+emoji -s -t html5 --toc --mathjax \
+	    -M docs_image=$(DOCS_IMAGE):$(TAG) \
+	    --lua-filter replace.lua --lua-filter alerts.lua \
+	    --template=github.template.html \
+	    README.md.template -o $@
+
+else
+
+# Without docgen tools on the host, delegate the whole build to the docs
+# container. Inside, DEV_ENV_HAS_DOCGEN=yes activates the rules above and
+# evaluates staleness against template.d.
+.PHONY: README.md README.html
+README.md: | check-docs-image
+	@jobs=$(if $(JOBS),$(JOBS),$$(docker run --rm $(DOCS_IMAGE):$(TAG) nproc)); \
+	$(MAKE) docs-image-exec CONTAINER_COMMAND="make -j$$jobs README.md DEV_ENV_HAS_DOCGEN=yes"
+
+README.html: README.md
+	$(MAKE) docs-image-exec CONTAINER_COMMAND="make README.html DEV_ENV_HAS_DOCGEN=yes"
+endif
+
+clean:
+	rm -f README.md README.html template.d
+	rm -f $(RECIPES_DIR)/rootfs-docs.tar
+	rm -f $(ROOTFS_DOCS_KEY) $(ROOTFS_DOCS_KEY)-have
+	rm -rf $(REPLACE_CACHE_DIR)
diff --git a/doc/README.md b/doc/README.md
new file mode 100644
index 000000000..b530edcd2
--- /dev/null
+++ b/doc/README.md
@@ -0,0 +1,8467 @@
+# Table of contents
+
+- [Introduction](#introduction)
+  - [Scalability](#scalability)
+  - [Productivity](#productivity)
+  - [What’s in a machine](#whats-in-a-machine)
+    - [Rolling Cartesi Machines and Cartesi
+      Rollups](#rolling-cartesi-machines-and-cartesi-rollups)
+  - [Documentation](#documentation)
+- [The host perspective](#the-host-perspective)
+  - [Machine playground](#machine-playground)
+  - [Command-line interface](#command-line-interface)
+    - [Initialization](#initialization)
+    - [Interactive sessions](#interactive-sessions)
+    - [Flash drives](#flash-drives)
+    - [Persistent flash drives and
+      NVRAMs](#persistent-flash-drives-and-nvrams)
+    - [Limiting execution](#limiting-execution)
+    - [State hashes](#state-hashes)
+    - [Persistent Cartesi Machines](#persistent-cartesi-machines)
+    - [Running as root](#running-as-root)
+    - [Cartesi Machine templates](#cartesi-machine-templates)
+    - [State value proofs](#state-value-proofs)
+    - [Remote Cartesi Machines](#remote-cartesi-machines)
+    - [Rolling Cartesi Machines](#rolling-cartesi-machines)
+    - [Rolling Cartesi Machine
+      templates](#rolling-cartesi-machine-templates)
+    - [Additional options](#additional-options)
+  - [Lua interface](#lua-interface)
+    - [Instantiation by configuration](#instantiation-by-configuration)
+    - [Default configuration](#default-configuration)
+    - [Generating configurations](#generating-configurations)
+    - [Additional sample
+      configurations](#additional-sample-configurations)
+    - [Loading and running machines](#loading-and-running-machines)
+    - [Instantiation from persistent
+      state](#instantiation-from-persistent-state)
+    - [Limiting execution](#limiting-execution-1)
+    - [Progress feedback](#progress-feedback)
+    - [Cartesi Machine templates](#cartesi-machine-templates-1)
+    - [State hashes](#state-hashes-1)
+    - [External state access](#external-state-access)
+    - [State value proofs](#state-value-proofs-1)
+    - [Remote Cartesi Machines](#remote-cartesi-machines-1)
+    - [Rolling Cartesi Machines](#rolling-cartesi-machines-1)
+    - [Output proofs](#output-proofs)
+    - [State-transition proofs](#state-transition-proofs)
+- [The guest perspective](#the-guest-perspective)
+  - [Linux environment](#linux-environment)
+    - [Building a custom root
+      file-system](#building-a-custom-root-file-system)
+    - [Guest “Hello world!”](#guest-hello-world)
+    - [Flash drives and NVRAMs](#flash-drives-and-nvrams)
+    - [Initialization](#initialization-1)
+    - [Communication between guest and
+      host](#communication-between-guest-and-host)
+  - [System architecture](#system-architecture)
+    - [The main processor](#the-main-processor)
+    - [The microarchitecture](#the-microarchitecture)
+    - [The board](#the-board)
+    - [Linux setup](#linux-setup)
+- [The blockchain perspective](#the-blockchain-perspective)
+  - [Hash-view of state](#hash-view-of-state)
+    - [Slicing and splicing](#slicing-and-splicing)
+    - [Template instantiation](#template-instantiation)
+    - [Result extraction](#result-extraction)
+    - [The output hashes tree](#the-output-hashes-tree)
+    - [Output verification](#output-verification)
+  - [Verification game](#verification-game)
+    - [Settling a dispute](#settling-a-dispute)
+    - [One bisection level](#one-bisection-level)
+    - [Verifying the state transition](#verifying-the-state-transition)
+    - [Verifying the result](#verifying-the-result)
+    - [Running the game](#running-the-game)
+
+# Introduction
+
+The Cartesi Machine is Cartesi’s solution for verifiable computation. It
+was designed to bring mainstream scalability to decentralized
+applications and mainstream productivity to their developers.
+
+## Scalability
+
+Applications running exclusively on smart contracts face severe
+constraints on the amount of data they can manipulate and on the
+complexity of computations they can perform. These limitations manifest
+themselves as exorbitant transaction costs and, even if such costs could
+somehow be overcome, as extremely long computation times.
+
+In comparison, applications running inside Cartesi Machines can process
+practically unlimited amounts of data, and at a pace orders of magnitude
+faster. This is possible because Cartesi Machines run off-chain, free of
+the overhead imposed by the consensus mechanisms used by blockchains.
+
+In a typical scenario, one of the parties involved in an application
+will execute the Cartesi Machine off-chain and report its results to the
+blockchain. Different parties do not need to trust each other because
+the Cartesi platform includes an automatic dispute mechanism for Cartesi
+Machines. All interested parties repeat the computation off-chain and,
+if their results do not agree, they enter into a dispute, which the
+mechanism guarantees to be always won by an honest party against any
+number of dishonest parties.
+
+To enable this dispute mechanism, Cartesi Machines are executed inside a
+special emulator that has three unique properties:
+
+- Cartesi Machines are *self-contained* — They run in isolation from any
+  external influence on the computation;
+- Cartesi Machines are *reproducible* — Two parties performing the same
+  computation always obtain exactly the same results;
+- Cartesi Machines are *transparent* — They expose their entire state
+  for external inspection.
+
+From the point of view of the blockchain, the disputes require only a
+tiny fraction of the amount of computation performed by the Cartesi
+Machine. Dispute resolution thus becomes an ordinary task and dishonest
+parties are generally expected to be exposed, which discourages the
+posting of incorrect results and further increases the efficiency of the
+platform.
+
+Cartesi Machines allow decentralized applications to take advantage of
+vastly increased computing capabilities off-chain, while enjoying the
+same security guarantees offered by code that runs natively as smart
+contracts. This is what Cartesi means by scalability.
+
+## Productivity
+
+Scalability is not the only impediment to widespread blockchain
+adoption. Another serious limiting factor is the reduced developer
+productivity.
+
+Modern software development involves the combination of dozens of
+off-the-shelf software components. Creating these components took the
+concerted effort of an active worldwide community over the course of
+several decades. They have all been developed and tested using
+well-established toolchains (programming languages, compilers, linkers,
+profilers, debuggers, etc.), and rely on multiple services provided by
+modern operating systems (memory management, multi-tasking, file
+systems, networking, etc.).
+
+Smart contracts are developed using ad-hoc toolchains, and run directly
+on top of custom virtual machines, without the support of an underlying
+operating system. This arrangement deprives developers of the tools of
+their trade, severely reduces their expressive power, and consequently
+decimates their productivity.
+
+In contrast, Cartesi Machines are based on a proven platform:
+[RISC-V](https://riscv.org/). RISC-V was born of research in academia at
+UC Berkeley. It is now maintained by its own independent foundation. It
+is important to keep in mind that, unlike many of its academic
+counterparts, RISC-V is not a toy architecture. It is suitable for
+direct native hardware implementation, which is indeed currently
+commercialized by a large (and ever-increasing) number of
+[vendors](https://en.wikipedia.org/wiki/RISC-V#Implementations). This
+means that, in the future, Cartesi will not be limited to emulation or
+binary translation off-chain. The RISC-V platform is supported by a
+vibrant community of developers. Their efforts have produced an
+extensive software infrastructure, most notably ports of the Linux
+Operating System and the GNU toolchain.
+
+By moving key parts of their application logic to run inside Cartesi
+Machines, but on top of the Linux Operating System, developers are
+isolated not only from the limitations and idiosyncrasies of specific
+blockchains, but also from irrelevant details of the Cartesi Machine
+architecture itself. They regain access to all the tools they have come
+to rely on when writing applications.
+
+This is Cartesi’s contribution to empowering application developers to
+express their creativity unimpeded, and to boost their productivity.
+
+## What’s in a machine
+
+The key components of a Cartesi Machine are its main processor and a
+board. The processor that performs the computations, executing the
+traditional fetch-execute loop while maintaining a variety of registers,
+implements a generous set of RISC-V extensions. The board defines the
+surrounding environment with an assortment of memories (RAM, flash
+drives, NVRAMs, etc.) and a number of devices. Memories and devices are
+mapped to the 64-bit physical address space of the Cartesi Machine. The
+amount of RAM, as well as the number, length, and position of the flash
+drives and NVRAMs in the address space can be chosen according to the
+needs of each particular application. The Cartesi Machine emulator is a
+program that carefully implements the Cartesi Machine architecture so
+that its execution is reproducible in production. During development, a
+variety of convenient devices can be added to the Cartesi Machine that
+make prototyping more ergonomic. The emulator can be built from the
+[`cartesi/machine-emulator`](https://github.com/cartesi/machine-emulator)
+repository.
+
+The Cartesi Machine also includes a microarchitecture (uarch) that can
+drive the main processor using a much-reduced RISC-V ISA. This is
+necessary to enable verifiability in architectures that, due to
+computational limitations, cannot emulate a main-processor instruction,
+such as blockchains. Running the uarch until it halts, and then
+resetting the uarch to its pristine state, is equivalent to executing
+one instruction of the main processor. See [the microarchitecture
+section](#the-microarchitecture) for details.
+
+The initialization of a Cartesi Machine typically loads the Linux kernel
+into RAM, and a Linux root file-system (as a flash drive) from regular
+files in the host file-system. The Linux kernel, `linux.bin`, is built by
+the
+[`cartesi/machine-linux-image`](https://github.com/cartesi/machine-linux-image)
+repository. After it is done with its own initialization, the Linux
+kernel cedes control to the `/usr/sbin/cartesi-init` program in the root
+file-system. The root file-system `rootfs.ext2` contains all the data
+files and programs that make up the Linux distribution. It is built by
+the
+[`cartesi/machine-rootfs-image`](https://github.com/cartesi/machine-rootfs-image)
+repository. The components of the guest application can reside in the
+root file-system itself, or in their own, separate file-systems. The
+emulator can be instructed to execute whatever command is necessary to
+start the guest application. For a complete description of the Cartesi
+Machine architecture and the boot process, see the documentation for
+[the guest perspective](#the-guest-perspective).
+
+There are two distinct modes of operation. In the first mode, a Cartesi
+Machine is initialized and tasked to run a guest application until the
+machine *halts*. Inputs for the guest application can be provided as
+additional flash drives with file-systems, or NVRAMs with raw data.
+Outputs are only available to the host after the machine halts. Once it
+halts, the machine cannot perform any additional computations.
+
+In the second mode of operation, the guest application runs in a loop.
+In each iteration, it obtains a request carrying an input, performs any
+necessary computations to service the request, and produces a number of
+responses. Indeed, this is much like a server in which the guest
+application can interact with the outside world. We say that a Cartesi
+Machine operating in this mode is a *Rolling Cartesi Machine*.
+
+### Rolling Cartesi Machines and Cartesi Rollups
+
+Rolling Cartesi Machines accept two types of requests: advance-state
+requests and inspect-state requests. Advance-state requests can create
+persistent changes to the state of the underlying Cartesi Machine. In
+contrast, inspect-state requests leave the state unchanged.
+
+Both types of request are serviced by the guest application, which
+modifies the state of the Cartesi Machine while doing so. When servicing
+an advance-state request, the guest application ultimately either
+accepts or rejects it. The resulting modifications are kept only when
+the request is accepted, and reverted when it is rejected. State
+modifications are always reverted after inspect-state requests are
+serviced.
+
+The stringent demands of reproducibility prevent a Cartesi Machine from
+communicating *directly* with the outside world. Indeed, if two parties
+were to run the same Cartesi Machine and then disagree on the data each
+instance independently obtained from a network connection, there would
+be no way to settle a dispute between them. Instead, Rolling Cartesi
+Machines communicate with the outside world under controlled conditions,
+through *Cartesi Rollups*.
+
+In a nutshell, Cartesi Rollups uses the blockchain to maintain a public
+record of advance-state requests targeting each Rolling Cartesi Machine.
+Both the order and the inputs carried by these requests are recorded and
+made available in an indisputable fashion. Since Cartesi Machines are
+deterministic, and since the inputs are agreed upon, the state of a
+Rolling Cartesi Machine can be advanced in a well-defined way, always
+producing the same set of responses, no matter who runs it.
+
+After producing each response to a request, the guest application asks
+the machine to *yield* control back to the host. The host extracts the
+response and *resumes* the machine. When done with a given input, the
+guest application once again asks the machine to yield control back to
+the host. At the same time, it notifies the host whether the input was
+accepted or rejected. The host then prepares the input for the next
+request, and *resumes* either the modified machine or a backup copy, so
+the guest application can service the next request in a new iteration of
+its loop. Inputs and responses are transferred in special memory ranges
+(*CMIO* memory ranges).
+
+Advancing the state of a Rolling Cartesi Machine can produce four types
+of response: *vouchers*, *notices*, *reports*, and *exceptions*.
+Vouchers allow a Rolling Cartesi Machine to interact back with the
+blockchain. A voucher issued by the guest application may, for example,
+grant a user the right to withdraw tokens locked into a custodial smart
+contract. Notices are used to register noteworthy changes to the state
+of the guest application. A notice may be issued, for example,
+announcing the demise of a character in a game or some other relevant
+state transition. Disputes over the fact that a voucher or notice has
+been generated while advancing the state of a Rolling Cartesi Machine
+can be settled by Cartesi Rollups. Reports, in contrast, are used to
+output any data that is irrelevant to the blockchain. A report may, for
+example, provide diagnostic information on the reasons why an input has
+been rejected.
+
+*Rejecting an input not only reverts the state, but also cancels all
+vouchers and notices emitted while the request was serviced.*
+
+The advance-state requests serviced by a Rolling Cartesi Machine are
+grouped into *epochs*. At the end of an epoch, the state of the machine
+is finalized, so its state hash becomes known. From the finalized state
+one can read the *output hashes root hash*, a single hash that commits
+to every voucher and notice the machine has ever emitted. This hash is
+the root of a Merkle tree maintained inside the machine, where each leaf
+is the hash of one of the outputs, in the order they are emitted. (The
+index of an output is its leaf position.) Given the contents of an
+output, and a proof that its hash is the leaf at that index in the tree,
+it is therefore possible to verify that the machine has in fact produced
+that output. This is how Cartesi Rollups settles disputes over the
+vouchers and notices a Rolling Cartesi Machine produces.
+
+Between state advances, it is possible to inspect the state of a Rolling
+Cartesi Machine. This works by sending a query for processing inside the
+Cartesi Machine. State inspection produces only reports and exceptions.
+*All modifications to the state due to servicing queries are reverted
+after the responses are collected.*
+
+An exception, which either kind of request may produce, signals an
+irrecoverable error encountered by the guest application.
+
+## Documentation
+
+Cartesi Machines can be seen from three different perspectives:
+
+- *The host perspective* — This is the environment right outside the
+  Cartesi Machine emulator. It is most relevant to developers setting up
+  Cartesi Machines, running them, or manipulating their contents. It
+  includes the emulator’s API in all its flavors: C, C++, Lua, JSON-RPC,
+  and the command-line interface;
+- *The guest perspective* — This is the environment inside the Cartesi
+  Machine. It encompasses Cartesi’s particular flavor of the RISC-V
+  architecture, as well as the organization of the Linux Operating
+  System that runs on top of it. It is most relevant to programmers
+  responsible for the application components that run off-chain but must
+  be verifiable. The cross-compiling toolchain, and the tools used to
+  build the Linux kernel and the Linux root file-systems are also
+  important from this perspective, even though they are used in the
+  host;
+- *The blockchain perspective* — This is the view smart contracts have
+  of Cartesi Machines. It consists almost exclusively of the
+  manipulation of cryptographic hashes of the state of Cartesi Machines
+  and parts thereof. In particular, using only hash operations, the
+  blockchain can verify assertions concerning the contents of the state,
+  and can obtain the state hash that results from modifications to the
+  state. Notably, this includes direct verification by the blockchain of
+  RISC-V instructions performed by the uarch, and ZK proofs of batches
+  of RISC-V instructions performed by the main processor.
+
+As with every computer, the level of knowledge required to interact with
+Cartesi Machines depends on the nature of the application being created.
+Simple applications make only modest demands of each kind of developer.
+Guest developers code a few scripts invoking pre-installed software
+components. Host developers fill out a configuration file specifying the
+location of the components needed to build a Cartesi Machine. Blockchain
+developers instantiate one of the high-level contracts provided by
+Cartesi. At the other extreme are the developers contributing to the
+Cartesi ecosystem, who regularly write, build, and deploy custom
+software components to run in the guest, or even change the Linux kernel
+to support Cartesi-specific devices. Additionally, these developers
+programmatically control the creation and execution of Cartesi Machines
+in the host, and must also understand and use the hash-based state
+manipulation primitives the blockchain needs.
+
+Although Cartesi’s goal is to shield platform users from as much
+complexity as possible, there is value in making information available
+to the greatest extent possible. To that end, this documentation of
+Cartesi Machines aims to provide enough information to cover all three
+perspectives, at all depths of understanding.
+
+# The host perspective
+
+Cartesi’s reference off-chain implementation of a Cartesi Machine is
+based on software emulation. The emulator is written in C++23 with
+well-insulated POSIX dependencies. The
+[`cartesi/machine-emulator`](https://github.com/cartesi/machine-emulator)
+repository can be used to build and install the Cartesi Machine
+emulator. The emulator is implemented by a C++ class that can be
+accessed in a variety of different ways.
+
+When linked to a C++ application, the emulator can be controlled
+directly via the interface of the `cartesi::machine` class. C
+applications can control the emulator in a similar way, by means of a
+matching C API defined in the include file `cm.h`. The C API is stable
+and complete. It is the basis for the creation of bindings in other
+programming languages, most notably the Lua programming language. The
+emulator can be accessed via a `cartesi` module that exposes a
+`cartesi.machine` interface to Lua programs. Additionally, Cartesi
+provides a JSON-RPC server that can run a Cartesi Machine instance that
+is controlled remotely. The server supports JSON-RPC discovery so client
+libraries can be generated automatically. Finally, there is a
+command-line utility (written in Lua) that can configure and run Cartesi
+Machines for rapid prototyping. The C, C++, and Lua APIs, as well as the
+command-line utility, can seamlessly instantiate local emulators or
+connect to remote JSON-RPC servers.
+
+The documentation starts from the command-line utility,
+`cartesi-machine`. This utility is used for most prototyping tasks. The
+documentation then covers the Lua interface of `cartesi.machine`. The C,
+C++, and JSON-RPC interfaces closely mirror the Lua interface documented
+here, so this document does not cover them separately. The C API is
+defined in the `cm.h` header. The JSON-RPC API supports discovery, so
+client bindings can be generated from a running server.
+
+## Machine playground
+
+The setup of a new development environment is often a time-consuming
+task. This is particularly true in the case of cross-development
+environments (i.e., when the development happens in a host platform but
+software runs in a different target platform). With this in mind, the
+Cartesi team provides the `cartesi/machine-emulator-docs` Docker image
+for use while reading this documentation. The Docker image enables
+immediate experimentation with Cartesi Machines, as well as the
+generation of the documentation itself. It comes with a pre-built
+emulator and Lua interpreter accessible within the command-line, as well
+as a pre-built RAM image and root file-system. It also comes with the
+cross-compiler for the RISC-V architecture on which the Cartesi Machine
+is based.
+
+To enter the playground, open a terminal, download the Docker image from
+Cartesi’s repository, and run it, mapping the current user and group
+information into the container and making the host’s current directory
+available inside it:
+
+``` bash
+docker pull cartesi/machine-emulator-docs:devel
+```
+
+``` bash
+docker run \
+    --hostname playground \
+    --name playground \
+    --rm \
+    -e USER=$(id -u -n) \
+    -e GROUP=$(id -g -n) \
+    -e UID=$(id -u) \
+    -e GID=$(id -g) \
+    -v "$(pwd)":/work \
+    -w /work \
+    -it \
+    cartesi/machine-emulator-docs:devel \
+    /bin/bash
+```
+
+Once inside, you can execute the `cartesi-machine` utility as follows:
+
+``` bash
+cartesi-machine --help | head -n 40
+```
+
+``` text
+Usage:
+
+  /usr/share/lua/5.4/cartesi-machine.lua [options] [command] [arguments]
+
+where options are:
+  --help
+    display this information.
+
+  --version
+    display cartesi machine version information and exit.
+
+  --version-json
+    display cartesi machine semantic version and exit.
+
+  --bash-completion
+    print a bash completion script for this program to stdout and exit.
+    Install with: source <(cartesi-machine --bash-completion)
+
+  --assert-version=<major>.<minor>[.<patch>]
+    exit with failure in case the cartesi machine emulator version mismatches
+
+  --remote-spawn
+    spawns a remote cartesi machine,
+    when --remote-address is specified, it listens on the specified address,
+    otherwise it listens on "127.0.0.1:0".
+
+  --remote-address=<ip>:<port>
+    use a remote cartesi machine listening to <ip>:<port> instead of
+    running a local cartesi machine.
+
+  --remote-health-check
+    checks health of remote server and exit
+
+  --remote-fork[=<ip>:<port>]
+    fork the remote cartesi machine before the execution,
+    in case an address is specified the new forked server will be rebound to it.
+
+  --remote-shutdown
+    shutdown the remote cartesi machine after the execution.
+
+...
+```
+
+A final check can also be performed to verify if the contents inside the
+container are as expected:
+
+``` bash
+sha256sum /usr/share/cartesi-machine/images/linux.bin
+```
+
+``` text
+9fb5aaa623f35c0ef2138c8dadf1b0a1e388e0f51758cb6a5477ec5cecd3a029  /usr/share/cartesi-machine/images/linux.bin
+```
+
+``` bash
+sha256sum /usr/share/cartesi-machine/images/rootfs.ext2
+```
+
+``` text
+fe62e2afa2d46eb85b79380f7fce5e47c9852c0b4c93ca751fe96923b555843c  /usr/share/cartesi-machine/images/rootfs.ext2
+```
+
+Note that, if the hashes of the files you are using do not match the
+ones above, then when you attempt to replicate the examples in the
+documentation, you will obtain different hashes. Moreover, the cycle
+counts and outputs may also differ.
+
+## Command-line interface
+
+In the simplest usage scenario, the `cartesi-machine` command-line
+utility can be used to define a Cartesi Machine and run it until it
+halts. The command-line utility, however, is very versatile. It was
+designed to simplify the most common prototyping tasks.
+
+The simplest invocation takes no arguments
+
+``` bash
+cartesi-machine
+```
+
+and produces the output
+
+``` text
+
+         .
+        / \
+      /    \
+\---/---\  /----\
+ \       X       \
+  \----/  \---/---\
+       \    / CARTESI
+        \ /   MACHINE
+         '
+
+Nothing to do.
+
+Halted
+Cycles: 41860482
+```
+
+The utility instantiates a default Cartesi Machine and runs it until it
+halts. The Linux kernel boots, the Cartesi-provided `cartesi-init`
+script prints the ASCII-art splash and reports there is nothing to do,
+then gracefully halts the machine. This takes many millions of cycles to
+complete: time mostly spent initializing the Linux kernel. The utility
+regains control from the emulator, and prints the `Halted` message and
+the cycle count.
+
+### Initialization
+
+The following command instructs `cartesi-machine` to build a Cartesi
+Machine. The machine has 128MiB of RAM, uses `linux.bin` as the RAM
+image, and uses `rootfs.ext2` as the root file-system. (`linux.bin` is
+generated by
+[machine-linux-image](https://github.com/cartesi/machine-linux-image)
+and `rootfs.ext2` is generated by
+[machine-rootfs-image](https://github.com/cartesi/machine-rootfs-image).
+Sample files are available in the `cartesi/machine-emulator-docs` Docker
+image, which can be built from the `doc/` directory of the
+[machine-emulator](https://github.com/cartesi/machine-emulator)
+repository.) Once initialization is complete, the machine executes the
+command `ls /bin` and exits.
+
+``` bash
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    --ram-length=128Mi \
+    --ram-image="/usr/share/cartesi-machine/images/linux.bin" \
+    --flash-drive="label:root,data_filename:/usr/share/cartesi-machine/images/rootfs.ext2" \
+    -- ls /bin
+```
+
+The `--quiet` option suppresses the output of `cartesi-machine.lua`
+itself, leaving visible only what is produced inside the machine. The
+command-line option `--no-init-splash` instructs the utility to skip the
+splash, keeping the output focused on the example at hand. The
+`--ram-image`, `--ram-length`, and `--flash-drive` command-line options
+have the values in the example as default, so these options can be
+omitted. To remove these default settings, use the command-line options
+`--no-ram-image` and `--no-root-flash-drive`, respectively.
+
+The simplified command-line is
+
+``` bash
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    -- ls /bin
+```
+
+The output is
+
+``` text
+'['			   gunzip	      rgrep
+ addpart		   gzexe	      rm
+ apt			   gzip		      rmdir
+ apt-cache		   hardlink	      rollup
+ apt-cdrom		   head		      rollup-http-server
+ apt-config		   hex		      rollup-init
+ apt-get		   hostid	      run-parts
+ apt-key		   hostname	      runcon
+ apt-mark		   iconv	      savelog
+ arch			   id		      script
+...
+```
+
+It shows the listing of directory `/bin/` inside the root file-system.
+The listing was produced by the entrypoint command that follows the `--`
+separator in the command line. By a method explained in great detail
+later on (see [The guest perspective initialization](#initialization-1)),
+the entrypoint is picked up by the Cartesi-provided
+`/usr/sbin/cartesi-init`, which executes it before gracefully halting
+the machine.
+
+> [!NOTE]
+>
+> In many of the documentation examples, the utilities invoked from the
+> command-line executed by a Cartesi Machine are in the default search
+> path for executables. (This is set up by the Cartesi-provided
+> `/usr/sbin/cartesi-init` script itself.) When in doubt, or when using
+> your own executables installed in custom locations, make sure to
+> invoke them by using their full paths (e.g., `/bin/ls` or `/bin/sh`
+> instead of simply `ls` or `sh`).
+
+### Interactive sessions
+
+By default, the `cartesi-machine` utility executes the Cartesi Machine
+in non-interactive mode. Verifiable computations must always be run in
+non-interactive sessions. User interaction with a Cartesi Machine via
+the console is, after all, not reproducible. Nevertheless, during
+development, it is often convenient to directly interact with the
+emulator, as if using a computer console.
+
+The command-line option `-i` (short for `--htif-console-getchar`)
+instructs the emulator to monitor the console for input, and to make
+this input available to the Linux kernel. Typically, this option will be
+used in conjunction with the `--` separator and the command `sh`,
+causing the Cartesi-provided `/usr/sbin/cartesi-init` script to drop
+into an interactive shell. Interaction with the shell enables the
+exploration of the Linux distribution from the inside. Exiting the shell
+returns control back to `/usr/sbin/cartesi-init`, which then gracefully
+halts the machine.
+
+For example, if an interactive session is started with the following
+command
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    -i \
+    -- sh
+```
+
+it drops into the shell. Running the command `ls /bin` causes the
+listing of directory `/bin` to appear. Pressing Ctrl+D at the prompt
+then causes the shell to exit. The output is
+
+``` text
+$ ls /bin
+'['			   gunzip	      rgrep
+ addpart		   gzexe	      rm
+ apt			   gzip		      rmdir
+ apt-cache		   hardlink	      rollup
+ apt-cdrom		   head		      rollup-http-server
+ apt-config		   hex		      rollup-init
+ apt-get		   hostid	      run-parts
+ apt-key		   hostname	      runcon
+ apt-mark		   iconv	      savelog
+...
+```
+
+> [!NOTE]
+>
+> When running in interactive mode, not even the final cycle count is
+> reproducible. To avoid busy-waiting for new interactive input, the
+> emulator sleeps from one Cartesi Machine timer interrupt to the next,
+> skipping Cartesi Machine cycles forward so programs running inside
+> stay *roughly* in sync with wall-clock time outside. This dynamic
+> balancing act is sure to vary between executions and across different
+> computers.
+
+### Flash drives
+
+The command-line option
+`--flash-drive=label:<label>,data_filename:<filename>` can be used to
+add between 1 and 8 flash drives to the Cartesi Machine. Here, the
+string `<label>` is the *label* for the flash drive, and `<filename>`
+points to an *image file* with the initial contents of the flash drive.
+When the image file contains a valid file-system, the `cartesi-machine`
+command-line utility instructs `/usr/sbin/cartesi-init` to mount it at
+`/mnt/<label>`.
+
+To enable transparency, Cartesi Machine flash drives are mapped into the
+machine’s 64-bit address space. The start and length are set,
+respectively, by the `start:<number>` and `length:<number>` parameters
+to `--flash-drive`.
+
+When the `length` parameter is omitted, the `cartesi-machine` utility
+automatically sets the size of a flash drive to match the size of its
+image file. Because RISC-V uses 4KiB pages, image files must have a size
+that is a multiple of 4KiB. (The `truncate` utility can be used to pad a
+file with zeros so its size is a multiple of 4KiB.)
+
+For convenience, numbers can be specified in decimal or hexadecimal
+(e.g., `4096` or `0x1000`) and may include a suffix multiplier (i.e.,
+`Ki` to multiply by 2<sup>10</sup>, `Mi` to multiply by 2<sup>20</sup>,
+and `Gi` to multiply by 2<sup>30</sup>). They can also use the C
+programming language *shift left* notation to multiply by arbitrary
+powers of 2 (e.g., `1 << 24`, meaning 2<sup>24</sup>).
+
+When the `length` of a drive is specified, the `data_filename` parameter
+can be omitted. In that case, the drive starts in a *pristine* state:
+i.e., filled with zeros. If, however, both `length` and `data_filename`
+are specified, then the `length` must exactly match the size of the
+image file referred to by the `data_filename` parameter.
+
+The positioning of memory ranges in the machine’s address space has
+implications on certain operations, discussed in detail under [the
+blockchain perspective](#hash-view-of-state), that involve the
+manipulation of hashes of the Cartesi Machine state. First, memory
+ranges cannot overlap with each other. Second, memory ranges must start
+at positions that are aligned to their lengths. Finally, the lengths
+used to restrict the starts and to detect overlaps are rounded up to the
+next power of 2.
+
+When the `start` of a drive is omitted, the emulator automatically
+places it following the rules above. The first drive is placed past the
+RAM, and each remaining drive is placed past the previous one.
+
+The preferred file-system type is `ext2`. This is because `ext2` image
+files can be easily created with the `xgenext2fs` command-line utility
+(a Cartesi fork of `genext2fs`) and manipulated with `e2ls`, `e2cp`,
+`e2rm`, etc. All of these utilities come pre-installed in the
+`cartesi/machine-emulator-docs` Docker image (the `e2tools` package also
+provides `e2ls`, `e2cp`, and `e2rm` individually for Ubuntu hosts).
+Support for `ext4` is also enabled by default in the kernel. (Support
+for additional file-systems can be enabled by modifying the
+configuration that
+[`cartesi/machine-linux-image`](https://github.com/cartesi/machine-linux-image)
+uses to produce `linux.bin`.)
+
+For example,
+
+``` bash
+mkdir foo
+echo "Hello world!" > foo/bar.txt
+tar \
+    --sort=name \
+    --mtime="2022-01-01" \
+    --owner=1000 \
+    --group=1000 \
+    --numeric-owner \
+    -cf foo.tar \
+    --directory=foo .
+xgenext2fs \
+    -fzB 4096 \
+    -i 4096 \
+    -a foo.tar \
+    foo.ext2
+```
+
+> [!NOTE]
+>
+> The flags above are the base set used in all `xgenext2fs` examples in
+> this documentation. The `-a foo.tar` flag tells `xgenext2fs` to
+> populate the image from a `tar` archive rather than from a directory
+> tree. The `-f` (faketime) flag zeros the modification times that
+> `xgenext2fs` would otherwise read from the inputs. The `-z` flag
+> writes a sparse file, leaving unwritten blocks as holes on disk. The
+> `-B 4096` flag sets the block size to 4096 bytes. The `-i 4096` flag
+> requests one inode per 4096 bytes of data.
+>
+> The tar detour is what makes the output reproducible. Running
+> `xgenext2fs` directly on a directory tree would record modification
+> times, user and group IDs, and traverse the directory in an
+> unspecified order. The `-f` flag fixes the timestamp problem, but does
+> nothing about the rest. The `tar` invocation above pins the file order
+> (`--sort=name`), the timestamps (`--mtime`), and the user and group
+> IDs (`--owner`, `--group`, `--numeric-owner`). `xgenext2fs` then walks
+> the archive in deterministic order and emits a byte-identical
+> file-system on every run.
+
+The image can be loaded as a flash drive:
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --flash-drive="label:foo,data_filename:foo.ext2" \
+    -- "cat /mnt/foo/bar.txt"
+```
+
+Here, a flash drive with label `foo` is initialized with the contents of
+an `ext2` file-system in the image file `foo.ext2`. The Cartesi-provided
+`/usr/sbin/cartesi-init` mounts this as `/mnt/foo`. The command executed
+in the machine simply copies the contents of `/mnt/foo/bar.txt` to the
+terminal. The output is
+
+``` text
+Hello world!
+
+Halted
+Cycles: 56572298
+```
+
+### Persistent flash drives and NVRAMs
+
+By default, the emulator does *not* modify the image files associated with
+any of its memory ranges (such as the RAM, flash drives, and NVRAMs).
+However, since these image files can be very large, the emulator does
+not pre-allocate any host memory for them. Instead, it uses the
+operating system’s memory mapping capabilities. The operating system
+reads to host memory only those pages from the image file that are
+actually read by code executing in the guest. (Naturally, when a state
+hash is requested, all image files are read from disk in their entirety
+and processed. See below.) These image files are mapped to host memory
+in a *copy-on-write* fashion. When code running in the guest causes the
+emulator to write to a mapped image file, the operating system makes a
+copy of the page before modification and replaces the mapping to point
+to the fresh copy. The image files are never written to. (The
+`--dump-memory-ranges` command-line option can be used to inspect the
+modified copies for debugging purposes. See below.)
+
+> [!NOTE]
+>
+> The entrypoint commands executed by the Cartesi-provided
+> `/usr/sbin/cartesi-init` run as the unprivileged user `dapp`. By
+> default, every flash drive is mounted with the ownership and
+> permissions baked into its image file, which typically means its root
+> directory is owned by `root`. As a result, `dapp` can read the drive
+> but cannot write to it. To allow writes, pass `user:dapp` to the
+> `--flash-drive` command-line option so the emulator changes the owner
+> of the drive’s mount point to `dapp` after mounting. The same is true
+> of NVRAMs: by default, they are only writeable by `root`.
+> Alternatively, the `--user=root` command-line option causes
+> `/usr/sbin/cartesi-init` to run commands as `root`, which can write to
+> the drive without any ownership changes. For safety, running as `dapp`
+> is preferred.
+
+For example, running the machine
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --flash-drive="label:foo,data_filename:foo.ext2,user:dapp" \
+    -- "ls /mnt/foo/*.txt && cp /mnt/foo/bar.txt /mnt/foo/baz.txt && ls /mnt/foo/*.txt"
+```
+
+produces the output
+
+``` text
+/mnt/foo/bar.txt
+/mnt/foo/bar.txt  /mnt/foo/baz.txt
+
+Halted
+Cycles: 62126424
+```
+
+indicating that the file-system was modified, at least from the
+perspective of the guest. However, inspecting the `foo.ext2` image file
+from outside the emulator shows it is unchanged.
+
+``` bash
+e2ls -aln foo.ext2:*.txt
+```
+
+``` text
+         11  -rw-r--r--  1000  1000       13  1-Jan-1970 00:00 bar.txt
+```
+
+This behavior is appropriate when the flash drives will only be used as
+inputs. For output flash drives, guest changes to the drives must be
+reflected in the associated image files. For that purpose, the parameter
+`shared` can be passed to command-line option `--flash-drive`, causing
+the image files to be mapped to host memory in a *shared* fashion. For
+example,
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --flash-drive="label:foo,data_filename:foo.ext2,shared,user:dapp" \
+    -- "ls /mnt/foo/*.txt && cp /mnt/foo/bar.txt /mnt/foo/baz.txt && ls /mnt/foo/*.txt"
+```
+
+produces exactly the same output as before. However, `e2ls` now shows
+the image file `foo.ext2` has indeed been modified.
+
+``` bash
+e2ls -aln foo.ext2:*.txt
+```
+
+``` text
+         11  -rw-r--r--  1000  1000       13  1-Jan-1970 00:00 bar.txt
+         12  -rw-r--r--  1001  1001       13  1-Jan-1970 00:00 baz.txt
+```
+
+### Limiting execution
+
+The machine’s processor includes a control and status register (CSR),
+named `mcycle`, that starts at 0 and is incremented after every
+instruction cycle. By default, the `cartesi-machine` utility only returns
+when the machine halts (or performs a manual yield), as the [introductory
+example](#command-line-interface) showed. The maximum cycle can be
+specified with the command-line option `--max-mcycle=<number>`.
+
+For example, running
+
+``` bash
+cartesi-machine --max-mcycle=37056250
+```
+
+produces the output
+
+``` text
+
+         .
+        / \
+      /    \
+\---/---\  /----\
+ \       X       \
+  \----/  \---/---\
+       \    / CARTESI
+```
+
+Note the execution was interrupted before the splash screen was even
+completed. The ability to limit computation to an arbitrary number of
+cycles is fundamental to the verifiability of Cartesi Machines, as is
+explained in detail under the [blockchain
+perspective](#verification-game).
+
+### State hashes
+
+The `cartesi-machine` utility can also be used to print Cartesi Machine
+state hashes. State hashes are Merkle tree root hashes of the entire
+64-bit address space of the Cartesi Machine, where the leaves are
+aligned 256-bit words. (See [Hash-view of state](#hash-view-of-state)
+for an explanation of Merkle trees.) Since Cartesi Machines are
+transparent, the contents of this address space encompass the entire
+machine state, including all processor CSRs and general-purpose
+registers, the contents of RAM, of all flash drives and NVRAMs, and of
+all other devices connected to the board, and even the state of the
+uarch. State hashes therefore work as cryptographic signatures of the
+machine, and implicitly of the computation they are about to execute.
+
+To obtain the state hash right before execution starts, use the
+command-line option `--initial-hash`. Conversely, to obtain the state
+hash right after execution is done, use the option `--final-hash`. For
+example,
+
+``` bash
+cartesi-machine \
+    --max-mcycle=37056250 \
+    --initial-hash \
+    --final-hash
+```
+
+produces the output
+
+``` text
+0: d28274b4ff458388fccda9766418ad2412e25ca3f745290e8258462a6bf2fbcb
+
+         .
+        / \
+      /    \
+\---/---\  /----\
+ \       X       \
+  \----/  \---/---\
+       \    / CARTESI
+37056250: 9b691ed47293f8ec0db5a89c65496f1c61f4c5e9e47d842d9d2a11c56a3152c3
+```
+
+The initial state hash `d28274b4…` is the Merkle tree root hash for the
+initial Cartesi Machine state. Since Cartesi Machines are reproducible,
+the initial state hash also works as a *promise* on the result of the
+entire computation.
+
+In other words, the “final state hash” `9b691ed4…` is the “only”
+possible outcome for the `--final-hash` at cycle `37056250`, given the
+result of the `--initial-hash` operation was `d28274b4…`.
+
+> [!NOTE]
+>
+> The scare quotes around “only” are pedantic. It is true that there are
+> a multitude of machine states that produce the same state hash. After
+> all, the Keccak-256 state hashes fit in 256 bits, whereas machine
+> states can take gigabytes. There are therefore many more possible
+> machine states than possible state hashes. By the pigeonhole
+> principle, there must be multiple machines with the same hash (i.e.,
+> hash collisions). However, given only the state hash, finding a
+> Cartesi Machine with that state hash should be virtually impossible.
+> Given a Cartesi Machine and its state hash, finding a *second*
+> (distinct) Cartesi Machine with the same state hash should also be
+> virtually impossible. Even finding two different Cartesi Machines that
+> have the same state hash (any hash) should be virtually impossible.
+> Cryptographic hash functions, such as Keccak-256, were designed
+> *specifically* to have these properties.
+
+Allowing the machine to run until it halts
+
+``` bash
+cartesi-machine \
+    --initial-hash \
+    --final-hash
+```
+
+produces instead the output
+
+``` text
+0: d28274b4ff458388fccda9766418ad2412e25ca3f745290e8258462a6bf2fbcb
+
+         .
+        / \
+      /    \
+\---/---\  /----\
+ \       X       \
+  \----/  \---/---\
+       \    / CARTESI
+        \ /   MACHINE
+         '
+
+Nothing to do.
+
+Halted
+Cycles: 41860482
+41860482: e8cf5abc4fd1c72a6ec106c9d3f9ad2f2053ef6d142864fc12c5e084458ac0bc
+```
+
+Naturally, the initial state hash is the same as before.
+
+However, the final state hash `e8cf5abc…` now pertains to cycle
+`41860482`, where the machine is halted. This is the “only” possible
+state hash for a *halted* machine that started from state hash
+`d28274b4…`.
+
+### Persistent Cartesi Machines
+
+At any point in their execution, Cartesi Machines can be stored to disk.
+A stored machine can later be loaded to continue its execution from
+where it left off. To store a machine to a given `<directory>`, use the
+command-line option `--store=<directory>`. (In `<directory>`, the `%h`
+escape will be replaced by the state hash in hex.) The machine is stored
+as it was right before `cartesi-machine` returns to the command line.
+For example, to store the machine corresponding to state hash
+`9b691ed4…`, run
+
+``` bash
+cartesi-machine \
+    --max-mcycle=37056250 \
+    --store="machine-%8h"
+```
+
+This command creates a directory `machine-9b691ed4`, containing a
+variety of files that allow the Cartesi Machine emulator to recreate a
+machine state. Every image file is copied into the directory, so no
+external dependencies remain.
+
+> [!NOTE]
+>
+> If the machine initialization involved large image files or a
+> considerable amount of RAM, this operation may consume significant
+> disk space. It will also take the time required by the copying of
+> image files into the directory, and by the computation of the state
+> hash.
+
+If the directory already exists, the operation will fail. (This prevents
+the overwriting of a Cartesi Machine by mistake.) Once created, the
+directory can be compressed and transferred to other hosts. To restore
+the corresponding Cartesi Machine, use the command-line option
+`--load=<directory>`. For example,
+
+``` bash
+cartesi-machine \
+    --load="machine-9b691ed4" \
+    --initial-hash \
+    --final-hash
+```
+
+produces the output
+
+``` text
+Loading machine: please wait
+37056250: 9b691ed47293f8ec0db5a89c65496f1c61f4c5e9e47d842d9d2a11c56a3152c3
+
+        \ /   MACHINE
+         '
+
+Nothing to do.
+
+Halted
+Cycles: 41860482
+41860482: e8cf5abc4fd1c72a6ec106c9d3f9ad2f2053ef6d142864fc12c5e084458ac0bc
+```
+
+Note that, other than `--load`, no initialization command-line options
+were used. These initializations were used to define the machine before
+it was stored: their values are implicitly encoded in the stored state.
+The machine continues from where it left off, and reaches the same final
+state hash `e8cf5abc…`, as if it had never been interrupted.
+
+Note also that the initial state hash `9b691ed4…` after `--load` matches
+the final state hash before `--store`. After all, they are state hashes
+concerning the state of the same machine at the same cycle. `--load`
+verifies the archive format version recorded in the stored machine, and
+the pre-store and post-load state hashes are equal because the same
+machine state is restored.
+
+The `cartesi-machine-stored-hash` command-line utility can be used to
+extract the state hash from a stored Cartesi Machine. The command
+
+``` bash
+cartesi-machine-stored-hash machine-9b691ed4
+```
+
+produces the output
+
+``` text
+9b691ed47293f8ec0db5a89c65496f1c61f4c5e9e47d842d9d2a11c56a3152c3
+```
+
+### Running as root
+
+Starting at version 4.0 of `rootfs.ext2`, the Cartesi-provided
+`/usr/sbin/cartesi-init` script runs the entrypoint command as
+`uid=1001(dapp) gid=1001(dapp) groups=1001(dapp)`. This can be seen by
+running:
+
+``` bash
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    -- id
+```
+
+It shows the user and group are indeed `dapp`:
+
+``` text
+uid=1001(dapp) gid=1001(dapp) groups=1001(dapp)
+```
+
+To instead run your guest application as `root`, pass the `--user=root`
+command-line option:
+
+``` bash
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    --user=root \
+    -- id
+```
+
+The output now shows the user and group are `root`:
+
+``` text
+uid=0(root) gid=0(root) groups=0(root)
+```
+
+Running as root is not recommended. To perform setup tasks that require
+elevated permissions, use instead the `--append-init` command-line
+option:
+
+``` bash
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    --append-init="echo Before init ends: && id" \
+    -- "echo After entrypoint starts: && id"
+```
+
+This runs the init part as `root`, but the entrypoint part as `dapp`:
+
+``` text
+Before init ends:
+uid=0(root) gid=0(root)
+After entrypoint starts:
+uid=1001(dapp) gid=1001(dapp) groups=1001(dapp)
+```
+
+The `--append-init-file=<filename>` command-line option works like
+`--append-init`, but appends to init the entire contents of file
+`<filename>`.
+
+### Cartesi Machine templates
+
+*Templates* are one of the key uses for Cartesi Machines stored to disk.
+Cartesi Machine templates are machines in which the contents of one or
+more flash drives or NVRAMs are still unknown. To put it another way,
+Cartesi Machine templates behave like functions whose parameters are the
+yet-to-be-defined contents of these drives.
+
+As discussed in detail under [the blockchain
+perspective](#hash-view-of-state), starting from template hashes, the
+hashes of the drives, and a small amount of additional information, it
+is possible to obtain the state hash of the *instantiated template*—the
+state hash for a Cartesi Machine with drives replaced by their actual
+contents. This is how a smart contract can specify a computation to be
+performed off-chain over arbitrary input. Starting from the template
+hash, and in possession of the drive hashes, it instantiates the
+template, generating the initial state hash for the corresponding
+Cartesi Machine.
+
+As an example, consider a Cartesi Machine that operates as an
+arbitrary-precision arithmetic expression evaluator. The machine will
+take the expression in text format from an input NVRAM labeled `input`,
+and will copy the output in text format into an output NVRAM labeled
+`output` (`shared`, of course, so the output persists after the emulator
+is done).
+
+NVRAMs bind directly to a memory-backed UIO device exposed inside the
+guest as `/dev/uioN`. Unlike flash drives, they have no file-system
+layer and no page cache between the guest and the underlying memory
+range, so writes are immediately visible to the emulator and there is no
+need to flush a cache before snapshotting. This makes NVRAMs faster than
+flash drives for cases where the guest only needs raw access to a region
+of bytes.
+
+Because UIO devices do not support ordinary `read()` or `write()`
+against the device file, the machine guest utilities include the
+`readmmap` and `writemmap` tools to read and write NVRAMs. They resolve
+the label, `mmap()` the device, and copy bytes to/from standard input or
+standard output. Both also work on flash drives.
+
+The `bc` command-line utility is the perfect tool to evaluate the
+arithmetic expressions. The command passed to `cartesi-machine` below
+uses `readmmap` to read the contents of the input NVRAM, extracts a
+zero-terminated string from it using a tiny Lua script run by the
+`lua5.4` interpreter, pipes the result through `bc`, and uses
+`writemmap` to copy the result back into the output NVRAM. Here is the
+sample playground session
+
+``` bash
+truncate -s 4K output.raw
+echo "6*2^1024 + 3*2^512" > input.raw
+truncate -s 4K input.raw
+cartesi-machine \
+    --no-init-splash \
+    --nvram="label:input,length:1<<12,data_filename:input.raw" \
+    --nvram="label:output,length:1<<12,data_filename:output.raw,shared,user:dapp" \
+    -- $'readmmap input | lua5.4 -e \'print((string.unpack("z", io.read("a"))))\' | bc | writemmap output'
+```
+
+> [!NOTE]
+>
+> The `$'...'` form here is bash’s ANSI-C-quoted string, used throughout
+> the manual for entrypoint commands. It passes the contents to
+> `cartesi-machine` as a single argument, leaves host-side variable
+> references like `$i` unexpanded (so they reach the guest shell
+> verbatim), and accepts `\'` as an escape for a single quote inside the
+> string. This last property matters when the entrypoint wraps a
+> single-quoted sub-command, such as a `lua5.4 -e '...'` invocation.
+
+Using the `truncate` command-line utility, the session creates a 4KiB
+file `output.raw` containing only zeros to serve as the output drive
+image. Then, it creates the `input.raw` file for use as the input drive
+image containing the expression `6*2^1024 + 3*2^512\n` to be evaluated.
+This file is then padded with zeros to 4KiB in size by the `truncate`
+utility. The session then invokes the `cartesi-machine` command-line
+utility to evaluate the expression. The output of the `cartesi-machine`
+command is
+
+``` text
+
+Halted
+Cycles: 62993917
+```
+
+Once the emulator returns, a tiny Lua script, run by the `lua5.4` Lua
+interpreter, prints the contents of the output drive
+
+``` bash
+lua5.4 -e 'print((string.unpack("z", io.read("a"))))' < output.raw
+```
+
+which reads
+
+``` text
+10786158809173895446375831144734148401707861873653839436405804869463\
+96054833005778796250863934445216126720683279228360145952738612886499\
+73495708458383684478649003115037698421037988831222501494715481595948\
+96901677837132352593468675094844090688678579236903861342030923488978\
+36036892526733668721977278692363075584
+```
+
+This is indeed the result of 6×2<sup>1024</sup>+3×2<sup>512</sup>.
+
+To create the template, simply omit the input and output image
+filenames. This will cause the Cartesi Machine to assume both drives are
+filled with zeros. Then, limit the computation with `--max-mcycle=0`, to
+prevent the Cartesi Machine from running. Finally, use the
+`--store="calculator-template"` command-line option to store the Cartesi
+Machine template. The `--final-hash` command-line option prints the
+resulting template hash.
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --nvram="label:input,length:1<<12" \
+    --nvram="label:output,length:1<<12,user:dapp" \
+    --max-mcycle=0 \
+    --final-hash \
+    --store="calculator-template" \
+    -- $'readmmap input | lua5.4 -e \'print((string.unpack("z", io.read("a"))))\' | bc | writemmap output'
+```
+
+The result is as follows
+
+``` text
+0: 882c28a0ed7ec54dc58b7d12c82cc7d218eeda536d1b1241b5a6d15938084d9e
+Storing machine: please wait
+```
+
+The directory `calculator-template/` now contains the Cartesi Machine
+template. And indeed, running
+
+``` bash
+cartesi-machine-stored-hash calculator-template/
+```
+
+we can see from the output
+
+``` text
+882c28a0ed7ec54dc58b7d12c82cc7d218eeda536d1b1241b5a6d15938084d9e
+```
+
+that the stored template hash is `882c28a0…`.
+
+Templates are typically used by programs that control the emulator with
+the C++, Lua, or JSON-RPC interfaces.
+
+The `--replace-memory-range=label:<label>,data_filename:<filename>`
+command-line option of the `cartesi-machine` utility can be used to
+replace an existing memory range right after a machine is loaded. The
+memory range can be identified by `label`, by `start` and `length`, or
+both.
+
+This functionality can be used to test templates. For example, the
+following command loads the calculator template, and replaces its
+pristine input NVRAM with one containing the contents of the `input.raw`
+file. Then, it replaces the pristine output NVRAM so the machine saves
+results in the file `output.raw`.
+
+``` bash
+rm -f output.raw
+truncate -s 4K output.raw
+echo "6*2^1024 + 3*2^512" > input.raw
+truncate -s 4K input.raw
+cartesi-machine \
+    --no-init-splash \
+    --load="calculator-template" \
+    --replace-memory-range="label:input,data_filename:input.raw" \
+    --replace-memory-range="label:output,data_filename:output.raw,shared"
+lua5.4 -e 'print((string.unpack("z", io.read("a"))))' < output.raw
+```
+
+The result of running the command is, as expected,
+
+``` text
+10786158809173895446375831144734148401707861873653839436405804869463\
+96054833005778796250863934445216126720683279228360145952738612886499\
+73495708458383684478649003115037698421037988831222501494715481595948\
+96901677837132352593468675094844090688678579236903861342030923488978\
+36036892526733668721977278692363075584
+```
+
+### State value proofs
+
+*State value proofs* are proofs that a given node in the Merkle tree of
+the Cartesi Machine state has a given associated hash. Each Merkle tree
+node covers a contiguous range of the machine’s 64-bit address space.
+The size of a range is always a power of 2 (i.e., the `<log2_size>`
+power of 2). Since the leaves have size `32` bytes, the valid values for
+`<log2_size>` are `5`…`64`. The range corresponding to each node starts
+at an `<address>` that is a multiple of its size.
+
+The `cartesi-machine` command-line utility can generate proofs
+concerning the contents of the machine state. To generate a proof
+concerning the state as it is before the machine starts running, use the
+command-line option
+`--initial-proof=address:<number>,log2_size:<number>[,filename:<filename>]`
+or `--initial-proof=label:<label>[,filename:<filename>]`. The label form
+of the option searches for a flash drive or NVRAM with that label, from
+which it automatically obtains the corresponding `address` and
+`log2_size`. For proofs concerning the state after the emulator is done,
+use `--final-proof` instead. The proofs are output as Lua tables that
+can be loaded with the `require` function. To output JSON objects
+instead, add the `format:json` sub-key, as in
+`--initial-proof=label:<label>,filename:<filename>,format:json`. When
+`format:` is omitted, the format is inferred from the filename extension
+(`.json` or `.lua`), defaulting to Lua. In either case, the filename
+field is optional. When provided, the proof will be written to the
+corresponding file. Otherwise, the contents will be displayed on screen.
+
+For example, to generate a proof that the Cartesi Machine template above
+indeed contains a pristine input drive, use the command line
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --load="calculator-template" \
+    --max-mcycle=0 \
+    --initial-hash \
+    --initial-proof="label:input,filename:pristine-input-proof.lua"
+```
+
+The output of the command is
+
+``` text
+Loading machine: please wait
+0: 882c28a0ed7ec54dc58b7d12c82cc7d218eeda536d1b1241b5a6d15938084d9e
+```
+
+In addition, the `pristine-input-proof.lua` file now contains a Lua
+table with the requested proof. The value of field `root_hash` is the
+expected initial state hash `0x882c28…` seen in the output of the
+`cartesi-machine` command. The `target_address` value `0xa0000000` is
+the start of the input NVRAM. The `log2_target_size` value `12` refers
+to the size of the 4KiB input NVRAM. The `target_hash` value `0x292c23…`
+in the proof gives the hash of the input NVRAM.
+
+The hash of the input NVRAM can also be computed externally with the
+`cartesi-hash-tree-hash` command-line utility. The utility can produce
+the hash of any file with a power-of-2 size. The
+`--log2-root-size=<log2_size>` option specifies the size. If an input
+file is smaller than the specified size, the utility assumes the missing
+data is composed entirely of bytes 0. The utility deals efficiently with
+zero paddings of any size because pristine hashes for all power-of-2
+sizes can be precomputed. For example, to quickly generate the hash for
+a pristine input with 4KiB size, run
+
+``` bash
+head -c 0 | cartesi-hash-tree-hash --log2-root-size=12
+```
+
+to obtain
+
+``` text
+292c23a9aa1d8bea7e2435e555a4a60e379a5a35f3f452bae60121073fb6eead
+```
+
+As expected, the hash values match.
+
+The `sibling_hashes` array contains the hashes of the siblings to all
+nodes in the path from the root all the way down to the target node
+(excluding the root, which has no sibling). In a process explained in
+the [blockchain perspective](#hash-view-of-state), using the
+`target_address` field, the `target_hash` hash, and the `sibling_hashes`
+array, it is possible to go up the tree computing the hashes along the
+path, until
+the root hash is produced. If the root hash obtained by this process
+matches the expected root hash, the proof is valid. Otherwise, something
+is amiss.
+
+To compute the hash for the desired `input.raw` file with contents
+`6*2^1024 + 3*2^512\n`, padded with zeros, run
+
+``` bash
+echo "6*2^1024 + 3*2^512" | cartesi-hash-tree-hash --log2-root-size=12
+```
+
+to obtain
+
+``` text
+d5ea32c164644e70ea918e4d868458bcbf038c764f551c5b0baa2dd8ac26fbea
+```
+
+The initial state hash for the instantiated template can be seen with
+the `cartesi-machine` command-line utility
+
+``` bash
+echo "6*2^1024 + 3*2^512" > input.raw
+truncate -s 4K input.raw
+cartesi-machine \
+    --no-init-splash \
+    --load="calculator-template" \
+    --replace-memory-range="label:input,data_filename:input.raw" \
+    --initial-hash \
+    --initial-proof="label:input,filename:input-proof.lua" \
+    --max-mcycle=0
+```
+
+This produces the output
+
+``` text
+Loading machine: please wait
+0: 60246ea0f5082b651bf85aeb41b9c276a030708c2c151c91ff4bc40ec8f351f5
+```
+
+In addition, the `input-proof.lua` file now contains a Lua table with
+the requested proof, which is produced after the input NVRAM has been
+replaced. The `target_hash` value `0xd5ea32…` reflects the hash computed
+for the input. The `root_hash` value `0x60246e…` differs from
+`882c28a0…` obtained for the template, as expected, and matches the
+initial hash printed by the utility. Moreover, the `sibling_hashes`
+entries in the template Cartesi Machine and in the instantiated Cartesi
+Machine remain the same, reflecting the fact that there were no other
+changes in the machine’s initial state.
+
+Using a process similar to the proof verification described above, it is
+possible to go up the Merkle tree for the template using the
+`sibling_hashes` array in the proof, but starting from the hash
+`d5ea32c1…` of the desired `input.raw` image rather than hash
+`292c23a9…` of the template’s pristine NVRAM. The result would be the
+same root hash as that of the instantiated template.
+
+Another useful proof is the one for the *output* drive, once the machine
+is halted. To obtain this proof, run
+
+``` bash
+truncate -s 4K output.raw
+echo "6*2^1024 + 3*2^512" > input.raw
+truncate -s 4K input.raw
+cartesi-machine \
+    --no-init-splash \
+    --load="calculator-template" \
+    --replace-memory-range="label:input,data_filename:input.raw" \
+    --replace-memory-range="label:output,data_filename:output.raw,shared" \
+    --final-hash \
+    --final-proof="label:output,filename:output-proof.lua"
+```
+
+This produces the output
+
+``` text
+Loading machine: please wait
+
+Halted
+Cycles: 62993917
+62993917: a7fdb74dcc67232f5b64b3b245972a6b30e6fde1f11c5a11ae16dec44bcc79ae
+```
+
+The `root_hash` field in the proof `0xa7fdb7…` matches the final state
+hash output by the `cartesi-machine` command-line utility. The
+`target_hash` field `0x1beb37…` is the hash of the `output.raw` NVRAM.
+To compute it independently, use the `cartesi-hash-tree-hash`
+command-line utility
+
+``` bash
+cartesi-hash-tree-hash --log2-root-size=12 < output.raw
+```
+
+``` text
+1beb375bfd349ab9612a7a969f05c4f104d85471e5ec5754d96ceb5b9083ce1e
+```
+
+The `cartesi-machine` command-line utility accepts an arbitrary number
+of `--initial-proof` and `--final-proof` parameters. They are computed
+one-by-one, and either printed or stored in the specified files, as
+requested.
+
+To read more about proofs, refer to [the blockchain
+perspective](#hash-view-of-state).
+
+### Remote Cartesi Machines
+
+The `cartesi-machine` command-line utility, as used until now, has
+always instantiated its own local Cartesi Machine. However, it can also
+be used to control a remote Cartesi Machine. Remote Cartesi Machines are
+managed by the `cartesi-jsonrpc-machine` server. The server exposes a
+JSON-RPC interface through which the `cartesi-machine` command-line
+utility (or any other software) can control the machine remotely.
+
+To avoid confusion, it is best to run the server and client in separate
+shells in the playground container. Leaving the existing shell for the
+client, open a separate shell for the server (for example, by running
+`docker exec -it playground /bin/bash`), then run
+
+``` bash
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8080
+```
+
+The `--server-address=<address>` command-line option specifies the
+address and port the server will listen on.
+
+> [!NOTE]
+>
+> In this case, since we selected `127.0.0.1:8080`, the client must run
+> in the same container in order to communicate with the server. To be
+> accessible from outside the container, the `--server-address` option
+> would have to refer to an address and port that were *exposed* by the
+> container.
+
+To instruct the `cartesi-machine` command-line utility to connect with
+the server, add the command-line option `--remote-address=<address>` to
+specify the remote server to connect to. The option `--remote-shutdown`
+causes the server to be shut down by the client when the client exits.
+(Otherwise, the server will remain available for the next client.) The
+option `--remote-health-check` causes the client to connect to the
+server, confirm it is responsive, and exit without instantiating a
+machine. All other options work as before. Keep in mind that any image
+files referred to by an option passed to the command-line utility
+`cartesi-machine` must be accessible to the `cartesi-jsonrpc-machine`
+server (and not necessarily to the client). Additionally, terminal
+output for the Cartesi Machine instantiated by the server will appear in
+the remote shell where the server was run (not the client’s shell).
+Terminal input, when enabled, must also happen via the remote shell.
+
+With this in mind, running the command in the client shell
+
+``` bash
+while ! cartesi-machine \
+    --remote-address=127.0.0.1:8080 \
+    --remote-health-check 2>/dev/null; do sleep 1; done
+cartesi-machine \
+    --remote-address=127.0.0.1:8080 \
+    --remote-shutdown
+```
+
+produces the following output on the client shell
+
+``` text
+Connected to JSONRPC remote cartesi machine at '127.0.0.1:8080'
+
+Halted
+Cycles: 41860482
+Shutdown JSONRPC remote cartesi machine at '127.0.0.1:8080'
+```
+
+and the following output on the server shell
+
+``` text
+
+         .
+        / \
+      /    \
+\---/---\  /----\
+ \       X       \
+  \----/  \---/---\
+       \    / CARTESI
+        \ /   MACHINE
+         '
+
+Nothing to do.
+```
+
+The client first connects to the remote address and prints the
+connection status. It then asks the server to instantiate a machine (by
+sending the configuration over) and run it. The machine that runs in the
+server prints out the splash screen, boots Linux, and cedes control to
+the Cartesi-provided `/usr/sbin/cartesi-init` script. The
+`/usr/sbin/cartesi-init` script figures out there is nothing to do and
+halts the machine. The client detects the machine is halted and shuts
+down the server, as requested, printing the final message.
+
+When it is desirable to leave the server running and preserve the
+instantiated machine, omit the `--remote-shutdown` command-line option
+and add the `--no-remote-destroy` option. For example, assuming the
+remote server has just been run:
+
+``` bash
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8081
+```
+
+use the `cartesi-machine` command-line utility to instantiate and run a
+Cartesi Machine for 2^20 cycles:
+
+``` bash
+while ! cartesi-machine \
+    --remote-address=127.0.0.1:8081 \
+    --remote-health-check 2>/dev/null; do sleep 1; done
+cartesi-machine \
+    --remote-address=127.0.0.1:8081 \
+    --no-remote-destroy \
+    --max-mcycle=1Mi \
+    -- echo "Still here!"
+```
+
+The client shell shows:
+
+``` text
+Connected to JSONRPC remote cartesi machine at '127.0.0.1:8081'
+Left alive JSONRPC remote cartesi machine at '127.0.0.1:8081'
+```
+
+To continue execution of the same Cartesi Machine until it halts, rather
+than instantiating a new one, use the `cartesi-machine` command-line
+utility with the option `--no-remote-create`:
+
+``` bash
+cartesi-machine \
+    --remote-address=127.0.0.1:8081 \
+    --remote-shutdown \
+    --no-remote-create
+```
+
+The client shell now shows:
+
+``` text
+Connected to JSONRPC remote cartesi machine at '127.0.0.1:8081'
+
+Halted
+Cycles: 50414034
+Shutdown JSONRPC remote cartesi machine at '127.0.0.1:8081'
+```
+
+The server shell shows the execution of both sessions:
+
+``` text
+
+         .
+        / \
+      /    \
+\---/---\  /----\
+ \       X       \
+  \----/  \---/---\
+       \    / CARTESI
+        \ /   MACHINE
+         '
+
+Still here!
+```
+
+Remote Cartesi Machines have one ability that local Cartesi Machines
+lack: they can be *forked*, producing a copy that runs forward
+independently in a child server while the original is preserved in the
+parent. Inspect-state requests and rejected advance-state requests
+require that changes to the state of the Rolling Cartesi Machine be
+reverted. One way to implement this is for the host to run the inspect
+or advance against a fork, then discard it.
+
+### Rolling Cartesi Machines
+
+Applications involving Rolling Cartesi Machines are not designed to
+interact with the `cartesi-machine` command-line utility. Instead, they
+rely on a variety of software components that allow a front-end to post
+to the blockchain requests to advance the state of the server. The
+Cartesi Node polls the blockchain for advance-state requests posted by
+others so a local copy of the server can be kept in sync. It also allows
+a front-end to inspect the state of the server.
+
+Nevertheless, in debugging or prototyping tasks, the `cartesi-machine`
+command-line utility can simulate the external environment that a guest
+application (running inside a Rolling Cartesi Machine) would encounter
+in production. To use this functionality, the developer creates a
+sequence of advance-state requests as numbered files, or a single
+inspect-state request as a file, and instructs the `cartesi-machine`
+command-line utility to feed them to the guest application. As each
+request is processed, the utility stores the responses as separate
+files.
+
+An advance-state request is a single ABI-encoded
+`EvmAdvance(uint256 chainId, address appContract, address msgSender, uint256 blockNumber, uint256 blockTimestamp, uint256 prevRandao, uint256 index, bytes payload)`
+calldata blob carrying the fields important for the operation of Cartesi
+Rollups. Recall that, as responses, the guest application can issue
+*vouchers*, *notices*, *reports*, and *exceptions*. In contrast, an
+inspect-state request carries only a *query* and, as response, produces
+only reports and exceptions. The query in an inspect-state request
+consists of an application-specific payload.
+
+Guest applications running inside Rolling Cartesi Machines do not access
+the network or the file-system directly. They communicate with the host
+through a Cartesi-specific mechanism, detailed under [Communication
+between guest and host](#communication-between-guest-and-host) in the
+guest perspective.
+
+In a nutshell, the process is as follows. To obtain the next request,
+the guest application *yields* control back to the host (in our case,
+the `cartesi-machine` command-line utility). The host writes the next
+request where the guest can read it and resumes the machine, so the
+guest application can process it. When the guest application emits an
+output (a voucher, notice, report, or exception), it again yields
+control to the host so it can collect the output (in our case, saving it
+to a file or printing it to the terminal) before resuming the machine.
+
+To help debug applications, developers can obtain from Cartesi
+Rollups, as files, the inputs associated with each advance-state
+request, so the sequence can be replayed locally in the command line.
+When prototyping, developers can create their own files simulating
+requests that test the behavior of their guest application under
+customized conditions.
+
+#### Encoding requests
+
+The `cartesi-rollup-data.lua` command-line utility, available in the
+`cartesi/machine-emulator-docs` Docker image, can encode advance-state
+requests and inspect-state queries to files, and decode vouchers,
+notices, reports, exceptions, and delegate-call vouchers from files. The
+calculator we will run treats the payload of each advance-state request
+as an arbitrary-precision arithmetic expression and emits the result as
+a notice. The following commands encode six such requests as
+`input-1.bin` through `input-6.bin`, sharing their common structure
+through a small `encode_input` shell function, and one inspect-state
+query as `query.bin`:
+
+``` bash
+encode_input() {
+  cartesi-rollup-data.lua encode advance <<EOF
+{
+  "chain_id": 0,
+  "app_contract": "0x0000000000000000000000000000000000000000",
+  "msg_sender": "$(printf '0x%040d' "$1")",
+  "block_number": 0,
+  "block_timestamp": 0,
+  "prev_randao": "0x0000000000000000000000000000000000000000000000000000000000000000",
+  "index": $1,
+  "payload": "$(printf '%s\n' "$2" | hex --encode)"
+}
+EOF
+}
+encode_input 1 '6*2^1024 + 3*2^512' > input-1.bin
+encode_input 2 'invalid input' > input-2.bin
+encode_input 3 '2^2048' > input-3.bin
+encode_input 4 '(2^256 - 1) * (2^256 - 1)' > input-4.bin
+encode_input 5 'scale=80; sqrt(2)' > input-5.bin
+encode_input 6 'scale=100; 355/113' > input-6.bin
+cartesi-rollup-data.lua encode inspect > query.bin <<EOF
+{
+  "payload": "$(printf 'scale=70; (1+sqrt(5))/2\n' | hex --encode)"
+}
+EOF
+```
+
+Listing the files created with `ls *.bin`, we see
+
+``` text
+input-1.bin
+input-2.bin
+input-3.bin
+input-4.bin
+input-5.bin
+input-6.bin
+query.bin
+```
+
+The six numbered files are advance-state requests, and `query.bin` is an
+inspect-state query.
+
+#### A simple calculator guest application
+
+We will run an arbitrary-precision arithmetic expression evaluator that
+outputs, as notices, the result of the computation it receives as the
+payload of each advance-state request. We will rely on the `bc`
+command-line utility to perform the computations. To interact with the
+`/dev/cmio` Linux device (i.e., to obtain the advance-state request
+inputs and to generate the notices), we will use the `/usr/bin/rollup`
+command-line utility.
+
+The `rollup` command-line utility supports the commands `accept`,
+`reject`, `voucher`, `notice`, `report`, and `exception`. It uses JSON
+objects as inputs and outputs. The `accept` and `reject` commands accept
+or reject the previous request and output the next request. For
+advance-state requests, the output is in the format
+
+``` js
+{
+  "request_type": "advance_state",
+  "data": {
+    "chain_id": <number>,
+    "app_contract": <address>,
+    "msg_sender": <address>,
+    "block_number": <number>,
+    "block_timestamp": <number>,
+    "prev_randao": <hex-uint256>,
+    "index": <number>,
+    "payload": <hex-data>
+  }
+}
+```
+
+Appropriately, the `notice` command generates a notice. The input format
+is as follows
+
+``` js
+{
+  "payload": <hex-data>
+}
+```
+
+and the output gives the index of the just-output notice as follows
+
+``` js
+{
+  "index": <number>
+}
+```
+
+The `report` command takes the same input format as `notice`. However,
+since reports are not verifiable, there is no associated index to print
+out.
+
+Shell scripts become surprisingly powerful with the help of the
+`rollup`, `hex`, and `jq` command-line utilities. A `bc`-based arbitrary
+precision application, for example, might look like this:
+
+``` bash
+#!/bin/bash
+set -o pipefail
+
+declare -A emit=([advance_state]=notice [inspect_state]=report)
+reqfile=$(mktemp /tmp/calc.XXXXXX)
+status="accept"
+while :
+do
+  rollup $status > "$reqfile"
+  request_type=$(jq -j .request_type < "$reqfile")
+  status="reject"
+  jq -j '.data.payload' < "$reqfile" | \
+    hex --decode | \
+      bc | \
+        grep . | \
+          tr -d '\\\n' | \
+            hex --encode | \
+              jq -R '{ payload: . }' | \
+                rollup "${emit[$request_type]}" > /dev/null && \
+                  status="accept"
+done
+rm "$reqfile"
+```
+
+The loop in the `calc.sh` script calls `rollup accept` or
+`rollup reject` (shortcuts for `rollup finish`) to accept or reject the
+previous request and obtain the next one. It uses `jq` to read the
+`request_type` field, which selects the output verb: an advance-state
+request emits the result as a notice, and an inspect-state request emits
+it as a report. Both kinds of request carry the expression at
+`.data.payload`, which `jq` extracts. The hex-encoded payload is decoded
+back to bytes by `hex --decode` and passed to `bc`, which outputs the
+result split into lines terminated by `\`. Unfortunately, `bc` does not
+exit with an error when it detects one. Instead, it prints a message to
+the error stream and exits successfully. The `grep .` exits with an
+error in that case, because the output stream of `bc` will be empty.
+Otherwise, `grep .` simply passes the output through unchanged. In that
+case, the `tr` utility joins the lines back together. The joined result
+is hex-encoded by `hex --encode` and fed to `jq`, which assembles the
+proper JSON object with a `"payload"` field that is passed to
+`rollup notice` or `rollup report`, the verb chosen by the request type.
+
+To run `calc.sh`, first create a file-system with the program:
+
+``` bash
+mkdir calc
+cp calc.sh calc
+chmod +x calc/calc.sh
+tar \
+    --sort=name \
+    --mtime="2022-01-01" \
+    --owner=1000 \
+    --group=1000 \
+    --numeric-owner \
+    -cf calc.tar \
+    --directory=calc .
+xgenext2fs \
+    -fzB 4096 \
+    -i 4096 \
+    -a calc.tar \
+    calc.ext2
+```
+
+Running a Rolling Cartesi Machine in the command line requires using the
+`cartesi-jsonrpc-machine` server in combination with the
+`cartesi-machine` client. The server provides the fork functionality the
+client uses to roll the machine state back when an advance-state
+request is rejected, or after an inspect-state request.
+With the encoded inputs and `calc.ext2` in the working directory, run
+the remote server with the command
+
+``` bash
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8082
+```
+
+We will run the inputs in two separate epochs against this server, kept
+alive between runs. From a different shell into the same container, run
+the client to process the first epoch
+
+``` bash
+while ! cartesi-machine \
+    --remote-address=127.0.0.1:8082 \
+    --remote-health-check 2>/dev/null; do sleep 1; done
+cartesi-machine \
+    --no-init-splash \
+    --remote-address=127.0.0.1:8082 \
+    --no-remote-destroy \
+    --flash-drive=label:calc,data_filename:calc.ext2,user:dapp \
+    --cmio-advance-state=input_index_begin:1,input_index_end:4,hashes \
+    --final-hash=epoch-1-state-hash.bin \
+    -- /mnt/calc/calc.sh
+```
+
+This run instantiates the machine from the `calc.ext2` flash drive and
+advances inputs 1 to 3. Passing `--no-remote-destroy` and omitting
+`--remote-shutdown` leaves both the server and the machine it holds
+alive for the next epoch.
+
+The client shell shows
+
+``` text
+Connected to JSONRPC remote cartesi machine at '127.0.0.1:8082'
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 65021670
+
+Before input 1
+65021670: f40b532cb800b1ca70942a156555257aedb6a18a29d9ba835b005395c2d89bed
+65021670: c9ba6e6287903ded8a9d37fc9cae3de1ded01e98441e9c66908009e131bb3ad4
+
+Automatic yield tx-output (2) (0x000184 data)
+Cycles: 110210177
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 117115963
+Storing output-0-input-1.bin
+Storing input-1-output-hashes-root-hash.bin
+Storing input-1-output-hashes-root-hash-proof.lua
+
+Before input 2
+117115963: cc1e65210ef20e6ec3261e726c47556850a811a508d8d5c48768e347ead68b36
+117115963: d3277d37176d813a454579f91b6c062ac79a025e89dcfa4c48580960f5ce7778
+
+Automatic yield tx-output (2) (0x000044 data)
+Cycles: 159574065
+
+Manual yield rx-rejected (2) (0x000000 data)
+Cycles: 164228493
+Storing rejected-output-1-input-2.bin
+
+Before input 3
+117115963: cc1e65210ef20e6ec3261e726c47556850a811a508d8d5c48768e347ead68b36
+117115963: eb4fbed094aba57cc7a62ec74973641e764e50b1bf9045c4e1bb308ccf0e6d21
+
+Automatic yield tx-output (2) (0x0002c4 data)
+Cycles: 161573955
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 168348264
+Storing output-1-input-3.bin
+Storing input-3-output-hashes-root-hash.bin
+Storing input-3-output-hashes-root-hash-proof.lua
+Storing output-0-input-1-proof.lua
+Storing output-1-input-3-proof.lua
+Left alive JSONRPC remote cartesi machine at '127.0.0.1:8082'
+```
+
+The client starts by printing information about the remote server it
+connected to. It then runs the machine in a loop, occasionally
+transferring information in and out. The first
+`manual yield rx-accepted`, at cycle `65021670`, is the point at which
+the calculator attempted to obtain its first request.
+
+Upon receiving control back, the client prints input index 1 and the
+state hash `f40b532c…`. It loads `input-1.bin` as the next request,
+prints the modified state hash `c9ba6e62…`, and resumes the machine. The
+calculator evaluates `6*2^1024 + 3*2^512` and emits the result as a
+notice. That emission is an `automatic yield tx-output` at cycle
+`110210177`, which returns control to the client. The client collects
+the emitted output and stores it as `output-0-input-1.bin`. The
+`manual yield rx-accepted` at cycle `117115963` signals that input index
+1 was accepted. At this point the client also stores the output hashes
+root hash the guest reported, as `input-1-output-hashes-root-hash.bin`,
+and double-checks it against its own local computation of the same hash.
+This hash commits to every output the machine has emitted so far.
+
+The client then loads input index 2 and resumes the machine. The payload
+`invalid input` is not an expression that `bc` understands, so the
+calculator rejects the request. An empty notice is still emitted just
+before the rejection. Shell pipelines run concurrently, so
+`rollup notice` has already run by the time `bc`’s failure is detected.
+Rejection discards all outputs, such as this notice. For debugging
+purposes, the client saves the notice contents as
+`rejected-output-1-input-2.bin`. The resulting
+`manual yield rx-rejected` at cycle `164228493` rolls the machine state
+back to what it was before the input was processed. The state hash
+before input 3, `cc1e6521…`, is identical to the hash after input 1 was
+accepted, which confirms the rejected input left no trace.
+
+Input index 3, with payload `2^2048`, is accepted like the first, so the
+client stores `output-1-input-3.bin` and
+`input-3-output-hashes-root-hash.bin`. On each accept the client also
+writes the proof that the output hashes root hash occupied the machine’s
+CMIO tx buffer, as `input-1-output-hashes-root-hash-proof.lua` and
+`input-3-output-hashes-root-hash-proof.lua`. The two output proofs for
+this epoch, `output-0-input-1-proof.lua` and
+`output-1-input-3-proof.lua`, are written at the end, once all of the
+epoch’s outputs are known. Each proves that one of the epoch’s outputs
+belongs to the tree the final output hashes root hash commits to. The
+`--final-hash` option saves the machine state hash at the end of the
+epoch, as `epoch-1-state-hash.bin`, the state a dispute over this epoch
+would settle on.
+
+Now run the client to process the second epoch in the same server
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --remote-address=127.0.0.1:8082 \
+    --no-remote-create \
+    --remote-shutdown \
+    --cmio-advance-state=input_index_begin:4,input_index_end:7,last_output_proof:output-1-input-3-proof.lua,hashes \
+    --cmio-inspect-state=query:query.bin,hashes
+```
+
+The command-line option `--no-remote-create` reuses the machine where
+the first epoch left off. The output hashes tree inside the machine
+keeps growing across the epoch boundary on its own. The
+`last_output_proof:output-1-input-3-proof.lua` option is there for the
+`cartesi-machine` command-line utility alone, which uses the first
+epoch’s last output proof to rebuild its own copy of the output hashes
+tree as it stood at the end of that epoch. With this copy, the output
+hashes root hash `cartesi-machine` computes for each accepted input
+matches the one produced inside the emulator, which is what the default
+`check_output_hashes_root_hash` verifies. The copy also lets
+`cartesi-machine` emit correct proofs, at the right global output
+indices, for the outputs it collects during this epoch. The three inputs
+evaluate `(2^256 - 1) * (2^256 - 1)`, `sqrt(2)` to 80 decimal places,
+and `355/113` to 100 decimal places. Arbitrary-precision results like
+these are awkward to compute on the blockchain, whose native arithmetic
+works on fixed-width 256-bit integers and has no fractions. Their
+outputs continue the global output index, becoming outputs 2, 3, and 4.
+The run passes `--remote-shutdown` to stop the server once the epoch is
+done.
+
+The client shell now shows
+
+``` text
+Connected to JSONRPC remote cartesi machine at '127.0.0.1:8082'
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 168348264
+
+Before input 4
+168348264: 3eaec139ee67c9e1e7b2ce72c9ef695c1937d737fcec04810b2bb7acd8bf9144
+168348264: 797a3fb86a58af26a75f63f3fd1ff75c4792488daf1baa6a9a99b6faf15d9993
+
+Automatic yield tx-output (2) (0x0000e4 data)
+Cycles: 211152478
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 217833232
+Storing output-2-input-4.bin
+Storing input-4-output-hashes-root-hash.bin
+Storing input-4-output-hashes-root-hash-proof.lua
+
+Before input 5
+217833232: a68c74bc16ff6e00d256eb11022412d26ca789a659a8cc12db64c517836c7f1c
+217833232: 97177926d0977e2e243aab26d20e25d241daf18d1b983b490759bfc62770565b
+
+Automatic yield tx-output (2) (0x0000a4 data)
+Cycles: 260790937
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 267595780
+Storing output-3-input-5.bin
+Storing input-5-output-hashes-root-hash.bin
+Storing input-5-output-hashes-root-hash-proof.lua
+
+Before input 6
+267595780: e97d3ce5156c6c16c0cd49a6b8f62f3ce87051688c0f57c1ec9512b1a2833818
+267595780: d8f35a7c5b1e4c1ad7b83f5cfb2403162c145210c7b5a9c2b09ee838102163fc
+
+Automatic yield tx-output (2) (0x0000c4 data)
+Cycles: 310194028
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 316884774
+Storing output-4-input-6.bin
+Storing input-6-output-hashes-root-hash.bin
+Storing input-6-output-hashes-root-hash-proof.lua
+Storing output-2-input-4-proof.lua
+Storing output-3-input-5-proof.lua
+Storing output-4-input-6-proof.lua
+
+Before query
+316884774: 02335a2d2b09587e726a3e8896714d292edbda6a791943dbf4185c409869dc3e
+316884774: 55988c3c3e496603daf47858245803eaeb6c82f934de83f57cf0f58c8b6d6f4d
+
+Automatic yield tx-report (4) (0x000048 data)
+Cycles: 359653822
+Storing query-report-0.bin
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 366329171
+
+After query
+Shutdown JSONRPC remote cartesi machine at '127.0.0.1:8082'
+```
+
+After the second epoch’s advances, the same run sends the inspect-state
+query from `query.bin`. The calculator evaluates
+`scale=70; (1+sqrt(5))/2`, the golden ratio, and returns it as a report
+rather than a notice. An inspect-state request cannot emit verifiable
+outputs such as notices or vouchers, because any change its processing
+makes to the machine state is reverted afterward. The client saves the
+report as `query-report-0.bin`.
+
+The hash operations behind the output proofs are explained later, under
+[The output hashes tree](#the-output-hashes-tree) in the blockchain
+perspective.
+
+The server shell shows only the error message output by `bc` and
+`rollup`. In production, these error messages should be captured and
+output as a report, rather than being allowed to leak into the
+console.
+
+``` text
+(standard_in) 1: syntax error
+```
+
+#### Decoding responses
+
+The `cartesi-rollup-data.lua` command-line utility can also decode the
+binary records produced by the guest application.
+
+For example, to see the value of `sqrt(2)` computed in the second epoch,
+decode its notice with the command
+
+``` bash
+cartesi-rollup-data.lua decode notice < output-3-input-5.bin | \
+    jq -j .payload | \
+    hex --decode | \
+    fold -w 68
+```
+
+to produce
+
+``` text
+1.414213562373095048801688724209698078569671875376948073176679737990
+73247846210703
+```
+
+This is `sqrt(2)` to 80 decimal places.
+
+The inspect-state report is decoded the same way, with `decode report`
+
+``` bash
+cartesi-rollup-data.lua decode report < query-report-0.bin | \
+    jq -j .payload | \
+    hex --decode | \
+    fold -w 68
+```
+
+to produce
+
+``` text
+1.618033988749894848204586834365638117720309179805762862135448622705
+2604
+```
+
+This is the golden ratio to 70 decimal places.
+
+Vouchers, exceptions, and delegate-call vouchers are also supported by
+`cartesi-rollup-data.lua decode`. A voucher carries a *destination*, a
+*value*, and a *payload*. Payloads are 0x-prefixed hex.
+
+### Rolling Cartesi Machine templates
+
+A Rolling Cartesi Machine template is a machine that has been configured
+to support Cartesi Rollups, is running a guest application in a
+request-processing loop, is ready to process the next request, and has
+been stored.
+
+A template is the genesis of a Cartesi Rollups application. Its state
+hash is what a freshly deployed application looks like to the
+blockchain, and the stored template is the artifact distributed to
+anyone who wants to run the application in their own Cartesi Node.
+
+We store the calculator from the previous section as a template with the
+command
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --assert-rolling-template \
+    --flash-drive=label:calc,data_filename:calc.ext2,user:dapp \
+    --store="rolling-calculator-template" \
+    --final-hash \
+    -- /mnt/calc/calc.sh
+```
+
+The `--assert-rolling-template` option makes `cartesi-machine` exit with
+a status-code reporting failure if the generated machine is not a
+Rolling Cartesi Machine template, which helps catch errors. The result
+is as follows
+
+``` text
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 65021670
+65021670: f40b532cb800b1ca70942a156555257aedb6a18a29d9ba835b005395c2d89bed
+Storing machine: please wait
+```
+
+The machine execution stops when the first call to `rollup finish`
+yields, and the machine at that state is stored in directory
+`"rolling-calculator-template"`. The `--final-hash` option prints the
+state hash of the stored machine, the genesis state hash that identifies
+this application to the blockchain.
+
+> [!NOTE]
+>
+> In production, if the guest application finds an irrecoverable error
+> during initialization, it should abort with an exception. In that
+> case, the `cartesi-machine` command-line utility will detect the
+> exception, print it to the console, and exit with a status-code
+> reporting failure.
+
+To run the application, load the template into a server and feed it the
+same inputs. With the encoded inputs and the stored template in the
+working directory, run the remote server with the command
+
+``` bash
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8083
+```
+
+From a different shell into the same container, run the client
+
+``` bash
+while ! cartesi-machine \
+    --remote-address=127.0.0.1:8083 \
+    --remote-health-check 2>/dev/null; do sleep 1; done
+cartesi-machine \
+    --no-init-splash \
+    --remote-address=127.0.0.1:8083 \
+    --remote-shutdown \
+    --cmio-advance-state=input_index_begin:1,input_index_end:7,output_proof:,hashes \
+    --load="rolling-calculator-template"
+```
+
+This loads the machine from the stored template and advances all six
+inputs. Abbreviated, the client shell shows
+
+``` text
+Connected to JSONRPC remote cartesi machine at '127.0.0.1:8083'
+Loading machine: please wait
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 65021670
+
+Before input 1
+65021670: f40b532cb800b1ca70942a156555257aedb6a18a29d9ba835b005395c2d89bed
+65021670: c9ba6e6287903ded8a9d37fc9cae3de1ded01e98441e9c66908009e131bb3ad4
+
+Automatic yield tx-output (2) (0x000184 data)
+Cycles: 110210177
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 117115963
+Storing output-0-input-1.bin
+...
+Cycles: 310194028
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 316884774
+Storing output-4-input-6.bin
+Storing input-6-output-hashes-root-hash.bin
+Storing input-6-output-hashes-root-hash-proof.lua
+Shutdown JSONRPC remote cartesi machine at '127.0.0.1:8083'
+```
+
+The outputs and their hashes are identical to those produced in the
+previous section, because the template captured exactly the same genesis
+state.
+
+### Additional options
+
+> [!WARNING]
+>
+> This is an advanced section, not needed by regular users of the
+> Cartesi platform.
+
+A guest application can inform the host of its progress by using the
+Cartesi-specific `/dev/cmio` Linux device. Within the guest, the device
+can be controlled from the shell with the `/usr/bin/yield` utility,
+pre-installed in the root file-system `rootfs.ext2`. The progress
+feedback is accessed via the `automatic progress <permil>` command-line
+option.
+
+For example, during the execution of the loop,
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    -- $'for i in $(seq 0 5 1000); do yield automatic progress $i; done'
+```
+
+the `cartesi-machine` utility receives control back from the emulator at
+every iteration, when the guest executes the `yield` utility. (The
+directory `/usr/bin/`, where `yield` resides, is in the default `PATH`.)
+
+By default, the emulator honors automatic yield requests from the guest.
+Passing `--no-htif-yield-automatic` makes `cartesi-machine` ignore them,
+but be careful since doing so would *also* prevent Rolling Cartesi
+Machines from generating outputs. Each time `cartesi-machine` receives
+control due to a yield, it prints a progress message (shown at 44%
+below) and resumes the emulator so it can continue working.
+
+``` text
+Progress:  44.00
+```
+
+This feature is most useful when the emulator is controlled
+programmatically, via its Lua, C++, or JSON-RPC interfaces, where
+Cartesi Machines typically run disconnected from the console. In these
+situations, the progress device can be used to drive a dynamic user
+interface element that reassures users progress is being made during
+long, silent computations. Its handling by `cartesi-machine`, which does
+have access to the console, is simply to help with prototyping and
+debugging.
+
+The protocols followed by the `yield` utility to interact with the
+`/dev/cmio` driver and by the driver itself to communicate with the HTIF
+device are explained in detail under the [guest
+perspective](#system-architecture). In particular, the section explains
+the *manual* yield commands needed for proper operation of Cartesi
+Rollups.
+
+The command-line option `--append-bootargs=<string>` can be used to
+append any `<string>` to the kernel command-line. A detailed description
+of all kernel command-line parameters is beyond the scope of this
+document. Please refer to the appropriate [section of the kernel
+documentation](https://www.kernel.org/doc/html/v6.5/admin-guide/kernel-parameters.html).
+
+For example, to prevent clutter in the console, the `cartesi-machine`
+utility automatically adds the `quiet` option to the kernel
+command-line, disabling most log messages. To override this setting and
+see more of the log messages output to console, use the `loglevel=<n>`
+parameter.
+
+``` bash
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    --append-bootargs="loglevel=8"
+```
+
+The output is
+
+``` text
+[    0.000000] OF: reserved mem: 0x0000000080000000..0x000000008007ffff (512 KiB) nomap non-reusable fw_resv@80000000
+[    0.000000] Zone ranges:
+[    0.000000]   DMA32    [mem 0x0000000080000000-0x0000000087ffffff]
+[    0.000000]   Normal   empty
+[    0.000000] Movable zone start for each node
+[    0.000000] Early memory node ranges
+[    0.000000]   node   0: [mem 0x0000000080000000-0x000000008007ffff]
+[    0.000000]   node   0: [mem 0x0000000080080000-0x0000000087ffffff]
+[    0.000000] Initmem setup node 0 [mem 0x0000000080000000-0x0000000087ffffff]
+[    0.000000] riscv: base ISA extensions acdfim
+[    0.000000] riscv: ELF capabilities acdfim
+[    0.000000] pcpu-alloc: s0 r0 d32768 u32768 alloc=1*32768
+[    0.000000] pcpu-alloc: [0] 0 
+[    0.000000] Kernel command line: quiet earlycon=sbi console=hvc0 uio_pdrv_genirq.of_id=generic-uio root=/dev/pmem0 rw init=/usr/sbin/cartesi-init loglevel=8
+[    0.000000] Dentry cache hash table entries: 16384 (order: 5, 131072 bytes, linear)
+[    0.000000] Inode-cache hash table entries: 8192 (order: 4, 65536 bytes, linear)
+[    0.000000] Built 1 zonelists, mobility grouping on.  Total pages: 32256
+[    0.000000] mem auto-init: stack:all(zero), heap alloc:off, heap free:off
+[    0.000000] Memory: 111868K/131072K available (4184K kernel code, 4774K rwdata, 2048K rodata, 2101K init, 342K bss, 19204K reserved, 0K cma-reserved)
+[    0.000000] SLUB: HWalign=64, Order=0-3, MinObjects=0, CPUs=1, Nodes=1
+[    0.000000] NR_IRQS: 64, nr_irqs: 64, preallocated irqs: 0
+[    0.000000] riscv-intc: 64 local interrupts mapped
+[    0.000000] plic: plic@40100000: mapped 31 interrupts with 1 handlers for 2 contexts.
+[    0.000000] clocksource: riscv_clocksource: mask: 0xffffffffffffffff max_cycles: 0x1d854df40, max_idle_ns: 225687143485440 ns
+[    0.000000] sched_clock: 64 bits at 16kHz, resolution 64000ns, wraps every 140737488352000ns
+[    0.000960] Console: colour dummy device 80x25
+[    0.001152] printk: console [hvc0] enabled
+[    0.001152] printk: console [hvc0] enabled
+[    0.001472] printk: bootconsole [sbi0] disabled
+[    0.001472] printk: bootconsole [sbi0] disabled
+[    0.001856] Calibrating delay loop (skipped), value calculated using timer frequency.. 0.03 BogoMIPS (lpj=156)
+[    0.002240] pid_max: default: 32768 minimum: 301
+[    0.002880] Mount-cache hash table entries: 512 (order: 0, 4096 bytes, linear)
+[    0.003136] Mountpoint-cache hash table entries: 512 (order: 0, 4096 bytes, linear)
+[    0.006336] RCU Tasks Trace: Setting shift to 0 and lim to 1 rcu_task_cb_adjust=1.
+[    0.006784] ASID allocator disabled (0 bits)
+[    0.007744] devtmpfs: initialized
+[    0.011392] clocksource: jiffies: mask: 0xffffffff max_cycles: 0xffffffff, max_idle_ns: 19112604462750000 ns
+[    0.011776] futex hash table entries: 256 (order: 0, 6144 bytes, linear)
+[    0.012864] NET: Registered PF_NETLINK/PF_ROUTE protocol family
+[    0.013696] DMA: preallocated 128 KiB GFP_KERNEL pool for atomic allocations
+[    0.014016] DMA: preallocated 128 KiB GFP_KERNEL|GFP_DMA32 pool for atomic allocations
+[    0.019200] HugeTLB: registered 2.00 MiB page size, pre-allocated 0 pages
+[    0.019456] HugeTLB: 0 KiB vmemmap can be freed for a 2.00 MiB page
+[    0.024192] clocksource: Switched to clocksource riscv_clocksource
+[    0.043968] NET: Registered PF_INET protocol family
+[    0.044544] IP idents hash table entries: 2048 (order: 2, 16384 bytes, linear)
+[    0.047936] tcp_listen_portaddr_hash hash table entries: 512 (order: 0, 4096 bytes, linear)
+[    0.048320] Table-perturb hash table entries: 65536 (order: 6, 262144 bytes, linear)
+[    0.048640] TCP established hash table entries: 1024 (order: 1, 8192 bytes, linear)
+[    0.049088] TCP bind hash table entries: 1024 (order: 2, 16384 bytes, linear)
+[    0.049472] TCP: Hash tables configured (established 1024 bind 1024)
+[    0.049856] UDP hash table entries: 256 (order: 1, 8192 bytes, linear)
+[    0.050176] UDP-Lite hash table entries: 256 (order: 1, 8192 bytes, linear)
+[    0.050752] NET: Registered PF_UNIX/PF_LOCAL protocol family
+[    0.051200] kvm [1]: hypervisor extension not available
+[    0.052672] workingset: timestamp_bits=46 max_order=15 bucket_order=0
+[    0.054016] squashfs: version 4.0 (2009/01/31) Phillip Lougher
+[    0.054272] 9p: Installing v9fs 9p2000 file system support
+[    0.059840] tun: Universal TUN/TAP device driver, 1.6
+[    0.062976] nd_pmem namespace0.0: unable to guarantee persistence of writes
+[    0.065344] Cartesi Machine cmio device: Module loaded
+[    0.066880] NET: Registered PF_PACKET protocol family
+[    0.067392] 9pnet: Installing 9P2000 support
+[    0.067968] NET: Registered PF_VSOCK protocol family
+[    0.113344] clk: Disabling unused clocks
+[    0.117440] EXT4-fs (pmem0): mounted filesystem 00000000-0000-0000-0000-000000000000 r/w without journal. Quota mode: disabled.
+[    0.118016] VFS: Mounted root (ext4 filesystem) on device 259:0.
+[    0.119936] devtmpfs: mounted
+[    0.123712] Freeing unused kernel image (initmem) memory: 2100K
+[    0.124032] Run /usr/sbin/cartesi-init as init process
+[    0.124224]   with arguments:
+[    0.124352]     /usr/sbin/cartesi-init
+[    0.124480]   with environment:
+[    0.124608]     HOME=/
+[    0.124736]     TERM=linux
+Nothing to do.
+[    0.232000] EXT4-fs (pmem0): re-mounted 00000000-0000-0000-0000-000000000000 ro. Quota mode: disabled.
+[    0.260736] reboot: Power down
+```
+
+To clear the kernel command-line, use the option `--no-bootargs`. Notice
+that, without any kernel parameters, the machine will not operate properly. In
+particular, as explained under the [Lua interface](#lua-interface),
+flash-drives use kernel command-line arguments. For example, running the
+`cartesi-machine` command-line utility with no arguments produces a
+kernel command-line equivalent to running the command
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --no-bootargs \
+    --append-bootargs="quiet earlycon=sbi console=hvc0 uio_pdrv_genirq.of_id=generic-uio root=/dev/pmem0 rw init=/usr/sbin/cartesi-init"
+```
+
+The command-line option `--periodic-hashes=<period>[,start:<mcycle>]`
+causes the command-line utility to periodically obtain and print the
+state hash. The `<period>` argument gives the distance between hashes in
+cycles. The optional `start:<mcycle>` sub-key gives the starting cycle
+for the periodic hashes. (Both `--initial-hash` and `--final-hash` are
+implied by this option.)
+
+For example, to see the last 10 state hashes from the calculator machine
+computation, run the command
+
+``` bash
+echo "6*2^1024 + 3*2^512" > input.raw
+truncate -s 4K input.raw
+cartesi-machine \
+    --no-init-splash \
+    --load="calculator-template" \
+    --replace-memory-range="label:input,data_filename:input.raw" \
+    --periodic-hashes=1,start:62993907
+```
+
+The output is
+
+``` text
+Loading machine: please wait
+0: 60246ea0f5082b651bf85aeb41b9c276a030708c2c151c91ff4bc40ec8f351f5
+62993907: 6721a1d49cbfcc50368772b3cea57c5dc4ee3d7bf5ce57fa8744379fe0994fc7
+62993908: bca8788daf59e8879a348a0f091cda050b72c8511cfc485f207d6d6c2e55b89a
+62993909: 430dd1653c05242312e66bce73fd069827a5ec257574c6b482ad75ae9de52326
+62993910: 88aa4d1cb98af106093ba94dd935a29bd896935f52f0e65bdc40c3cf25c38869
+62993911: 9181b530647c874f2ea0fe968c558ba6ccd71ad644f02c654db2adb50d3cf99d
+62993912: fb5cae95e623b12a35638fc9f81a59365c457677d815c52456a801a2f18b22bb
+62993913: cae0b7ca22e93b16e7c88a1f23bba35f5a4adaa736662d44f4083a4c014e3296
+62993914: d86c520b5cec298218df680cdbddb901b16ee5dc3d1c4f879d4a3ee350e16f77
+62993915: fbf6c1d19478204042ce6eaf0782bc8cde3dfd3043e2da4280fb69252399e2e9
+62993916: cfd5865bea26a3c73af1f4c0801ac588f0318c5e98103825f9c32346933d4471
+
+Halted
+Cycles: 62993917
+62993917: a7fdb74dcc67232f5b64b3b245972a6b30e6fde1f11c5a11ae16dec44bcc79ae
+```
+
+The command-line option `--dump-memory-ranges[=<dir>]` causes the
+emulator to dump the contents of all memory ranges in the address space
+to files under `<dir>`. If `<dir>` is omitted, files are written to the
+current working directory. Each memory range produces a file
+`<start>--<length>.bin`. Every other byte in the address space has
+value 0. This is useful to inspect the entire state of the machine from
+outside the emulator.
+
+The command-line options `--store-config` and `--load-config` store or
+load a configuration file with information that can be used to initialize the
+exact same Cartesi Machine that the `cartesi-machine` command-line
+utility will use. The format of these configuration files is explained
+in detail under the [Lua interface](#lua-interface) to Cartesi Machines.
+In particular, the `--store-config` option, without arguments, dumps to
+screen all the options used to define the Cartesi Machine. This
+information can be very useful when debugging problems. Both options
+accept a `format:<lua|json>` sub-key to select between Lua and JSON.
+When `format:` is omitted, the format is inferred from the filename
+extension (`.json` or `.lua`), defaulting to Lua.
+
+The remaining options in the command-line utility `cartesi-machine` are
+mostly useful for low-level tests and debugging. As such, they require
+some context.
+
+During verification, the blockchain mediates a *verification game*
+between the disputing parties. This process is explained in detail under
+[the blockchain perspective](#verification-game). In a nutshell,
+both parties started from a Cartesi Machine that has a known and agreed
+upon initial state hash. (E.g., an agreed upon template that was
+instantiated with an agreed upon input drive, or an agreed upon rolling
+template with an agreed upon advance-state input box.) At the end of the
+computation, these parties now disagree on the final state hash. (E.g.,
+the state hash for the halted machine, or the state hash of the yielded
+machine after a number of advance-state inputs have been processed.) The
+state hash evolves as the machine executes steps in its fetch-execute
+loop. The first stage of the verification game therefore searches for
+the *step of disagreement*: the particular main processor cycle such
+that the parties agree on the state hash before the step, but disagree
+on the state hash after the step. When the uarch is in use, every main
+processor instruction can also be implemented by a sequence of
+micro-instructions in the uarch interpreter, and a single uarch step is
+one of those micro-instructions. So the search is refined to find the
+*uarch step of disagreement*: the particular uarch cycle such that the
+parties agree on the state hash before the uarch step, but disagree on
+the state hash after the uarch step. Once this uarch step of
+disagreement is identified, one of the parties sends to the blockchain a
+log of state accesses that happen along the uarch step, including
+Merkle-tree proofs for every value read from or written to the state.
+This log proves to the blockchain that the execution of the uarch step
+transitions the state in such a way that it reaches the state hash
+claimed by the submitting party.
+
+Consider again the example in which the Cartesi Machine was stopped
+while it drew the splash screen. Let’s assume that this is the step of
+disagreement. In an honest Cartesi Machine, the main processor
+instruction about to execute when `mcycle` is `37056250` is the `sd`
+that issues a putchar command to the HTIF console device by writing it
+to the `htif.tohost` CSR. That single main processor instruction expands
+into many uarch instructions. The one that actually triggers the host to
+emit a character is an `ecall` with `a7 = UARCH_ECALL_FN_PUTCHAR` and
+`a0 = 0x0a`. This happens when `uarch_cycle` is `2242`.
+
+In the following command, the `--max-mcycle` and `--max-uarch-cycle`
+options tell `cartesi-machine` to stop just before the putchar `ecall`.
+The `--log-step-uarch` command-line option instructs `cartesi-machine`
+to then dump to screen a user-friendly version of the access log
+produced by a single uarch step:
+
+``` bash
+cartesi-machine \
+    --max-mcycle=37056250 \
+    --max-uarch-cycle=2242 \
+    --log-step-uarch
+```
+
+producing the log
+
+``` text
+Gathering uarch step log: please wait
+begin step
+  1: read uarch.cycle@0x400008(4194312): 0x8c2(2242)
+  2: read uarch.halt_flag@0x400000(4194304): 0x0(0)
+  3: read uarch.pc@0x400010(4194320): 0x600b38(6294328)
+  4: read uarch.ram@0x600b38(6294328): 0x806700000073(141179869986931)
+  begin ecall
+    5: read uarch.x17@0x4000a0(4194464): 0x2(2)
+    6: read uarch.x10@0x400068(4194408): 0xa(10)
+    7: write uarch.pc@0x400010(4194320): 0x600b38(6294328) -> 0x600b3c(6294332)
+  end ecall
+  8: write uarch.cycle@0x400008(4194312): 0x8c2(2242) -> 0x8c3(2243)
+end step
+```
+
+Understanding these logs in detail is unnecessary for all but the most
+low-level internal development at Cartesi. It requires deep knowledge of
+not only RISC-V architecture, but also how Cartesi’s uarch interpreter
+implements the main processor fetch-execute loop. The material is
+therefore beyond the scope of this document.
+
+This particular example, however, was hand-picked for illustration
+purposes. The uarch instruction logged is the `ecall` that asks the host
+to emit one character. At this point, register `a7` (i.e., `uarch_x17`)
+holds the value `2` (`UARCH_ECALL_FN_PUTCHAR`) and register `a0` (i.e.,
+`uarch_x10`) holds the character `0x0a` (a line-feed). When the host
+processes this `ecall`, it emits the line-feed to the console,
+completing the row `\    / CARTESI` in the splash screen.
+
+The command-line options `--cmio-rx-buffer=<key>:<value>...` and
+`--cmio-tx-buffer=<key>:<value>...` configure backing-store options for
+the two memory ranges used by the `/dev/cmio` device. The RX buffer
+occupies `start:0x60000000,length:2<<20` and the TX buffer occupies
+`start:0x60800000,length:2<<20`. Although their addresses and lengths
+are fixed and cannot be overridden, their backing storage can be
+configured. See the [guest perspective](#system-architecture) for
+details on how these buffers are used by Cartesi Rollups, and the
+section on [Rolling Cartesi Machines](#rolling-cartesi-machines) for the
+request/response data flow.
+
+Automatic and manual yields are enabled by default. Disable them with
+`--no-htif-yield-automatic` or `--no-htif-yield-manual` (note that
+disabling automatic yield prevents Rolling Cartesi Machines from
+generating outputs).
+
+## Lua interface
+
+> [!CAUTION]
+>
+> This entire chapter is for advanced users only, since typical users of
+> the Cartesi platform will likely never need to programmatically
+> control a Cartesi Machine.
+
+The Lua interface to Cartesi Machines is available from the `cartesi`
+Lua module. In a properly set-up installation (such as what is available
+in the playground Docker image), the module can be loaded with the
+`require` function:
+
+``` lua
+-- Load the Cartesi module
+local cartesi = require"cartesi"
+```
+
+A Cartesi Machine instance is defined by its *organization* and the
+*contents* of its state. The organization specifies a variety of memory
+ranges (such as RAM, flash drives, NVRAMs, the DTB, and CMIO buffers).
+To support Cartesi Machine’s transparency, all these memory ranges are
+mapped into the machine’s 64-bit physical memory address space. The
+layout defines each entry’s start and length in the address space. The
+DTB and the CMIO buffers have fixed layouts. RAM has a fixed start, but
+its length is user-configurable. For flash drives and NVRAMs, the user
+chooses the start and length of each entry. The contents of the state
+include the values stored in all these memory ranges, in addition to the
+values of all processor registers and device-specific state.
+
+### Instantiation by configuration
+
+Cartesi Machines can be instantiated directly from a configuration
+structure.
+
+<a name="machine_config"></a>
+
+``` lua
+machine_config ::= {
+    processor ::= processor_config,
+
+    ram ::= {
+        backing_store ::= backing_store_config,
+        length ::= number
+    },
+
+    dtb ::= {
+        backing_store ::= backing_store_config,
+        bootargs ::= string,
+        init ::= string,
+        entrypoint ::= string
+    },
+
+    flash_drive ::= {
+        [1] ::= memory_range_config, -- flash drive 0
+        [2] ::= memory_range_config, -- flash drive 1
+        ...
+        [n] ::= memory_range_config
+    },
+
+    nvram ::= {
+        [1] ::= memory_range_config, -- nvram 0
+        [2] ::= memory_range_config, -- nvram 1
+        ...
+        [n] ::= memory_range_config
+    },
+
+    cmio ::= {
+        rx_buffer ::= {
+            backing_store ::= backing_store_config
+        },
+        tx_buffer ::= {
+            backing_store ::= backing_store_config
+        }
+    },
+
+    uarch ::= {
+        processor ::= uarch_processor_config,
+
+        ram ::= {
+            backing_store ::= backing_store_config
+        }
+    },
+
+    pmas ::= {
+        backing_store ::= backing_store_config,
+    },
+
+    hash_tree ::= hash_tree_config,
+
+    virtio ::= virtio_config
+}
+```
+
+<a name="backing_store_config"></a>
+
+``` lua
+backing_store_config ::= {
+    data_filename ::= string,
+    shared ::= boolean,
+    create ::= boolean,
+    truncate ::= boolean,
+    dht_filename ::= string,
+    dpt_filename ::= string
+}
+```
+
+<a name="memory_range_config"></a>
+
+``` lua
+memory_range_config ::= {
+    backing_store ::= backing_store_config,
+    start ::= number,
+    length ::= number,
+    label ::= string,
+    read_only ::= boolean
+}
+```
+
+<a name="processor_config"></a>
+
+``` lua
+processor_config ::= {
+    backing_store ::= backing_store_config,
+
+    registers ::= {
+        x0 ::= number, -- always 0
+        x1 ::= number,
+        ...
+        x31 ::= number,
+        f0 ::= number,
+        ...
+        f31 ::= number,
+        fcsr ::= number,
+        pc ::= number,
+        mvendorid ::= number,
+        marchid ::= number,
+        mimpid ::= number,
+        mcycle ::= number,
+        misa ::= number,
+        mstatus ::= number,
+        mtvec ::= number,
+        mscratch ::= number,
+        mepc ::= number,
+        mcause ::= number,
+        mtval ::= number,
+        mie ::= number,
+        mip ::= number,
+        medeleg ::= number,
+        mideleg ::= number,
+        mcounteren ::= number,
+        menvcfg ::= number,
+        stvec ::= number,
+        sscratch ::= number,
+        sepc ::= number,
+        scause ::= number,
+        stval ::= number,
+        satp ::= number,
+        scounteren ::= number,
+        senvcfg ::= number,
+        icycleinstret ::= number,
+        iflags ::= {
+            H ::= number,
+            X ::= number,
+            Y ::= number
+        },
+        ilrsc ::= number,
+        iprv ::= number,
+        iunrep ::= number,
+        htif ::= {
+            tohost ::= number,
+            fromhost ::= number,
+            ihalt ::= number,
+            iconsole ::= number,
+            iyield ::= number
+        },
+        clint ::= {
+            mtimecmp ::= number
+        },
+        plic ::= {
+            girqpend ::= number,
+            girqsrvd ::= number
+        }
+    },
+}
+```
+
+<a name="uarch_processor_config"></a>
+
+``` lua
+uarch_processor_config ::= {
+    backing_store ::= backing_store_config,
+    registers ::= {
+        halt_flag ::= number,
+        cycle ::= number,
+        pc ::= number,
+        x0 ::= number, -- always 0
+        x1 ::= number,
+        ...
+        x31 ::= number,
+    }
+}
+```
+
+<a name="hash_tree_config"></a>
+
+``` lua
+hash_tree_config ::= {
+    shared ::= boolean,
+    create ::= boolean,
+    sht_filename ::= string,
+    phtc_filename ::= string,
+    phtc_size ::= number,
+    hash_function ::= string
+}
+```
+
+Every memory range in a Cartesi Machine has a corresponding
+<a href="#backing_store_config">`backing_store`</a> entry. This is the
+basis for the implementation of persistent Cartesi Machines. Field
+`backing_store.data_filename` gives the filename of an image on disk in
+the host with the initial contents for that memory range. Since the
+image is mapped, its size on disk must exactly match the length of the
+memory range. When `backing_store.shared` is set to `true` (default is
+`false`), changes made by the guest to the memory range pass through to
+modify the host image file. Otherwise, changes are kept private to the
+guest. When `backing_store.create` is set to `true` (default is
+`false`), the emulator creates the file at `data_filename` at
+instantiation, zero-initialized to the entry’s `length`. In that case,
+`shared` must also be set to `true` (after all, the emulator is
+modifying the image file in the host). When `backing_store.truncate` is
+set to `true` (default is `false`), the emulator resizes an existing
+file at `data_filename` to match the memory range’s length before
+mapping it, padding with zeros if the file is smaller than the
+corresponding memory range. Once again, in that case, `shared` must be
+set to `true`. Fields `backing_store.dht_filename` (for *dense
+hash-tree*) and `backing_store.dpt_filename` (for *dirty-page tree*)
+support the efficient computation of state hashes and proofs. When
+instantiating a machine from scratch, these are normally left empty. In
+fact, for many of the entries in the `machine_config`, the
+`backing_store` field is populated and consumed automatically by the
+emulator when storing and loading persistent machines, i.e., when using
+`cartesi-machine` command-line options `--load=<directory>` and
+`--store=<directory>`, or when using the Lua API methods
+`machine:store(<directory>)` and `machine:load(<directory>)` on which
+they are based. The multiple instances of field `backing_store` will not
+be described individually.
+
+The `ram` entry in `machine_config` describes the main processor RAM.
+Field `length` gives the amount of RAM in bytes (RAM always starts at
+offset `0x80000000`). This length should be a multiple of 4Ki, the
+length of a RISC-V memory page. The `backing_store.data_filename` holds
+the filename of an image that will be loaded at the start of RAM. This
+is where the RAM image `linux.bin` generated by the
+[`machine-linux-image`](https://github.com/cartesi/machine-linux-image)
+repository is typically loaded.
+
+The `flash_drive` entry in `machine_config` is a list of
+<a href="#memory_range_config">`memory_range_config`</a> structures. The
+same is true of the `nvram` entry. In each `memory_range_config`, fields
+`start` and `length` give the start and length of the memory range in
+the machine’s address space. Once again, the length must be a multiple
+of 4Ki. The `start` of a drive must be aligned to its `length` rounded
+up to the next power of 2. No memory range in a Cartesi Machine can
+overlap with any other, considering their rounded-up lengths. If
+`length` is omitted, it defaults to the size of the backing image on
+disk. If `start` is omitted, the range is automatically placed to respect the
+alignment and overlap restrictions. The first flash drive is placed past
+RAM, then each remaining flash drive is placed past the previous. The
+first NVRAM is placed past the last flash drive, and then each remaining
+NVRAM is placed past the previous. Field `label` is a string used by the
+emulator to expose the entry to the guest via DTB aliases. Each flash
+drive is exposed to the guest as a `/dev/pmem*` device, and each NVRAM
+as a `/dev/uio*` device. Field `read_only` is a Boolean (defaults to
+`false`) that makes the corresponding memory range read-only from the
+point of view of the guest. The `backing_store.data_filename` holds the
+filename of an image that will be loaded into the corresponding memory
+range.
+
+The `dtb` entry in `machine_config` describes the memory range that
+holds the device tree for the emulator. Field `entrypoint` is the
+user-mode command that `cartesi-init` runs after setup, by default as
+user `dapp`. This is what the `cartesi-machine` command-line utility
+appends to when arguments are passed after `--`. Field `init` is a shell
+snippet appended to the initialization phase, executed as `root` before
+the entrypoint. This is where the `cartesi-machine` command-line utility
+appends instructions to change ownership and permissions of flash-drives
+and NVRAMs, to mount flash-drives at `/mnt/<label>`, and other important
+initializations of the guest Linux environment. Field `bootargs` is the
+kernel command-line string passed to Linux at boot. When
+`dtb.backing_store.data_filename` is empty, the emulator generates the
+DTB image at instantiation from the rest of the configuration.
+
+The `cmio` entry in `machine_config` configures the two CMIO buffers
+used to send data in and out of the machine. Fields `rx_buffer` and
+`tx_buffer` each contain only a `backing_store` configuration. For
+example, the input to an advance-state request and the query to an
+inspect-state request are written to the `rx_buffer` memory range.
+Conversely, vouchers, notices, reports, and exceptions are written to
+the `tx_buffer` memory range. For more details on how exactly these
+memory ranges are used, please read the [architecture
+section](#system-architecture) under the guest perspective.
+
+The <a href="#processor_config">`processor`</a> entry in
+`machine_config` describes the main processor state. Field `registers`
+is a flat table of all general-purpose, floating-point, and
+control-and-status registers, plus the nested sub-tables `iflags`,
+`htif`, `clint`, and `plic`. Each register field is a number that sets
+its value. Most users only need to set `mvendorid`, `mimpid`, and
+`marchid`, which the emulator checks at instantiation to ensure the
+configuration matches the running emulator version. During prototyping,
+these can be set to `-1` to make the emulator accept any value. In
+production code, they should be hard-coded. Most CSRs are defined in
+volumes [1 and 2](https://riscv.org/technical/specifications/) of the
+ISA specification. The Cartesi-specific registers (`iprv`, `iunrep`,
+`iflags`, the HTIF and CMIO interfaces) are described under the
+[architecture section](#system-architecture) from the guest perspective.
+The `processor.registers.htif` sub-table holds the initial values of
+HTIF state. Field `iconsole` is a bitmask declaring whether the emulator
+honors console-putchar and console-getchar commands. It defaults to
+putchar-only. The `cartesi-machine` command-line option
+`-i`/`--htif-console-getchar` enables getchar. Field `iyield` is a
+bitmask declaring whether the emulator honors automatic and manual yield
+commands. It defaults to both enabled. The `cartesi-machine` command-line
+options `--no-htif-yield-automatic` and `--no-htif-yield-manual` clear
+the corresponding bits.
+
+The `uarch` entry describes the microarchitecture state. The
+`uarch.processor` field controls the uarch processor. Like the main
+processor, it includes a `uarch.processor.registers` flat table with all
+registers. Register `uarch.processor.registers.halt_flag` is non-zero
+when the uarch is halted. The `uarch.ram` field controls the uarch RAM.
+Unlike the main processor RAM, the uarch RAM is fixed in length.
+Moreover, the `uarch.ram.backing_store.data_filename` is typically left
+blank (other than in unit tests), as the emulator automatically fills
+the uarch RAM with an implementation of the main processor fetch-execute
+loop compiled to function within the uarch.
+
+The `pmas` entry describes the memory range containing one PMA (for
+*physical memory attributes*) entry for each address range that is
+visible to the main processor. This is automatically filled by the
+emulator during initialization. PMAs are described in the [PMAs
+subsection](#pmas) of the system architecture chapter.
+
+The `hash_tree` entry configures the global hash-tree structure that
+supports efficient computation of state hashes and proofs. Field
+`hash_tree.hash_function` controls the hash function used in the hash
+tree. It defaults to `"keccak256"`, which is suitable for use with the
+uarch. Set it to `"sha256"` for use with the ZK prover instead. These
+options are mutually exclusive: a machine that was initialized for use
+with the uarch can never be used with the ZK prover (and vice-versa).
+Fields `hash_tree.phtc_size` and `hash_tree.phtc_filename` control the
+*page hash-tree cache*. This is a cache that contains the entire dense
+hash tree for the most recently used pages in the address space. Field
+`hash_tree.phtc_size` gives the number of entries, and
+`hash_tree.phtc_filename` gives the filename for the backing image in
+the host. Field `hash_tree.sht_filename` gives the filename for the
+backing image of the global *sparse hash tree* that combines the dense
+hash trees of the different memory ranges.
+
+Finally, the `virtio` entry is a list of configurations for VirtIO
+devices that can be used when the machine is used in non-reproducible
+mode during development.
+
+### Default configuration
+
+The `cartesi.machine:get_default_config()` method can be used to obtain
+the default Cartesi Machine configuration:
+
+``` lua
+-- Load the Cartesi module and utilities
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+
+-- Obtain default config
+local default_config = cartesi.machine:get_default_config()
+
+-- Pretty-print it
+io.write("return ")
+util.dump_table(default_config, io.stdout)
+```
+
+This produces:
+
+``` lua
+return {
+  cmio = {
+    rx_buffer = {
+      backing_store = {
+        create = false,
+        data_filename = "",
+        dht_filename = "",
+        dpt_filename = "",
+        shared = false,
+        truncate = false,
+      },
+    },
+    tx_buffer = {
+      backing_store = {
+        create = false,
+        data_filename = "",
+        dht_filename = "",
+        dpt_filename = "",
+        shared = false,
+        truncate = false,
+      },
+    },
+  },
+  dtb = {
+    backing_store = {
+      create = false,
+      data_filename = "",
+      dht_filename = "",
+      dpt_filename = "",
+      shared = false,
+      truncate = false,
+    },
+    bootargs = "quiet earlycon=sbi console=hvc0 uio_pdrv_genirq.of_id=generic-uio root=/dev/pmem0 rw init=/usr/sbin/cartesi-init",
+    entrypoint = "",
+    init = "",
+  },
+  flash_drive = {},
+  hash_tree = {
+    create = false,
+    hash_function = "keccak256",
+    phtc_filename = "",
+    phtc_size = 0x1000,
+    shared = false,
+    sht_filename = "",
+  },
+  nvram = {},
+  pmas = {
+    backing_store = {
+      create = false,
+      data_filename = "",
+      dht_filename = "",
+      dpt_filename = "",
+      shared = false,
+      truncate = false,
+    },
+  },
+  processor = {
+    backing_store = {
+      create = false,
+      data_filename = "",
+      dht_filename = "",
+      dpt_filename = "",
+      shared = false,
+      truncate = false,
+    },
+    registers = {
+      clint = {
+        mtimecmp = 0x0,
+      },
+      f0 = 0x0,
+      f1 = 0x0,
+      f10 = 0x0,
+      f11 = 0x0,
+      f12 = 0x0,
+      f13 = 0x0,
+      f14 = 0x0,
+      f15 = 0x0,
+      f16 = 0x0,
+      f17 = 0x0,
+      f18 = 0x0,
+      f19 = 0x0,
+      f2 = 0x0,
+      f20 = 0x0,
+      f21 = 0x0,
+      f22 = 0x0,
+      f23 = 0x0,
+      f24 = 0x0,
+      f25 = 0x0,
+      f26 = 0x0,
+      f27 = 0x0,
+      f28 = 0x0,
+      f29 = 0x0,
+      f3 = 0x0,
+      f30 = 0x0,
+      f31 = 0x0,
+      f4 = 0x0,
+      f5 = 0x0,
+      f6 = 0x0,
+      f7 = 0x0,
+      f8 = 0x0,
+      f9 = 0x0,
+      fcsr = 0x0,
+      htif = {
+        fromhost = 0x0,
+        iconsole = 0x2,
+        ihalt = 0x1,
+        iyield = 0x3,
+        tohost = 0x0,
+      },
+      icycleinstret = 0x0,
+      iflags = {
+        H = 0x0,
+        X = 0x0,
+        Y = 0x0,
+      },
+      ilrsc = 0xffffffffffffffff,
+      iprv = 0x3,
+      iunrep = 0x0,
+      marchid = 0x14,
+      mcause = 0x0,
+      mcounteren = 0x0,
+      mcycle = 0x0,
+      medeleg = 0x0,
+      menvcfg = 0x0,
+      mepc = 0x0,
+      mideleg = 0x0,
+      mie = 0x0,
+      mimpid = 0x14,
+      mip = 0x0,
+      misa = 0x800000000014112d,
+      mscratch = 0x0,
+      mstatus = 0xa00000000,
+      mtval = 0x0,
+      mtvec = 0x0,
+      mvendorid = 0x6361727465736920,
+      pc = 0x80000000,
+      plic = {
+        girqpend = 0x0,
+        girqsrvd = 0x0,
+      },
+      satp = 0x0,
+      scause = 0x0,
+      scounteren = 0x0,
+      senvcfg = 0x0,
+      sepc = 0x0,
+      sscratch = 0x0,
+      stval = 0x0,
+      stvec = 0x0,
+      x0 = 0x0,
+      x1 = 0x0,
+      x10 = 0x0,
+      x11 = 0x7ff00000,
+      x12 = 0x0,
+      x13 = 0x0,
+      x14 = 0x0,
+      x15 = 0x0,
+      x16 = 0x0,
+      x17 = 0x0,
+      x18 = 0x0,
+      x19 = 0x0,
+      x2 = 0x0,
+      x20 = 0x0,
+      x21 = 0x0,
+      x22 = 0x0,
+      x23 = 0x0,
+      x24 = 0x0,
+      x25 = 0x0,
+      x26 = 0x0,
+      x27 = 0x0,
+      x28 = 0x0,
+      x29 = 0x0,
+      x3 = 0x0,
+      x30 = 0x0,
+      x31 = 0x0,
+      x4 = 0x0,
+      x5 = 0x0,
+      x6 = 0x0,
+      x7 = 0x0,
+      x8 = 0x0,
+      x9 = 0x0,
+    },
+  },
+  ram = {
+    backing_store = {
+      create = false,
+      data_filename = "",
+      dht_filename = "",
+      dpt_filename = "",
+      shared = false,
+      truncate = false,
+    },
+    length = 0x0,
+  },
+  uarch = {
+    processor = {
+      backing_store = {
+        create = false,
+        data_filename = "",
+        dht_filename = "",
+        dpt_filename = "",
+        shared = false,
+        truncate = false,
+      },
+      registers = {
+        cycle = 0x0,
+        halt_flag = 0x0,
+        pc = 0x600000,
+        x0 = 0x0,
+        x1 = 0x0,
+        x10 = 0x0,
+        x11 = 0x0,
+        x12 = 0x0,
+        x13 = 0x0,
+        x14 = 0x0,
+        x15 = 0x0,
+        x16 = 0x0,
+        x17 = 0x0,
+        x18 = 0x0,
+        x19 = 0x0,
+        x2 = 0x0,
+        x20 = 0x0,
+        x21 = 0x0,
+        x22 = 0x0,
+        x23 = 0x0,
+        x24 = 0x0,
+        x25 = 0x0,
+        x26 = 0x0,
+        x27 = 0x0,
+        x28 = 0x0,
+        x29 = 0x0,
+        x3 = 0x0,
+        x30 = 0x0,
+        x31 = 0x0,
+        x4 = 0x0,
+        x5 = 0x0,
+        x6 = 0x0,
+        x7 = 0x0,
+        x8 = 0x0,
+        x9 = 0x0,
+      },
+    },
+    ram = {
+      backing_store = {
+        create = false,
+        data_filename = "",
+        dht_filename = "",
+        dpt_filename = "",
+        shared = false,
+        truncate = false,
+      },
+    },
+  },
+  virtio = {},
+}
+```
+
+As it is, the default configuration is not functional. At a minimum, it
+is missing the RAM length, the image to be loaded into RAM, and a flash
+drive with the root file-system.
+
+The `dtb.bootargs` field carries the default kernel command line. The
+individual parameters have the following meaning:
+
+- `quiet earlycon=sbi console=hvc0` silences the printing of kernel
+  initialization messages, enables the SBI-based early console, used
+  before the main console is up, and sets the main console to the
+  hypervisor console virtual device;
+- `uio_pdrv_genirq.of_id=generic-uio` instructs the UIO platform driver
+  to bind to nodes with the `generic-uio` compatible string, used by
+  NVRAM ranges;
+- `root=/dev/pmem0 rw` sets the first flash drive (exposed by the
+  kernel as a persistent-memory block device) as the root file-system
+  and instructs the kernel to mount the root file-system read-write;
+- `init=/usr/sbin/cartesi-init` runs the Cartesi-provided init script,
+  which ends up reading the property `/cartesi-machine/entrypoint` from
+  the device tree (with the contents of `dtb.entrypoint`) and running it
+  as user `dapp`.
+
+### Generating configurations
+
+The `cartesi-machine` command-line utility can be used to output
+complete Cartesi Machine configurations. Recall from an [earlier
+example](#initialization) that the `cartesi-machine` command
+
+``` bash
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    -- ls /bin
+```
+
+builds a Cartesi Machine that, when run, lists the contents of the
+`/bin/` directory before gracefully halting. The kernel `linux.bin` and
+root file-system `rootfs.ext2` come from the defaults under
+`/usr/share/cartesi-machine/images/`.
+
+The command-line option `--store-config[=<filename>]` makes the utility
+capture the initial machine configuration. Without an argument, the
+configuration is printed to standard output. With `=<filename>`, it is
+written to that file (and `--load-config=<filename>` reloads it later).
+
+Adding `--store-config` to the example above, we obtain the complete
+contents of the corresponding `machine_config`, including default values
+conveniently marked as such by the `cartesi-machine` utility. Editing
+them out and storing into a file, we would get:
+
+``` lua
+return {
+  dtb = {
+    entrypoint = "ls /bin",
+  },
+  flash_drive = {
+    {
+      backing_store = {
+        data_filename = "/usr/share/cartesi-machine/images/rootfs.ext2",
+      },
+      label = "root",
+      length = 0x94e6000,
+      start = 0x90000000,
+    },
+  },
+  ram = {
+    backing_store = {
+      data_filename = "/usr/share/cartesi-machine/images/linux.bin",
+    },
+    length = 0x8000000,
+  },
+}
+```
+
+Flash drives are exposed by the kernel as `/dev/pmem<i>` devices. NVRAMs
+are exposed as `/dev/uio<i>` devices. The emulator publishes each
+drive’s `label` field inside the device-tree node `/aliases`.
+
+When the user passes arguments after `--` on the `cartesi-machine`
+command line, the utility appends them to `dtb.entrypoint`. The emulator
+then publishes this in the device-tree property `entrypoint` of the
+`/cartesi-machine` node.
+
+The command-line utility can also run Cartesi Machines with additional
+flash drives. Adding `--store-config` to the [earlier
+example](#flash-drives) that loaded `foo.ext2` as a flash drive
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --flash-drive="label:foo,data_filename:foo.ext2" \
+    -- "cat /mnt/foo/bar.txt"
+```
+
+captures a configuration whose essential, edited-down form is
+
+``` lua
+return {
+  dtb = {
+    entrypoint = "cat /mnt/foo/bar.txt",
+    init = "dev=$(flashdrive foo)\
+busybox mkdir -p \"/mnt/foo\" && busybox mount \"$dev\" \"/mnt/foo\"\
+",
+  },
+  flash_drive = {
+    {
+      backing_store = {
+        data_filename = "/usr/share/cartesi-machine/images/rootfs.ext2",
+      },
+      label = "root",
+      length = 0x94e6000,
+      start = 0x90000000,
+    },
+    {
+      backing_store = {
+        data_filename = "foo.ext2",
+      },
+      label = "foo",
+      length = 0x8000,
+      start = 0xa0000000,
+    },
+  },
+  ram = {
+    backing_store = {
+      data_filename = "/usr/share/cartesi-machine/images/linux.bin",
+    },
+    length = 0x8000000,
+  },
+}
+```
+
+The new flash drive with label `foo` is added by the `cartesi-machine`
+command-line utility right after `root`. The utility also adds a small
+snippet to `dtb.init` that mounts the drive at `/mnt/foo`. The emulator
+adds the contents of `dtb.init` to the device-tree as property `init` of
+node `/cartesi-machine`, and the Cartesi-provided init script sources it
+as user `root` before executing the entrypoint. As a result, the
+file-system carried by `foo.ext2` on the host is mounted at `/mnt/foo`
+in the guest. That is where the entrypoint `cat /mnt/foo/bar.txt` finds
+the file to dump to the console.
+
+### Additional sample configurations
+
+Here are the (simplified) configurations for the other examples from the
+documentation of the `cartesi-machine` command-line utility.
+
+A Cartesi Machine that has nothing to do. This is the [introductory
+example](#command-line-interface), and its configuration, edited down to
+its essentials, is
+
+``` lua
+return {
+  dtb = {
+    init = "echo \"\
+         .\
+        / \\\\\
+      /    \\\\\
+\\\\---/---\\\\  /----\\\\\
+ \\\\       X       \\\\\
+  \\\\----/  \\\\---/---\\\\\
+       \\\\    / CARTESI\
+        \\\\ /   MACHINE\
+         '\
+\"\
+",
+  },
+  flash_drive = {
+    {
+      backing_store = {
+        data_filename = "/usr/share/cartesi-machine/images/rootfs.ext2",
+      },
+      label = "root",
+      length = 0x94e6000,
+      start = 0x90000000,
+    },
+  },
+  ram = {
+    backing_store = {
+      data_filename = "/usr/share/cartesi-machine/images/linux.bin",
+    },
+    length = 0x8000000,
+  },
+}
+```
+
+The `dtb.init` field carries the ASCII-art splash that the
+`cartesi-machine` utility appends to its setup phase by default. This is
+what produces the Cartesi logo printed before each entrypoint runs.
+
+A Cartesi Machine that periodically reports its progress using the HTIF
+Yield device:
+
+``` lua
+return {
+  dtb = {
+    entrypoint = "for i in $(seq 0 5 1000); do yield automatic progress $i; done",
+  },
+  flash_drive = {
+    {
+      backing_store = {
+        data_filename = "/usr/share/cartesi-machine/images/rootfs.ext2",
+      },
+      label = "root",
+      length = 0x94e6000,
+      start = 0x90000000,
+    },
+  },
+  ram = {
+    backing_store = {
+      data_filename = "/usr/share/cartesi-machine/images/linux.bin",
+    },
+    length = 0x8000000,
+  },
+}
+```
+
+A Cartesi Machine that computes the value of a generic mathematical
+expression:
+
+``` lua
+return {
+  dtb = {
+    entrypoint = "readmmap input | lua5.4 -e 'print((string.unpack(\"z\", io.read(\"a\"))))' | bc | writemmap output",
+    init = "dev=$(nvram input)\
+busybox chmod 0664 \"$dev\"\
+dev=$(nvram output)\
+busybox chmod 0664 \"$dev\"\
+busybox chown dapp: \"$dev\"\
+",
+  },
+  flash_drive = {
+    {
+      backing_store = {
+        data_filename = "/usr/share/cartesi-machine/images/rootfs.ext2",
+      },
+      label = "root",
+      length = 0x94e6000,
+      start = 0x90000000,
+    },
+  },
+  nvram = {
+    {
+      backing_store = {
+        data_filename = "input.raw",
+      },
+      label = "input",
+      length = 0x1000,
+      start = 0xa0000000,
+    },
+    {
+      backing_store = {
+        data_filename = "output.raw",
+        shared = true,
+      },
+      label = "output",
+      length = 0x1000,
+      start = 0xa0001000,
+    },
+  },
+  ram = {
+    backing_store = {
+      data_filename = "/usr/share/cartesi-machine/images/linux.bin",
+    },
+    length = 0x8000000,
+  },
+}
+```
+
+Note the two NVRAMs, one for the input and one for the output, and how
+the `cartesi-machine` utility adds a snippet to `dtb.init` that changes
+permissions and ownership of the corresponding devices.
+
+### Loading and running machines
+
+To create a new handle for a machine, use the `cartesi.new()` function.
+The returned `machine` handle can hold a single machine instance, and
+starts empty. To instantiate a Cartesi Machine from a machine
+configuration (e.g., the configurations produced by the
+`cartesi-machine` utility above), use the
+`machine:create(<machine_config>)` method. Alternatively, the shortcut
+`cartesi.machine(<machine_config>)` combines the effects of
+`cartesi.new()` and `machine:create(<machine_config>)` into a single
+call.
+
+For example, the script
+
+``` lua
+-- Load the Cartesi module
+local cartesi = require("cartesi")
+
+-- Instantiate machine from configuration
+local config = require(arg[1])
+local machine = cartesi.machine(config)
+
+-- Run machine until it halts or yields manual
+repeat
+    local break_reason = machine:run(math.maxinteger)
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+```
+
+loads a machine configuration from the Lua module specified in the
+command-line (using `require(arg[1])`). It then creates an instance by
+calling the `cartesi.machine(<machine_config>)` constructor, which it
+stores in the `machine` local variable.
+
+The `machine:run(<max_mcycle>)` method of the Cartesi Machine instance
+runs the corresponding machine until the register `mcycle` reaches
+`<max_mcycle>`, at the latest. The value `math.maxinteger` of `<max_mcycle>` used
+in the script is a very large integer, providing the machine with enough
+cycles to run until it halts or yields manual. Note that the
+`machine:run()` method can return prematurely for a variety of reasons
+(see below), so it should always be called inside a loop. It returns a
+break reason explaining why control was returned to the caller, taken
+from the `cartesi.BREAK_REASON_*` set. The script’s loop terminates when
+the break reason is `BREAK_REASON_HALTED` or
+`BREAK_REASON_YIELDED_MANUALLY`, the two reasons that signal the machine
+has reached a state past which it cannot continue on its own.
+
+At any point, the `machine:get_initial_config()` method can be used to
+obtain the configuration that was used to create a Cartesi Machine
+instance.
+
+<a name="run-cat-foo-bar"></a>
+
+For example, to run the configuration stored in
+`./config-cat-foo-bar.lua` (assuming `./foo.ext2` is available) simply
+run
+
+``` bash
+lua5.4 run-config.lua config-cat-foo-bar
+```
+
+``` text
+Hello world!
+```
+
+(The function call `require(arg[1])` translates the argument
+`"config-cat-foo-bar"` to `"config-cat-foo-bar.lua"` and loads that
+file.)
+
+### Instantiation from persistent state
+
+At any point in their execution, Cartesi Machines can be stored to disk.
+A stored machine can later be loaded to continue its execution from
+where it left off.
+
+> [!NOTE]
+>
+> If the machine initialization involved large image files or a
+> considerable amount of RAM, this operation may consume significant
+> disk space. It will also take the time required by the copying of
+> image files into the directory.
+
+To store a machine at its current state, use the
+`machine:store(<directory>)` method of the Cartesi Machine instance. The
+function call fails when the directory already exists, so existing
+persistent Cartesi Machines are not inadvertently overwritten:
+
+``` lua
+-- Load the Cartesi module
+local cartesi = require("cartesi")
+
+-- Instantiate machine from configuration
+local config = require("config-cat-foo-bar")
+local machine = cartesi.machine(config)
+
+-- Store persistent state to directory
+machine:store("cat-foo-bar")
+```
+
+After the execution of the script above, the directory `./cat-foo-bar/`
+contains all the information needed to instantiate the same machine,
+including copies of all necessary image files. There are no external
+dependencies.
+
+To load a machine from disk, use the `machine:load(<directory>)` method
+on an empty `machine` handle. Alternatively, the shortcut
+`machine = cartesi.machine(<directory>)` combines the effects of
+`machine = cartesi.new()` and `machine:load(<directory>)` into a single
+call. In fact, running the following script
+
+``` lua
+-- Load the Cartesi module
+local cartesi = require("cartesi")
+
+-- Instantiate machine from persistent state directory
+local machine = cartesi.machine("cat-foo-bar")
+
+-- Run machine until it halts or yields manual
+repeat
+    local break_reason = machine:run(math.maxinteger)
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+```
+
+has exactly the same effect as the example [above](#run-cat-foo-bar),
+where the machine was instantiated from the configuration and directly
+run until it halted:
+
+``` text
+Hello world!
+```
+
+As before, the configuration that was used to instantiate a Cartesi
+Machine can be obtained from the machine instance with the method
+`machine:get_initial_config()`. Note that this is *not* the
+configuration that was used to instantiate the machine for the first
+time, but rather the configuration used to instantiate a copy of the
+machine that was stored. More specifically, any
+`backing_store.data_filename` fields point to copies that reside inside
+the storage `<directory>`. Likewise, the values of all registers will
+reflect the values as they were when stored. As for the contents of the
+initial backing files, they may have been modified by the running
+instance before a copy was saved into `<directory>`.
+
+### Limiting execution
+
+The host cannot predict how many cycles the emulator will need until a
+call to `machine:run(math.maxinteger)` returns. One of the uses for the
+`<max_mcycle>` argument in production code is to ensure the call returns
+at a desired frequency, rather than potentially blocking the caller
+indefinitely.
+
+The following script illustrates the process:
+
+``` lua
+-- Load the Cartesi module
+local cartesi = require("cartesi")
+
+-- Writes formatted text to stderr
+local function stderr(fmt, ...)
+    io.stderr:write(string.format(fmt, ...))
+end
+
+-- Instantiate machine from configuration
+local config = require(arg[1])
+local machine = cartesi.machine(config)
+
+local CHUNK = 1000000 -- 1 million cycles
+-- Loop until machine halts or yields manual
+local chunks = 0
+repeat
+    -- Execute at most CHUNK additional cycles, then potentially perform other tasks
+    local break_reason = machine:run(machine:read_reg("mcycle") + CHUNK)
+    chunks = chunks + 1
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+
+-- Print the number of chunks
+stderr("%u chunks\n", chunks)
+```
+
+Each iteration runs the machine for at most an additional `CHUNK`
+cycles. Reading the `mcycle` register with `machine:read_reg("mcycle")`
+returns the current cycle count, which is used to set the new limit to
+`mcycle+CHUNK`. After the call to `machine:run()` returns, the
+application is free to perform other tasks. The loop exits when the
+returned break reason is `BREAK_REASON_HALTED` or
+`BREAK_REASON_YIELDED_MANUALLY`. Any other reason (such as
+`BREAK_REASON_REACHED_TARGET_MCYCLE`, signalling the chunk expired) just
+continues the loop.
+
+``` bash
+lua5.4 run-config-in-chunks.lua config-cat-foo-bar
+```
+
+``` text
+Hello world!
+57 chunks
+```
+
+### Progress feedback
+
+When the computation running inside a Cartesi Machine is intensive, it
+may be desirable to inform users of the progress, so they can plan
+accordingly. On its own, the current value of `mcycle` does not give any
+information concerning how much of the computation still remains. What
+is needed is the value of `mcycle` when the machine halts. This is,
+unfortunately, difficult to estimate from the outside. The guest
+application is in a much better position to estimate its own progress.
+However, it needs a mechanism to communicate its progress back to the
+program controlling the emulator.
+
+The command-line utility `/usr/bin/yield` can be used for this purpose.
+Internally, the tool uses an `ioctl` system-call on the Cartesi-specific
+`/dev/cmio` device. The protocols followed by the `/usr/bin/yield`
+utility to interact with the `/dev/cmio` driver, and by the driver
+itself to communicate with the HTIF Yield device are explained in detail
+under the [guest perspective](#system-architecture). The focus here is
+on its effect on the host program controlling the emulator.
+
+By default, a Cartesi Machine is configured via
+`processor.registers.htif.iyield` to accept HTIF yield automatic
+commands. The field is a bitmask of enabled commands. Setting the
+`cartesi.HTIF_YIELD_CMD_AUTOMATIC_MASK` bit accepts yield automatic, and
+setting `cartesi.HTIF_YIELD_CMD_MANUAL_MASK` accepts yield manual. The
+default machine configuration sets both bits. When automatic yields are
+accepted, a yield automatic command causes the emulator to return
+prematurely from `machine:run(<max_mcycle>)` with break reason
+`BREAK_REASON_YIELDED_AUTOMATICALLY`. When the bit is clear, the command
+is silently ignored and execution continues until the machine halts or
+`mcycle` hits `<max_mcycle>`.
+
+The following example illustrates how Lua scripts can receive progress
+information throughout a computation performed inside a Cartesi Machine:
+
+``` lua
+-- Load the Cartesi module
+local cartesi = require("cartesi")
+
+-- Writes formatted text to stderr
+local function stderr(fmt, ...)
+    io.stderr:write(string.format(fmt, ...))
+end
+
+-- Instantiate machine from configuration
+local config = require(arg[1])
+local machine = cartesi.machine(config)
+
+local CHUNK = 1000000 -- 1 million cycles
+local max_mcycle = CHUNK
+-- Loop until machine halts or yields manual
+repeat
+    -- Execute up to max_mcycle
+    local break_reason = machine:run(max_mcycle)
+    -- Check if machine yielded automatic with a progress report
+    if
+        break_reason == cartesi.BREAK_REASON_YIELDED_AUTOMATICALLY
+        and machine:read_reg("htif_tohost_reason") == cartesi.HTIF_YIELD_AUTOMATIC_REASON_PROGRESS
+    then
+        local permil = machine:read_reg("htif_tohost_data")
+        -- Show progress feedback
+        stderr("Progress: %6.2f\r", permil / 10)
+    end
+    -- Refill the time slice for the next iteration
+    if break_reason == cartesi.BREAK_REASON_REACHED_TARGET_MCYCLE then
+        max_mcycle = max_mcycle + CHUNK
+        -- Potentially perform other tasks
+    end
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+-- Machine is now halted or yielded manual
+stderr("\nCycles: %u\n", machine:read_reg("mcycle"))
+```
+
+The loop repeats until the break reason returned by `machine:run()` is
+`BREAK_REASON_HALTED` or `BREAK_REASON_YIELDED_MANUALLY`. As before, the
+computation is performed in chunks. At each iteration, the script tries
+to advance the computation until the end of the next chunk. A
+`BREAK_REASON_YIELDED_AUTOMATICALLY` return means the guest ran a yield
+automatic command. That command can be called for different reasons. The
+reason and the associated data are available in the `htif_tohost_reason`
+and `htif_tohost_data` registers, which expose pre-decoded fields of the
+HTIF `tohost` register. The constant
+`cartesi.HTIF_YIELD_AUTOMATIC_REASON_PROGRESS` corresponds to a progress
+report, in which case `htif_tohost_data` holds the progress in
+per-mille. A `BREAK_REASON_REACHED_TARGET_MCYCLE` return means the chunk
+expired without a yield or halt. In that case the script bumps
+`max_mcycle` by another `CHUNK` and could perform any desired
+“per-chunk” tasks before looping.
+
+For example, running the script with the command-line
+
+``` bash
+lua5.4 run-config-in-chunks-with-progress.lua config-progress
+```
+
+produces the output (shown at 44% completion) below
+
+``` text
+Progress:  44.00
+```
+
+This is similar to the `cartesi-machine` command-line
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    -- $'for i in $(seq 0 5 1000); do yield automatic progress $i; done'
+```
+
+which uses an equivalent mechanism for progress reports.
+
+### Cartesi Machine templates
+
+Recall that, to instantiate a [Cartesi Machine
+template](#cartesi-machine-templates), we first replace its NVRAM
+place-holders with their actual content. After that, we can run the
+resulting machine. We saved the simple calculator template into
+directory `"calculator-template"` by running the `cartesi-machine`
+utility with `--store="calculator-template"`, [as shown
+earlier](#cartesi-machine-templates). There, we also instantiated and
+ran the template with `cartesi-machine`’s `--replace-memory-range`
+command-line option. Internally, the utility uses the
+`machine:replace_memory_range(<memory_range_config>)` method of the
+Cartesi Machine instance to replace an existing memory range. The
+replacement target is identified by the `memory_range_config`’s `start`
+and `length` fields, which must match those of an existing memory range
+in the Cartesi Machine instance. If the memory range is a flash drive or
+an NVRAM, the `label` field can be used to identify it instead. The
+following code snippet shows how to instantiate a Cartesi Machine
+template using the Lua API:
+
+``` lua
+-- Load the Cartesi module
+local cartesi = require("cartesi")
+
+-- Instantiate machine from template
+local machine = cartesi.machine("calculator-template")
+
+-- Replace input NVRAM by label
+machine:replace_memory_range({
+    label = "input",
+    backing_store = { data_filename = assert(arg[1], "missing input image filename") },
+})
+
+-- Replace output NVRAM by label
+machine:replace_memory_range({
+    label = "output",
+    backing_store = {
+        data_filename = assert(arg[2], "missing output image filename"),
+        shared = true,
+    },
+})
+
+-- Run machine until it halts or yields manual
+repeat
+    local break_reason = machine:run(math.maxinteger)
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+```
+
+The code starts by loading the calculator template from directory
+`"calculator-template"`. It then calls
+`machine:replace_memory_range(<memory_range_config>)` to replace the
+input NVRAM, identifying it by `label` and pointing
+`backing_store.data_filename` at the filename passed as the first
+argument to the script. A second call replaces the output NVRAM
+analogously, also setting `backing_store.shared` to `true` so results
+can be read from the file after the machine is executed. Finally, the
+script runs the machine until it halts or yields manual.
+
+To see the example running, execute
+
+``` bash
+lua5.4 run-calculator-with-new-drives.lua input.raw output.raw
+lua5.4 -e 'print((string.unpack("z", io.read("a"))))' < output.raw
+```
+
+The result is, as expected,
+
+``` text
+10786158809173895446375831144734148401707861873653839436405804869463\
+96054833005778796250863934445216126720683279228360145952738612886499\
+73495708458383684478649003115037698421037988831222501494715481595948\
+96901677837132352593468675094844090688678579236903861342030923488978\
+36036892526733668721977278692363075584
+```
+
+### State hashes
+
+State hashes (defined earlier under [State hashes](#state-hashes)) are
+Merkle tree root hashes of the machine’s entire address space. Here we
+obtain them from a Cartesi Machine instance with the following script:
+
+``` lua
+-- Load the Cartesi module
+local cartesi = require("cartesi")
+
+-- Writes formatted text to stderr
+local function stderr(fmt, ...)
+    io.stderr:write(string.format(fmt, ...))
+end
+
+-- Converts hash from binary to hexadecimal string
+local function hexhash(hash)
+    return (string.gsub(hash, ".", function(c)
+        return string.format("%02x", string.byte(c))
+    end))
+end
+
+-- Instantiate machine from configuration
+local config = require(arg[1])
+local machine = cartesi.machine(config)
+
+-- Print the initial cycle count and root hash
+stderr("%u: %s\n", machine:read_reg("mcycle"), hexhash(machine:get_root_hash()))
+
+-- Run machine until it halts or yields manual
+local break_reason
+repeat
+    break_reason = machine:run(math.maxinteger)
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+
+-- Print machine status
+if break_reason == cartesi.BREAK_REASON_HALTED then
+    stderr("\nHalted\n")
+else
+    stderr("\nYielded manual\n")
+end
+stderr("Cycles: %u\n", machine:read_reg("mcycle"))
+
+-- Print the final cycle count and root hash
+stderr("%u: %s\n", machine:read_reg("mcycle"), hexhash(machine:get_root_hash()))
+```
+
+State hashes can be obtained with the `machine:get_root_hash()` method,
+which returns the corresponding Keccak-256 hash as a 32-byte binary
+string. State hashes are produced from an internal Merkle tree data
+structure that is maintained in a lazy fashion. The performance penalty
+imposed on the emulator, were it required to keep the Merkle tree
+up-to-date, would be unacceptable (by several orders of magnitude). If
+no state hashes are needed, the Merkle tree is not updated and
+negligible cost is incurred. However, depending on the extent to which
+the state was modified since the Merkle tree was last updated, the cost
+of implicitly updating it prior to returning the state hash can be
+substantial.
+
+In past releases, the Merkle tree was kept in memory only. When a
+machine was stored to disk with `machine:store(<directory>)`, the root
+hash was updated and stored along with the machine state. Then, when it
+was loaded with `machine:load(<directory>)`, the root hash was computed
+from scratch and compared against what was stored.
+
+Now, every address range in the machine has an associated
+`backing_store` that includes the `backing_store.dht_filename` (for
+dense hash tree) and `backing_store.dpt_filename` (for dirty-page tree)
+fields, and the `machine_config` includes a new `hash_tree` entry with
+`phtc_filename` (for page hash-tree cache) and `sht_filename` (for
+sparse hash tree) fields. These were added to enable persistent Merkle
+trees. A call to `machine:store(<directory>)` stores the Merkle tree
+structures in their current state. Conversely,
+`machine:load(<directory>)` loads the tree structure back up. Moreover,
+when these files are marked as `shared` in the configuration, the tree
+is maintained up-to-date on disk as well. This means that it is now
+possible to operate a machine entirely from disk with minimal additional
+overhead.
+
+Before running the machine, the script obtains the initial state hash,
+converts it to hexadecimal, and prints the result. The script then runs
+the machine until it halts or yields manual. Once the machine is halted,
+the script obtains and prints the final state hash.
+
+Initial state hashes can be used to ensure the machine instantiated by
+the script indeed matches the machine created by the `cartesi-machine`
+utility, and final state hashes to verify that computations also agree.
+The output of running
+
+``` bash
+lua5.4 run-config-with-hashes.lua config-nothing-to-do
+```
+
+is exactly the same as running the same Cartesi Machine via the
+`cartesi-machine` utility.
+
+``` bash
+cartesi-machine \
+    --initial-hash \
+    --final-hash
+```
+
+``` text
+0: d28274b4ff458388fccda9766418ad2412e25ca3f745290e8258462a6bf2fbcb
+
+         .
+        / \
+      /    \
+\---/---\  /----\
+ \       X       \
+  \----/  \---/---\
+       \    / CARTESI
+        \ /   MACHINE
+         '
+
+Nothing to do.
+
+Halted
+Cycles: 41860482
+41860482: e8cf5abc4fd1c72a6ec106c9d3f9ad2f2053ef6d142864fc12c5e084458ac0bc
+```
+
+Note that both the initial and the final state hashes printed by the
+script match those printed by the utility, as expected.
+
+### External state access
+
+The entire Cartesi Machine state is transparently exposed to the
+controlling program. A variety of methods can be used to query a machine
+instance for any value in its state.
+
+The method `machine:read_word(<address>)` returns the 64-bit word at
+`<address>`, which must be 8-byte aligned. (Due to the alignment
+requirements, this always falls entirely inside a single address range.)
+
+The value of any register can be obtained by name with the
+`machine:read_reg("<name>")` method. The valid names are derived from
+the leaves of `processor.registers` in the
+[`processor_config`](#processor_config) schema by joining nested
+sub-tables with an underscore. For example,
+`processor.registers.htif.tohost` becomes `htif_tohost`,
+`processor.registers.iflags.H` becomes `iflags_H`, and
+`processor.registers.clint.mtimecmp` becomes `clint_mtimecmp`. (The call
+`machine:read_reg("mcycle")` has already been encountered several
+times.) In addition, the pre-decoded `dev`, `cmd`, `reason`, and `data`
+fields of the `htif_tohost` and `htif_fromhost` registers are exposed by
+appending the field name (e.g. `htif_tohost_reason`). Most registers are
+part of the [RISC-V
+ISA](https://content.riscv.org/wp-content/uploads/2017/05/riscv-spec-v2.2.pdf),
+and its [privileged
+architecture](https://content.riscv.org/wp-content/uploads/2017/05/riscv-privileged-v1.10.pdf).
+Cartesi-specific registers are described under the guest perspective
+sections that cover the [processor](#the-main-processor) and
+[board](#the-board) of the Cartesi Machine architecture.
+
+The method `machine:read_memory(<start>, <length>)` returns a string
+with `<length>` bytes starting at the physical-memory address `<start>`,
+anywhere in the machine address space. This region can fall inside RAM,
+any of the flash drives or NVRAMs, the DTB, the CMIO buffers, etc. It can
+straddle two adjacent memory ranges, or even touch unmapped memory
+(which is presumed filled with zeros for this purpose).
+
+Conversely, any value in the state of a Cartesi Machine instance can be
+modified by the controlling program. In contrast to reading the state,
+writing to the state requires extreme care. First, for obvious reasons,
+external modifications to the state break the reproducibility of Cartesi
+Machines. Second, careless state modifications can easily panic the
+Linux kernel or crash any programs running under it. Nevertheless, there
+are a few scenarios where these modifications are safe and useful.
+
+The method `machine:write_word(<address>, <value>)` writes a 64-bit
+value at the 8-byte aligned `<address>`, with the same address range as
+`read_word`.
+
+The value of any register can be changed with the
+`machine:write_reg("<name>", <value>)` method, where `<name>` is one of
+the names accepted by `read_reg` and `<value>` is a 64-bit integer.
+
+The `machine:write_memory(<start>, <data>)` method writes the string
+`<data>` into any memory range in the state, starting at the
+physical-memory address `<start>`. In contrast to
+`machine:read_memory()`, the bytes in the string `<data>` must fit
+entirely inside a single memory range (i.e., it cannot straddle an
+address range boundary and cannot fall in a range mapped to a device, or
+in an unmapped region). Memory ranges include the RAM, the DTB, any of
+the flash drives or NVRAMs, the CMIO buffers, etc.
+
+The typical use for `machine:write_memory()` is when a new input to a
+Rolling Cartesi Machine has become available from Cartesi Rollups.
+Another use is when an input flash drive or NVRAM was instantiated
+without an image file, and is thus filled with zeros in the initial
+machine state. Before running the machine for the first time, it is safe
+to replace the contents of the range with the desired input. (Note,
+however, that if a memory range does have an associated `shared` image
+file, the `machine:write_memory()` method *will* modify the associated
+image file on disk as well as its mapping in the Cartesi Machine state.)
+Another use case is in low-level debugging sessions. (The `gdb` remote
+serial protocol requires the ability to externally modify the state.)
+
+As an example, consider the following script:
+
+``` lua
+-- Load the Cartesi module
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+
+-- Instantiate machine from configuration
+local calculator_config = require("config-calculator")
+local machine = cartesi.machine(calculator_config)
+
+-- Write expression to input NVRAM
+local input_nvram = assert(util.find_drive(calculator_config, "nvram", "input"))
+machine:write_memory(input_nvram.start, table.concat(arg, " ") .. "\n")
+
+-- Run machine until it halts or yields manual
+repeat
+    local break_reason = machine:run(math.maxinteger)
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+
+-- Read result from output NVRAM
+local output_nvram = assert(util.find_drive(calculator_config, "nvram", "output"))
+print((string.unpack("z", machine:read_memory(output_nvram.start, output_nvram.length))))
+```
+
+The script loads `calculator_config` from its Lua module
+`./config-calculator.lua` and instantiates a Cartesi Machine from it.
+This is the configuration for using the `bc` program to evaluate an
+arithmetic expression. It locates the pristine input and output NVRAMs
+with the `cartesi.util.find_drive(<config>, <kind>, <label>)` helper,
+which returns the `<kind>` drive (here an `nvram`) carrying the given
+`<label>`, with its `log2_size` filled in. The script concatenates its
+command-line arguments, line-terminates them, and writes them at the
+start of the input NVRAM. It then runs the machine until it halts or
+yields manual. Finally, it reads the output NVRAM contents, extracts the
+first null-terminated string from it, and prints the result.
+
+Running the script with the command-line
+
+``` bash
+lua5.4 run-calculator.lua 6*2^1024 + 3*2^512
+```
+
+produces the output
+
+``` text
+10786158809173895446375831144734148401707861873653839436405804869463\
+96054833005778796250863934445216126720683279228360145952738612886499\
+73495708458383684478649003115037698421037988831222501494715481595948\
+96901677837132352593468675094844090688678579236903861342030923488978\
+36036892526733668721977278692363075584
+```
+
+The number is indeed the value of the expression
+6×2<sup>1024</sup>+3×2<sup>512</sup>.
+
+External state modifications are widely used in the setup of artificial,
+unexpected conditions for regression tests.
+
+### State value proofs
+
+Value proofs concerning the state of the Cartesi Machine can be obtained
+from any instance using the method
+`machine:get_proof(<address>, <log2_target_size>[, <log2_root_size>])`.
+
+*State value proofs* are proofs that a given node in the Merkle tree of
+the Cartesi Machine state has a given hash. Each Merkle tree node covers
+a contiguous range of the machine’s 64-bit address space. The size of a
+range is always a power of 2 (given by the `<log2_target_size>`
+parameter). Since the leaves have size `32` bytes, the valid values for
+`<log2_target_size>` are `5`…`64`. The range corresponding to each node
+starts at an `<address>` that is a multiple of its size.
+
+Recall that the state Merkle tree is maintained in a lazy fashion.
+Therefore, just like with the `machine:get_root_hash()` method, the
+Merkle tree will be implicitly updated to account for state changes.
+This means the time it takes to obtain a proof depends on the extent to
+which the state has been modified since the Merkle tree was last
+updated.
+
+The `machine:get_proof()` method returns a table with the following
+structure:
+
+``` lua
+proof ::= {
+  root_hash ::= string,
+  target_hash ::= string,
+  sibling_hashes ::= {
+    [1] ::= string,
+    [2] ::= string,
+    ...
+    [log2_root_size-log2_target_size] ::= string
+  }
+}
+```
+
+Field `root_hash` is the root hash of the 2^`<log2_root_size>`-byte
+subtree containing `<address>`. The value of `<log2_root_size>` defaults
+to `cartesi.HASH_TREE_LOG2_ROOT_SIZE`, in which case `root_hash` equals
+the value returned by `machine:get_root_hash()`. The `target_hash` field
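+contains the hash of the node corresponding to the `<address>` and
+`<log2_target_size>` arguments. The returned table also carries a `log2_root_size` field, which the script further below checks against `cartesi.HASH_TREE_LOG2_ROOT_SIZE`.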
+
+To understand the contents of the `sibling_hashes` array, consider a
+path from the target node (included), up the Merkle tree, all the way to
+the root node (excluded). When this path is traversed, a number of nodes
+are visited. The `sibling_hashes` array contains the hashes of the
+*siblings* of all nodes visited.
+
+Using the data in a proof, it is possible to verify the claim that a
+Merkle tree with a given root hash contains a target node with a given
+hash and size at the position given by its address. The following script
+verifies the state value proof for the output NVRAM in the calculator
+example discussed above. It uses two helper functions from the
+`hash-tree.lua` sample module to check the proof returned by
+`machine:get_proof()`. These helpers are shown and explained under
+[Slicing and splicing](#slicing-and-splicing) in the Blockchain
+perspective.
+
+The `cartesi.keccak256(<string>)` function of the `cartesi` Lua module
+returns the hash of the byte string `<string>`. The
+`cartesi.keccak256(<hash1>, <hash2>)` overload returns the hash of the
+concatenation of `<hash1>` and `<hash2>`. The `cartesi.sha256(<string>)`
+and `cartesi.sha256(<hash1>, <hash2>)` functions behave analogously.
+
+The calculator script below requires the `cartesi.hash-tree` module and
+uses its `verify_slice` function to verify the output NVRAM proof.
+
+``` lua
+-- Load the Cartesi module
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+local hash_tree = require("cartesi.hash-tree")
+
+-- Instantiate machine from configuration
+local config = require("config-calculator")
+local machine = cartesi.machine(config)
+
+-- Write expression to input NVRAM
+local input_nvram = assert(util.find_drive(config, "nvram", "input"))
+machine:write_memory(input_nvram.start, table.concat(arg, " ") .. "\n")
+
+-- Run machine until it halts or yields manual
+repeat
+    local break_reason = machine:run(math.maxinteger)
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+
+-- Obtain value proof for output NVRAM
+local output_state_hash = machine:get_root_hash()
+local output_nvram = assert(util.find_drive(config, "nvram", "output"))
+local output_proof = machine:get_proof(output_nvram.start, output_nvram.log2_size)
+
+-- Proof must be a whole-machine proof rooted at the current machine state
+assert(output_proof.log2_root_size == cartesi.HASH_TREE_LOG2_ROOT_SIZE, "proof depth mismatch")
+assert(output_proof.root_hash == output_state_hash, "proof root mismatch")
+
+-- Verify proof
+hash_tree.verify_slice(output_proof)
+print("\nOutput NVRAM proof accepted!\n")
+
+print((string.unpack("z", machine:read_memory(output_nvram.start, output_nvram.length))))
+```
+
+Running the script with the command-line
+
+``` bash
+lua5.4 run-calculator-with-proof.lua 6*2^1024 + 3*2^512
+```
+
+produces the output
+
+``` text
+
+Output NVRAM proof accepted!
+
+10786158809173895446375831144734148401707861873653839436405804869463\
+96054833005778796250863934445216126720683279228360145952738612886499\
+73495708458383684478649003115037698421037988831222501494715481595948\
+96901677837132352593468675094844090688678579236903861342030923488978\
+36036892526733668721977278692363075584
+```
+
+### Remote Cartesi Machines
+
+The Lua API can also be used to control a Remote Cartesi Machine. The
+functionality is available as the `cartesi.jsonrpc` module. Denote by
+`cartesi_jsonrpc` the module returned by `require"cartesi.jsonrpc"`.
+
+The `cartesi_jsonrpc.connect_server(<remote-address>[, <timeout-ms>])`
+function opens a connection to an existing Remote Cartesi Machine server
+and returns a handle to the connection. Denote the handle by
+`cartesi_jsonrpc_machine`. It is the remote counterpart to the local
+`cartesi.machine`, and behaves in the same way, other than being
+connected to the remote server and exposing additional server-control
+methods.
+
+The `cartesi_jsonrpc_machine:fork_server()` call creates a new server,
+in the same remote computer as the server `cartesi_jsonrpc_machine`
+points to, with an exact, independent copy of the current machine
+instance (if any), and returns a handle connected to this new server.
+
+Just as `cartesi.machine(<machine_config>)` instantiates a local
+machine, `cartesi_jsonrpc_machine(<machine_config>)` instantiates a
+remote machine in the server. Each server can hold a single machine, and
+therefore the machine handle returned is the server handle itself. It
+supports all methods that a local machine supports, and these behave in
+exactly the same way. We will describe the remote-specific behavior.
+
+If a machine already exists in the server, trying to instantiate a new
+one will cause an error. Use the `cartesi_jsonrpc_machine:is_empty()`
+method to check if the server holds a machine instance
+(`cartesi_jsonrpc_machine:destroy()` destroys an existing instance).
+
+The `cartesi_jsonrpc_machine:get_server_version()` method returns a
+`semantic_version` object that contains the server version:
+
+``` lua
+semantic_version ::= {
+  major ::= number,
+  minor ::= number,
+  patch ::= number,
+  pre_release ::= string,
+  build ::= string
+}
+```
+
+The `cartesi_jsonrpc_machine:set_cleanup_call(<call>)` method controls
+what happens when the handle is closed or garbage-collected. The three
+constants `cartesi_jsonrpc.NOTHING`, `cartesi_jsonrpc.DESTROY`, and
+`cartesi_jsonrpc.SHUTDOWN` select the cleanup action. In a handle
+created by `cartesi_jsonrpc.connect_server()`, this defaults to
+`NOTHING`. After all, the server was created by some other process that
+should control its cleanup. In a handle created by
+`cartesi_jsonrpc.spawn_server()`, this defaults to `SHUTDOWN`. The new
+server starts as owned by the current script, and when the handle is
+destroyed, so is the server process.
+
+The following script illustrates the use of the `cartesi.jsonrpc`
+module:
+
+``` lua
+-- Load the JSON-RPC submodule for remote Cartesi Machines
+local cartesi_jsonrpc = require("cartesi.jsonrpc")
+
+-- Writes formatted text to stderr
+local function stderr(fmt, ...)
+    io.stderr:write(string.format(fmt, ...))
+end
+
+-- Connect to remote Cartesi Machine server (shut it down automatically on exit)
+local remote_address = assert(arg[1], "missing remote address")
+stderr("Connecting to remote cartesi machine at '%s'\n", remote_address)
+local cartesi_jsonrpc_machine <close> =
+    assert(cartesi_jsonrpc.connect_server(remote_address)):set_cleanup_call(cartesi_jsonrpc.SHUTDOWN)
+
+-- Print server version (and test connection)
+local v = assert(cartesi_jsonrpc_machine:get_server_version())
+stderr("Connected: remote version is %d.%d.%d\n", v.major, v.minor, v.patch)
+
+-- Instantiate remote machine from configuration
+local machine = cartesi_jsonrpc_machine((require(arg[2])))
+
+-- Run machine until it halts or yields
+while machine:read_reg("iflags_H") == 0 and machine:read_reg("iflags_Y") == 0 do
+    machine:run(math.maxinteger)
+end
+
+-- Print machine status
+if machine:read_reg("iflags_H") ~= 0 then
+    stderr("\nHalted\n")
+else
+    stderr("\nYielded manual\n")
+end
+-- Print cycle count
+stderr("Cycles: %u\n", machine:read_reg("mcycle"))
+```
+
+The script loads the `cartesi.jsonrpc` module and connects to the server
+address given as the first command-line argument. It calls
+`cartesi_jsonrpc_machine:get_server_version()` to test the connection
+and prints the version number. It then instantiates a remote machine by
+calling `cartesi_jsonrpc_machine` with the configuration obtained from
+the second command-line argument, and runs it until it halts or yields.
+The `<close>` annotation combined with
+`set_cleanup_call(cartesi_jsonrpc.SHUTDOWN)` retires the server
+automatically when the script exits.
+
+Recall that, to run a server inside the playground, we opened a separate
+shell into the same playground container (for example, by running
+`docker exec -it playground /bin/bash`), and then ran the
+`cartesi-jsonrpc-machine` server in it
+
+``` bash
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8084
+```
+
+Now, instead of using the `cartesi-machine` command-line utility to
+control it, run the `run-remote-config.lua` client script in the other
+shell
+
+``` bash
+lua5.4 run-remote-config.lua \
+    127.0.0.1:8084 \
+    config-nothing-to-do
+```
+
+The client shell produces
+
+``` text
+Connecting to remote cartesi machine at '127.0.0.1:8084'
+Connected: remote version is 0.6.0
+
+Halted
+Cycles: 41860482
+```
+
+The server shell produces
+
+``` text
+
+         .
+        / \
+      /    \
+\---/---\  /----\
+ \       X       \
+  \----/  \---/---\
+       \    / CARTESI
+        \ /   MACHINE
+         '
+
+Nothing to do.
+```
+
+### Rolling Cartesi Machines
+
+Guest applications running inside Rolling Cartesi Machines communicate
+with the outside world by using Cartesi Rollups. In production, the
+Cartesi Node is responsible for passing advance-state and inspect-state
+requests to the machine and collecting the responses (vouchers, notices,
+reports, and exceptions) that were generated while processing each
+request. When prototyping, the `cartesi-machine` command-line utility
+can be used to play the same part, loading sequentially-numbered
+requests from files and storing sequentially-numbered responses to
+files. Naturally, the Lua interface can also be used to feed requests to
+a Rolling Cartesi Machine and obtain the responses it produces.
+
+The guest application uses the `/dev/cmio` device (typically using the
+libcmt library) to notify the host it is done with the current request
+and ready for the next. While processing each request, it again uses the
+`/dev/cmio` device to notify the host of each new output or report it
+generates. In both cases, the host retrieves the yield *command*,
+*reason*, and request *data* via `machine:receive_cmio_request()`. When
+transitioning between requests, the reason can take the values
+`cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED` (previous request was
+accepted), `cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED` (previous
+request was rejected), or
+`cartesi.HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION` (an unrecoverable error
+was encountered). When generating a new response to a request, the
+reason can take the self-explanatory values
+`cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT` (a voucher or notice)
+and `cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT`.
+
+The data associated with new requests is sent to the machine in the CMIO
+memory range defined by the `memory_range_config` entry stored in the
+`machine_config` as `cmio.rx_buffer`. Conversely, the data associated
+with responses (or exceptions) is obtained from the machine in the
+`cmio.tx_buffer` memory range. The host does not need to access these
+ranges directly. The call
+`machine:send_cmio_response(<revert_root_hash>, <reason>, <data>)`
+records `<revert_root_hash>` in the machine state, writes `<data>` into
+`cmio.rx_buffer`, records the reason and length in `htif_fromhost`, and
+clears `iflags_Y` so the machine can resume. Conversely, the *data*
+value returned by `machine:receive_cmio_request()` is the contents of
+`cmio.tx_buffer` at the yield.
+
+Advance-state inputs are passed as ABI-encoded
+`EvmAdvance(uint256 chainId, address appContract, address msgSender, uint256 blockNumber, uint256 blockTimestamp, uint256 prevRandao, uint256 index, bytes payload)`
+calldata blobs. The *block timestamp* field is in seconds since the
+*Unix epoch*, and the *prev randao* field is a 32-byte big-endian
+unsigned integer. (See the table in the guest perspective
+[architecture](#rollup).)
+
+Outputs come back as ABI-encoded `Voucher(address,uint256,bytes)` or
+`Notice(bytes)` calldata blobs. Reports, exceptions, and inspect-state
+queries are raw payload bytes with no ABI wrapping. The `cartesi.evmu`
+Lua submodule provides `encode_calldata` and `decode_calldata` helpers
+for these signatures.
+
+The following script illustrates how the Lua API can be used to send
+advance-state requests to a Rolling Cartesi Machine, and how it can be
+used to collect the notices produced as responses (we will use the
+server calculator [example](#rolling-cartesi-machines)):
+
+``` lua
+-- Load the JSON-RPC submodule and the EVM ABI helpers
+local cartesi = require("cartesi")
+local cartesi_jsonrpc = require("cartesi.jsonrpc")
+local evmu = require("cartesi.evmu")
+
+local EVM_ADVANCE = "EvmAdvance(uint256 chain_id, address app_contract, address msg_sender, "
+    .. "uint256 block_number, uint256 block_timestamp, uint256 prev_randao, uint256 index, bytes payload)"
+local NOTICE = "Notice(bytes payload)"
+local ZERO_ADDRESS = "0x0000000000000000000000000000000000000000"
+
+-- Writes formatted text to stderr
+local function stderr(fmt, ...)
+    io.stderr:write(string.format(fmt, ...))
+end
+
+-- Encode a raw expression as an EvmAdvance request payload (bc needs a
+-- trailing newline to accept the line as a complete expression)
+local function encode_advance(expr, index)
+    local bint = evmu.bint
+    return evmu.encode_calldata(EVM_ADVANCE, {
+        chain_id = bint.new(0),
+        app_contract = ZERO_ADDRESS,
+        msg_sender = ZERO_ADDRESS,
+        block_number = bint.new(0),
+        block_timestamp = bint.new(os.time()),
+        prev_randao = bint.new(0),
+        index = bint.new(index),
+        payload = evmu.raw(expr .. "\n"),
+    })
+end
+
+-- Print a string folded into lines of width w
+local function fold(s, w)
+    for i = 1, #s, w do
+        print(s:sub(i, i + w - 1))
+    end
+end
+
+-- Decode a response inside a notice
+local function print_decoded_notice(data)
+    fold(evmu.decode_calldata(NOTICE, data, "raw").payload, 68)
+end
+
+-- Connect to remote Cartesi Machine server (and shut it down on exit)
+local remote_address = assert(arg[1], "missing remote address")
+stderr("Connecting to remote cartesi machine at '%s'\n", remote_address)
+local cartesi_jsonrpc_machine <close> =
+    assert(cartesi_jsonrpc.connect_server(remote_address)):set_cleanup_call(cartesi_jsonrpc.SHUTDOWN)
+
+-- Print server version (and test connection)
+local v = assert(cartesi_jsonrpc_machine:get_server_version())
+stderr("Connected: remote version is %d.%d.%d\n", v.major, v.minor, v.patch)
+
+-- Load remote machine from the rolling-calculator template
+local machine = cartesi_jsonrpc_machine("rolling-calculator-template")
+
+-- Snapshot via fork: the backup server keeps the pre-input state
+local backup
+local function snapshot()
+    backup = machine:fork_server()
+end
+local function commit()
+    if backup then
+        backup:shutdown_server()
+    end
+    backup = nil
+end
+local function rollback()
+    assert(backup, "no snapshot to rollback to")
+    local address = machine:get_server_address()
+    machine:shutdown_server()
+    machine:swap(backup)
+    machine:rebind_server(address)
+    backup = nil
+end
+
+-- Run the machine until it halts or stdin closes
+local i = 0
+repeat
+    local break_reason = machine:run(math.maxinteger)
+    if break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY then
+        local _, yield_reason = machine:receive_cmio_request()
+        if yield_reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED then
+            commit()
+            stderr("type expression\n")
+            local expr = io.read()
+            if not expr then
+                break
+            end
+            stderr("%s\n", expr) -- echo the input so non-tty transcripts make sense
+            i = i + 1
+            snapshot()
+            machine:send_cmio_response(
+                machine:get_root_hash(),
+                cartesi.HTIF_YIELD_REASON_ADVANCE_STATE,
+                encode_advance(expr, i)
+            )
+        elseif i > 0 and yield_reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED then
+            stderr("input rejected\n")
+            rollback()
+        else
+            stderr("machine initialization failed\n")
+            break
+        end
+    elseif break_reason == cartesi.BREAK_REASON_YIELDED_AUTOMATICALLY then
+        local _, yield_reason, data = machine:receive_cmio_request()
+        if yield_reason == cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT then
+            stderr("result is\n")
+            print_decoded_notice(data)
+        end
+    end
+until break_reason == cartesi.BREAK_REASON_HALTED
+commit()
+```
+
+Rolling Cartesi Machines must be rolled back to the state they were in
+before they received an advance-state request they later rejected. This
+requires snapshot and rollback support, which are easy to implement
+using the fork functionality of Remote Cartesi Machines. The script
+therefore uses the `cartesi.jsonrpc` module to instantiate a remote
+machine based on the `"rolling-calculator-template"`. The
+`machine:fork_server()` call creates a backup server with a copy of the
+current state. On rejection, the script shuts down the server that
+rejected the input, swaps the backup handle into `machine`, and rebinds
+it to the original server address. On acceptance, it shuts down the
+now-stale backup.
+
+It then enters its main loop, which is executed until the machine halts.
+For each iteration, the script invokes `machine:run(math.maxinteger)` to
+run the machine until it yields or halts. When the call returns, it
+checks if the machine yielded manual. If so, it checks the reason for
+the yield.
+
+If the reason was `cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED`, the
+application accepted the previous request and is ready for the next. The
+script then attempts to obtain a mathematical expression from the
+console. If the user provides one, it creates a new snapshot,
+ABI-encodes the expression as `EvmAdvance` calldata with `cartesi.evmu`,
+and feeds the encoded input through
+`machine:send_cmio_response(machine:get_root_hash(), cartesi.HTIF_YIELD_REASON_ADVANCE_STATE, ...)`.
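+If, however, the reason was `cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED` and at least one input had been sent, the script rolls back the
+machine and continues with the next loop iteration. Any other manual yield is reported as a machine initialization failure and ends the loop.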
+
+> [!NOTE]
+>
+> The `machine:get_root_hash()` passed to `machine:send_cmio_response()`
+> is recorded into the machine state as the state hash to revert to in
+> case the guest application rejects the input. This is required for
+> dispute resolution to operate properly.
+
+If the machine yielded automatic, the script once again checks for the
+yield reason. If the reason was
+`cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT`, the script decodes the
+data as a `Notice` calldata blob, extracts its `payload` field as raw
+bytes, and prints the formatted result to the console.
+
+Here is what a session looks like. First, open a separate shell into the
+same docker container (for example, by running
+`docker exec -it playground /bin/bash`) and run the
+`cartesi-jsonrpc-machine` server in it
+
+``` bash
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8085
+```
+
+Then, run the `run-rolling-calculator.lua` client script in the other
+shell
+
+``` bash
+lua5.4 run-rolling-calculator.lua 127.0.0.1:8085
+```
+
+The client prints the connection status to the console and then prompts
+us to type an expression. Entering `6*2^1024 + 3*2^512` causes the
+expected result to be printed, after which the client asks for a new
+expression. Entering an invalid expression `1+(` causes the `calc.sh`
+script running inside the Rolling Cartesi Machine to reject the input.
+Finally, entering `^D` causes the client script to exit and shut down
+the server. The full transcript is
+
+``` text
+Connecting to remote cartesi machine at '127.0.0.1:8085'
+Connected: remote version is 0.6.0
+type expression
+6*2^1024 + 3*2^512
+result is
+10786158809173895446375831144734148401707861873653839436405804869463
+96054833005778796250863934445216126720683279228360145952738612886499
+73495708458383684478649003115037698421037988831222501494715481595948
+96901677837132352593468675094844090688678579236903861342030923488978
+36036892526733668721977278692363075584
+type expression
+1+(
+result is
+input rejected
+type expression
+```
+
+The remote console shows only the error generated when the invalid
+expression `1+(` was entered:
+
+``` text
+(standard_in) 2: syntax error
+```
+
+### Output proofs
+
+Recall that the advance-state requests serviced by a Rolling Cartesi
+Machine are grouped into epochs. The outputs that these requests
+produce, across every epoch, are accumulated in order from genesis as
+the leaves of a single fixed-height Merkle tree. The root of this tree
+over the outputs accepted so far is the *output hashes root hash*. The
+guest writes it to the CMIO tx buffer on every accept, so it is part of
+the machine state.
+
+Disputes are settled over the machine state hash at the end of an epoch.
+The latest output hashes root hash sits in the tx-buffer in that state.
+A [state value proof](#state-value-proofs-1) of the tx-buffer word it
+occupies ties it to the state hash. Therefore, once the [verification
+game](#verification-game) settles the state hash, the output hashes root
+hash is settled with it. The blockchain then verifies any output with
+its *output proof* alone, checking that the leaf `keccak256(<output>)`
+rolls up to the settled output hashes root hash from its global output
+index.
+
+The `hash-tree.lua` sample module accumulates the output hashes tree
+with an incremental keccak Merkle accumulator whose leaves are
+`keccak256(<output>)`. A *frontier* captures the outputs accepted so
+far. At genesis, the frontier is
+`hash_tree.frontier(<log2_max_leaves>)`. The frontier for a later epoch
+can be obtained from the previous epoch’s last output using
+`hash_tree.frontier(<last_output_proof>)`. As each output is accepted,
+`hash_tree.frontier_push_back(<frontier>, <leaf>)` folds its leaf in,
+and `hash_tree.frontier_get_root_hash(<frontier>)` yields the output
+hashes root hash to check against the one the guest wrote. Once the
+epoch closes, `hash_tree.frontier_next_proofs(<frontier>, <leaves>)`
+returns one proof per new output, all against the single final root.
+These helpers are shown and explained under [The output hashes
+tree](#the-output-hashes-tree) in the Blockchain perspective.
+
+The following script extends the Rolling Cartesi Machine calculator
+[example](#rolling-cartesi-machines-1) to collect output proofs and the
+state-value proof for the output hashes root hash. It buffers the
+outputs of each input until the input’s verdict is known. On accept, it
+folds the buffered outputs into the running frontier, checks the
+resulting root against the output hashes root hash the guest wrote to
+the tx buffer, and saves the state value proof of that tx-buffer word,
+obtained with
+`machine:get_proof(cartesi.AR_CMIO_TX_BUFFER_START, cartesi.HASH_TREE_LOG2_WORD_SIZE)`,
+whose `target_hash` equals `cartesi.keccak256(<root hash>)`. On reject,
+it simply discards the buffered outputs, leaving the tree untouched.
+Once the epoch closes, it generates the per-output proofs against the
+final root and verifies each with the same `verify_slice` used above.
+
+``` lua
+-- Load the JSON-RPC submodule, the EVM ABI helpers, and the hash-tree helpers
+local cartesi = require("cartesi")
+local cartesi_jsonrpc = require("cartesi.jsonrpc")
+local evmu = require("cartesi.evmu")
+local util = require("cartesi.util")
+local hash_tree = require("cartesi.hash-tree")
+
+local EVM_ADVANCE = "EvmAdvance(uint256 chain_id, address app_contract, address msg_sender, "
+    .. "uint256 block_number, uint256 block_timestamp, uint256 prev_randao, uint256 index, bytes payload)"
+local NOTICE = "Notice(bytes payload)"
+local ZERO_ADDRESS = "0x0000000000000000000000000000000000000000"
+
+-- Writes formatted text to stderr
+local function stderr(fmt, ...)
+    io.stderr:write(string.format(fmt, ...))
+end
+
+-- Encode a raw expression as an EvmAdvance request payload (bc needs a
+-- trailing newline to accept the line as a complete expression)
+local function encode_advance(expr, index)
+    local bint = evmu.bint
+    return evmu.encode_calldata(EVM_ADVANCE, {
+        chain_id = bint.new(0),
+        app_contract = ZERO_ADDRESS,
+        msg_sender = ZERO_ADDRESS,
+        block_number = bint.new(0),
+        block_timestamp = bint.new(os.time()),
+        prev_randao = bint.new(0),
+        index = bint.new(index),
+        payload = evmu.raw(expr .. "\n"),
+    })
+end
+
+-- Print a string folded into lines of width w
+local function fold(s, w)
+    for i = 1, #s, w do
+        print(s:sub(i, i + w - 1))
+    end
+end
+
+-- Decode a response inside a notice
+local function print_decoded_notice(data)
+    fold(evmu.decode_calldata(NOTICE, data, "raw").payload, 68)
+end
+
+-- Serialize a proof as a Lua chunk and save it
+local function save_proof(proof, name)
+    local f <close> = assert(io.open(name, "w"))
+    f:write("return ")
+    util.dump_table(proof, f)
+    f:write("\n")
+    stderr("saved %s\n", name)
+end
+
+-- Connect to remote Cartesi Machine server (and shut it down on exit)
+local remote_address = assert(arg[1], "missing remote address")
+stderr("Connecting to remote cartesi machine at '%s'\n", remote_address)
+local cartesi_jsonrpc_machine <close> =
+    assert(cartesi_jsonrpc.connect_server(remote_address)):set_cleanup_call(cartesi_jsonrpc.SHUTDOWN)
+
+-- Print server version (and test connection)
+local v = assert(cartesi_jsonrpc_machine:get_server_version())
+stderr("Connected: remote version is %d.%d.%d\n", v.major, v.minor, v.patch)
+
+-- Load remote machine from the rolling-calculator template
+local machine = cartesi_jsonrpc_machine("rolling-calculator-template")
+
+-- Snapshot via fork: the backup server keeps the pre-input state
+local backup
+local function snapshot()
+    backup = machine:fork_server()
+end
+local function commit()
+    if backup then
+        backup:shutdown_server()
+    end
+    backup = nil
+end
+local function rollback()
+    assert(backup, "no snapshot to rollback to")
+    local address = machine:get_server_address()
+    machine:shutdown_server()
+    machine:swap(backup)
+    machine:rebind_server(address)
+    backup = nil
+end
+
+-- Seed frontier builds the end-of-epoch proofs, a running copy checks each input's root
+local seed_frontier = hash_tree.frontier(cartesi.CMIO_LOG2_MAX_OUTPUT_COUNT)
+local running_frontier = hash_tree.frontier_copy(seed_frontier)
+local output_hashes = {} -- keccak256 leaf of every accepted output, in order
+local output_inputs = {} -- the input index each accepted output came from
+local pending_outputs = {} -- outputs of the current input, buffered until its verdict is known
+
+-- On accept, fold the input's outputs into the tree and save its tx-buffer root-hash proof
+local function flush_accepted(input_index, root_hash)
+    for _, output in ipairs(pending_outputs) do
+        local leaf = cartesi.keccak256(output)
+        output_hashes[#output_hashes + 1] = leaf
+        output_inputs[#output_inputs + 1] = input_index
+        hash_tree.frontier_push_back(running_frontier, leaf)
+    end
+    pending_outputs = {}
+    assert(#root_hash == cartesi.HASH_SIZE, "expected output hashes root hash in tx buffer")
+    assert(hash_tree.frontier_get_root_hash(running_frontier) == root_hash, "output hashes root hash mismatch")
+    local proof = machine:get_proof(cartesi.AR_CMIO_TX_BUFFER_START, cartesi.HASH_TREE_LOG2_WORD_SIZE)
+    assert(proof.root_hash == machine:get_root_hash(), "proof root mismatch")
+    assert(proof.target_hash == cartesi.keccak256(root_hash), "tx buffer does not hold the output hashes root hash")
+    hash_tree.verify_slice(proof)
+    save_proof(proof, string.format("input-%d-output-hashes-root-hash-proof.lua", input_index))
+end
+
+-- Run the machine until it halts or stdin closes
+local i = 0
+repeat
+    local break_reason = machine:run(math.maxinteger)
+    if break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY then
+        local _, yield_reason, data = machine:receive_cmio_request()
+        if yield_reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED then
+            commit()
+            -- the just-run input was accepted, so close it out before feeding the next one
+            if i > 0 then
+                flush_accepted(i, data)
+            end
+            stderr("type expression\n")
+            local expr = io.read()
+            if not expr then
+                break
+            end
+            stderr("%s\n", expr) -- echo the input so non-tty transcripts make sense
+            i = i + 1
+            snapshot()
+            machine:send_cmio_response(
+                machine:get_root_hash(),
+                cartesi.HTIF_YIELD_REASON_ADVANCE_STATE,
+                encode_advance(expr, i)
+            )
+        elseif i > 0 and yield_reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED then
+            stderr("input rejected\n")
+            pending_outputs = {} -- discard the rejected input's outputs; the tree is left untouched
+            rollback()
+        else
+            stderr("machine initialization failed\n")
+            break
+        end
+    elseif break_reason == cartesi.BREAK_REASON_YIELDED_AUTOMATICALLY then
+        local _, yield_reason, data = machine:receive_cmio_request()
+        if yield_reason == cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT then
+            pending_outputs[#pending_outputs + 1] = data -- buffer until the input's verdict is known
+            stderr("result is\n")
+            print_decoded_notice(data)
+        end
+    end
+until break_reason == cartesi.BREAK_REASON_HALTED
+commit()
+
+-- Build, verify, and save one per-output proof against the final root
+local proofs = hash_tree.frontier_next_proofs(seed_frontier, output_hashes)
+for k, proof in ipairs(proofs) do
+    hash_tree.verify_slice(proof)
+    save_proof(proof, string.format("output-%d-input-%d-proof.lua", proof.target_address, output_inputs[k]))
+end
+```
+
+Here is what a session looks like. As before, open a separate shell into
+the same docker container and run the `cartesi-jsonrpc-machine` server
+in it
+
+``` bash
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8089
+```
+
+Then, run the `run-rolling-calculator-output-proofs.lua` client script
+in the other shell
+
+``` bash
+lua5.4 run-rolling-calculator-output-proofs.lua 127.0.0.1:8089
+```
+
+Entering `6*2^1024 + 3*2^512` produces the expected result, after which
+the client saves the tx-buffer-word proof tying the output hashes root
+hash into the accepting state, and then, once `^D` closes the epoch, the
+per-output proof against that root. The full transcript is
+
+``` text
+Connecting to remote cartesi machine at '127.0.0.1:8089'
+Connected: remote version is 0.6.0
+type expression
+6*2^1024 + 3*2^512
+result is
+10786158809173895446375831144734148401707861873653839436405804869463
+96054833005778796250863934445216126720683279228360145952738612886499
+73495708458383684478649003115037698421037988831222501494715481595948
+96901677837132352593468675094844090688678579236903861342030923488978
+36036892526733668721977278692363075584
+saved input-1-output-hashes-root-hash-proof.lua
+type expression
+saved output-0-input-1-proof.lua
+```
+
+The same proofs are what the `cartesi-machine` command-line utility
+writes for each accepted input and output when given
+`--cmio-advance-state=output_hashes_root_hash_proof:<pattern>,output_proof:<pattern>`.
+Verifying these proofs against a machine state hash, from the
+blockchain’s perspective, is shown under [Output
+verification](#output-verification).
+
+### State-transition proofs
+
+During verification, the blockchain mediates a [*verification
+game*](#verification-game) between the disputing parties. In brief, the
+parties agree on an initial state hash but claim different final state
+hashes. The game first narrows down the disagreement to the first
+main-processor instruction that deviates, and within it the first uarch
+instruction that deviates. After that, the honest party submits an
+access log, with Merkle-tree proofs for every value read from or written
+to the state, which the blockchain uses to identify the honest party.
+
+To obtain the access log for a specific uarch instruction in the
+execution of a Cartesi Machine instance, first advance to the last
+agreed `<mcycle>` using `machine:run(<mcycle>)`. Then advance the uarch
+to the last agreed `<uarch_cycle>` using
+`machine:run_uarch(<uarch_cycle>)`. Like `machine:run()`,
+`machine:run_uarch()` can return prematurely for a variety of reasons.
+It returns a break reason explaining why control was returned to the
+caller, taken from the `cartesi.UARCH_BREAK_REASON_*` set. For example,
+`cartesi.UARCH_BREAK_REASON_UARCH_HALTED` if the uarch halted before
+reaching the target cycle.
+
+Once the target uarch cycle has been reached, use the
+`machine:log_step_uarch(<log_type>)` function to produce a log that
+advances to the next uarch cycle. Alternatively, if the uarch is halted
+at that point, use `machine:log_reset_uarch()` to produce the log that
+reverts the state of the uarch to its pristine form. Note that either
+function actually performs the action, and therefore modifies the uarch
+state, in addition to collecting the access log. The `<log_type>`
+argument is an integer bitfield formed by OR-ing
+`cartesi.ACCESS_LOG_TYPE_ANNOTATIONS` (to include the notes and brackets
+metadata consumed by the pretty-printer `util.print_log`) and
+`cartesi.ACCESS_LOG_TYPE_LARGE_DATA` (to include the full raw payload of
+large accesses, not just their hashes). Merkle-tree proofs are always
+included in the log.
+
+The format of the access log returned is as follows:
+
+``` lua
+access_log ::= {
+  log_type ::= {
+    annotations ::= boolean,
+    large_data  ::= boolean
+  },
+  accesses ::= {
+    [1] ::= access,
+    [2] ::= access,
+    ...
+    [n] ::= access
+  },
+  notes ::= {
+    [1] ::= string,
+    ...
+    [n] ::= string
+  },
+  brackets ::= {
+    [1] ::= bracket,
+    ...
+    [m] ::= bracket
+  }
+}
+
+access ::= {
+  type         ::= "read" | "write",
+  address      ::= number,
+  log2_size    ::= number,
+  read_hash    ::= string,
+  read         ::= string,
+  written_hash ::= string,
+  written      ::= string,
+  proof        ::= proof
+}
+
+proof ::= {
+  target_address   ::= number,
+  log2_target_size ::= number,
+  log2_root_size   ::= number,
+  target_hash      ::= string,
+  root_hash        ::= string,
+  sibling_hashes   ::= {
+    [1] ::= string,
+    ...
+    [k] ::= string
+  }
+}
+
+bracket ::= {
+  type  ::= "begin" | "end",
+  where ::= number,
+  text  ::= string
+}
+```
+
+The `accesses` array records, in order, all accesses to the machine
+state performed during the execution of the uarch step. Accesses can be
+of `type` either `"read"` or `"write"`. The `address` field gives the
+physical address of the accessed region and `log2_size` gives its size
+as a power of two. The `read_hash` field contains the hash of the data
+as read before the access. For `"write"` accesses, `written_hash`
+contains the hash of the written data. The `read` and `written` fields
+carry the data itself. For accesses at or above the 32-byte hash-tree
+leaf granularity (`log2_size >= 5`), each field is exactly `2^log2_size`
+bytes long. For sub-leaf accesses (`log2_size < 5`, typically
+`log2_size = 3` for an 8-byte word), the field contains the entire
+enclosing aligned 32-byte tree leaf. The `proof` field is used when
+[verifying state transitions](#verifying-state-transitions).
+
+#### Inspecting access logs
+
+When `log_type` includes `cartesi.ACCESS_LOG_TYPE_ANNOTATIONS`, the
+access log includes annotations that help put each access into a larger
+context.
+
+The `notes` array contains a string corresponding to each entry in the
+`accesses` array, describing the word access. The `brackets` contain
+information that groups ranges of word accesses into *scopes*. Each
+bracket entry `type` field tells if the entry marks the `"begin"` or
+`"end"` of a scope. The `where` field gives the position in the
+`accesses` array where the bracket should be “inserted”.
+
+The `print_log(<log>, <out>)` function in the `cartesi.util` module uses
+these annotations to dump a detailed description of the access `<log>`
+into an open file object `<out>` (e.g., `io.stdout` or the return of
+`io.open()`). It indents each access according to the number of
+enclosing scopes and uses the notes to identify what each address refers
+to (a register, a CSR, memory). Addresses and values are printed in
+hexadecimal and decimal.
+
+Running the `dump-uarch-step.lua` program:
+
+``` lua
+-- Load the Cartesi modules
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+
+-- Instantiate machine from configuration
+local config = require(arg[1])
+local machine = cartesi.machine(config)
+
+-- Advance to the requested mcycle and uarch_cycle
+local mcycle = assert(tonumber(arg[2]), "missing mcycle")
+local ucycle = assert(tonumber(arg[3]), "missing uarch_cycle")
+machine:run(mcycle)
+assert(machine:read_reg("mcycle") == mcycle, "machine halted or yielded early")
+machine:run_uarch(ucycle)
+assert(machine:read_reg("uarch_cycle") == ucycle, "uarch halted before target")
+
+-- Obtain access log and dump it to screen
+local log = machine:log_step_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS)
+io.stderr:write(string.format("\nAccess log of uarch step at mcycle=%u uarch_cycle=%u:\n\n", mcycle, ucycle))
+util.print_log(log, io.stderr)
+```
+
+with command:
+
+``` bash
+lua5.4 dump-uarch-step.lua config-nothing-to-do "37056250" "2242"
+```
+
+produces the output:
+
+``` text
+
+         .
+        / \
+      /    \
+\---/---\  /----\
+ \       X       \
+  \----/  \---/---\
+       \    / CARTESI
+Access log of uarch step at mcycle=37056250 uarch_cycle=2242:
+
+begin step
+  1: read uarch.cycle@0x400008(4194312): 0x8c2(2242)
+  2: read uarch.halt_flag@0x400000(4194304): 0x0(0)
+  3: read uarch.pc@0x400010(4194320): 0x600b38(6294328)
+  4: read uarch.ram@0x600b38(6294328): 0x806700000073(141179869986931)
+  begin ecall
+    5: read uarch.x17@0x4000a0(4194464): 0x2(2)
+    6: read uarch.x10@0x400068(4194408): 0xa(10)
+    7: write uarch.pc@0x400010(4194320): 0x600b38(6294328) -> 0x600b3c(6294332)
+  end ecall
+  8: write uarch.cycle@0x400008(4194312): 0x8c2(2242) -> 0x8c3(2243)
+end step
+```
+
+Understanding these logs in detail is unnecessary for all but the most
+low-level internal development at Cartesi. It requires deep knowledge of
+not only RISC-V architecture, but also how Cartesi’s emulator implements
+it. The material is beyond the scope of this document. This particular
+example, however, was hand-picked for illustration purposes. The uarch
+step being executed is the ECALL micro-instruction that asks the
+emulator to print a line-feed (`0x0a`) to the console, completing the
+row `\    / CARTESI` in the splash screen.
+
+#### Verifying state transitions
+
+Each access carries a `proof` field. Using the known state hash before
+the access, it is possible to verify that the `read` value was indeed
+the value stored at `address` in the machine state. For a `"write"`
+access, the `sibling_hashes` in the proof can be used to compute the new
+state hash. Doing this for each access in sequence yields the state hash
+at the end of the step.
+
+The method
+`machine:verify_step_uarch(<state_hash_before>, <access_log>, <state_hash_after>)`
+performs this verification, additionally checking that the accesses
+correspond to the operation of the Cartesi Machine uarch starting from
+`<state_hash_before>`. Note there is no need for a Cartesi Machine
+instance to verify a transition: all required state information is in
+the access log.
+
+The following script illustrates the verification of a state transition.
+
+``` lua
+-- Load the Cartesi modules
+local cartesi = require("cartesi")
+
+-- Instantiate machine from configuration
+local config = require(arg[1])
+local machine = cartesi.machine(config)
+
+-- Advance to the requested mcycle and uarch_cycle
+local mcycle = assert(tonumber(arg[2]), "missing mcycle")
+local ucycle = assert(tonumber(arg[3]), "missing uarch_cycle")
+machine:run(mcycle)
+machine:run_uarch(ucycle)
+
+-- Obtain state hash before step, access log, and state hash after step
+local hash_before = machine:get_root_hash()
+local log = machine:log_step_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS)
+local hash_after = machine:get_root_hash()
+
+-- Potentially mess with the access log to provoke a verification failure
+if arg[4] then
+    local env = { string = string, cartesi = cartesi, log = log }
+    local f = assert(load(arg[4], arg[4], "t", env))
+    f()
+end
+
+-- Verify the uarch step access log
+machine:verify_step_uarch(hash_before, log, hash_after)
+io.stderr:write("State transition accepted!\n")
+```
+
+Without a fourth argument, the script accepts the valid state transition:
+
+``` bash
+lua5.4 verify-uarch-step.lua config-nothing-to-do "37056250" "2242"
+```
+
+``` text
+State transition accepted!
+```
+
+The script is much more interesting when the argument is used to “mess”
+with the access log before verification. For example, changing the
+address of access \#7 (the write to `uarch.pc`) causes the program to
+reject the state transition proof:
+
+``` bash
+lua5.4 verify-uarch-step.lua config-nothing-to-do "37056250" "2242" 'log.accesses[7].address = 0x100'
+```
+
+``` text
+lua5.4: verify-uarch-step.lua:27: expected 7th access to write uarch.pc at address 0x400010(4194320)
+stack traceback:
+	[C]: in method 'verify_step_uarch'
+	verify-uarch-step.lua:27: in main chunk
+	[C]: in ?
+```
+
+Starting from `<state_hash_before>`, a true Cartesi Machine uarch would
+have written to `uarch.pc` at `0x400010` for the 7th access, not at
+`0x100` as our corrupt log claims.
+
+Changing the `written` data of the same access fails the access’s
+internal consistency check, because `written` no longer hashes to
+`written_hash`:
+
+``` bash
+lua5.4 verify-uarch-step.lua config-nothing-to-do "37056250" "2242" 'log.accesses[7].written = string.pack("<I8", 0x1234)..string.rep("\0", 24)'
+```
+
+``` text
+lua5.4: verify-uarch-step.lua:27: written data for uarch.pc does not match written hash in 7th access
+stack traceback:
+	[C]: in method 'verify_step_uarch'
+	verify-uarch-step.lua:27: in main chunk
+	[C]: in ?
+```
+
+Changing the `read` data of access \#5 (the read of `uarch.x17`) fails
+the same consistency check on the read side, because `read` no longer
+hashes to `read_hash`:
+
+``` bash
+lua5.4 verify-uarch-step.lua config-nothing-to-do "37056250" "2242" 'log.accesses[5].read = string.pack("<I8", 0x1234)..string.rep("\0", 24)'
+```
+
+``` text
+lua5.4: verify-uarch-step.lua:27: read data for uarch.x17 does not match read hash in 5th access
+stack traceback:
+	[C]: in method 'verify_step_uarch'
+	verify-uarch-step.lua:27: in main chunk
+	[C]: in ?
+```
+
+Updating `read_hash` to match the tampered `read` passes the internal
+consistency check, but the verifier still combines `read_hash` with the
+proof’s `sibling_hashes` to reconstruct the state hash before the
+access. That reconstruction no longer matches the expected root:
+
+``` bash
+lua5.4 verify-uarch-step.lua config-nothing-to-do "37056250" "2242" 'local a = log.accesses[5]; a.read = string.pack("<I8", 0x1234)..string.rep("\0", 24); a.read_hash = cartesi.keccak256(a.read)'
+```
+
+``` text
+lua5.4: verify-uarch-step.lua:27: siblings and read hash do not match root hash before 5th access to uarch.x17
+stack traceback:
+	[C]: in method 'verify_step_uarch'
+	verify-uarch-step.lua:27: in main chunk
+	[C]: in ?
+```
+
+In a nutshell, only valid state transitions are accepted by the
+`machine:verify_step_uarch()` method.
+
+# The guest perspective
+
+The goal of the guest perspective is to serve both guest
+application-developers and guest system-developers. The documentation
+therefore starts from the familiar Linux environment that runs inside
+Cartesi Machines. This is the abstraction level at which guest
+application-developers interact with Cartesi Machines. The documentation
+then moves towards the system architecture implemented by Cartesi
+Machines, including Cartesi-specific extensions to the RISC-V
+architecture. This is what surrounds the Linux environment, and is the
+abstraction level at which guest system-developers work.
+
+This is, of course, not the most natural order for presenting the
+material. After all, running the Linux environment experienced by
+application-developers is only possible after successful initialization
+of the Linux kernel, which in turn depends on knowledge of the system
+architecture. However, presenting the material bottom-up would
+quickly alienate application developers. Since there are many more
+application developers than system developers, we cater to the former.
+
+## Linux environment
+
+> [!NOTE]
+>
+> [The host perspective](#the-host-perspective) section describes in
+> detail the `cartesi-machine` command-line utility and the general
+> structure of Cartesi Machines. In order to avoid repetition, this
+> section assumes familiarity with the material presented there.
+
+The most direct way for guest developers to familiarize themselves with
+the Linux environment is to run the Cartesi Machine emulator in
+interactive mode. The `cartesi/machine-emulator-docs` Docker image comes
+pre-installed with the emulator, the default kernel and root
+file-system, and the host-side tooling used by the examples in this
+documentation (`xgenext2fs`, `pandoc`, the `e2tools` family, and
+assorted shell utilities). Inside that image, the following command
+instructs the emulator to load the default machine configuration and run
+a shell in interactive mode
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    -i \
+    -- sh
+```
+
+Once executed, the Cartesi Machine boots Linux and drops into an
+interactive shell (the `sh` argument in the command-line).
+
+``` text
+$ ls /bin
+'['			   gunzip	      rgrep
+ addpart		   gzexe	      rm
+ apt			   gzip		      rmdir
+ apt-cache		   hardlink	      rollup
+ apt-cdrom		   head		      rollup-http-server
+ apt-config		   hex		      rollup-init
+ apt-get		   hostid	      run-parts
+ apt-key		   hostname	      runcon
+ apt-mark		   iconv	      savelog
+...
+```
+
+The session shows a user listing the contents of `/bin/`, then leaving
+the emulator by pressing Ctrl+D at the prompt. The point of the exercise
+is that, from the inside, the environment will be familiar to any
+regular Unix user.
+
+One of the key differences is that, unlike stand-alone systems, many
+embedded systems are not self-hosting. None of the utilities visible
+inside the `/usr/bin/` and `/bin/` directories were built with a
+compiler that ran inside a Cartesi Machine. They were built in a
+separate host system, on which a cross-compiling toolchain for the
+target architecture has been installed. In the case of Linux, the key
+elements in the toolchain are the GNU Compiler Collection and the GNU C
+Library. Support for RISC-V is upstream in the official [GCC compiler
+collection](https://gcc.gnu.org/). The Rust language toolchain likewise
+supports RISC-V natively through [`rustup`](https://rustup.rs/). The
+examples below pull both toolchains in on demand via a multi-stage
+Docker build, so the only host-side prerequisite is `docker buildx`.
+
+### Building a custom root file-system
+
+To run a custom guest application inside the emulator, the most natural
+approach is to build a custom root file-system that replaces the default
+`rootfs.ext2`. The custom image contains the guest application alongside
+the Cartesi guest tools and any runtime dependencies.
+
+Once a custom image is in hand, there are two ways to put it in front of
+the emulator. A given `cartesi-machine` invocation can use
+`--flash-drive=label:root,data_filename:<path>.ext2` to override the
+default root flash drive with the file at `<path>`. The `root` label
+matches the label that `cartesi-machine` assigns to the default root
+flash drive, so this flag wins over the kernel-supplied default for the
+lifetime of that invocation. Alternatively, the file can be installed at
+`/usr/share/cartesi-machine/images/rootfs.ext2` (or symlinked there) so
+that every invocation picks it up by default.
+
+The example we work through here is the `rootfs-docs.ext2` image used by
+the `cartesi/machine-emulator-docs` Docker image as its `rootfs.ext2`.
+It contains a few small “Hello world!” programs in different languages,
+plus the `puppet` libcmt-rollup guest application used in the
+[rolling-machines walk-through](#rolling-cartesi-machines). The docs
+image installs it via the second mechanism above (`rootfs.ext2`
+symlinked to `rootfs-docs.ext2`), so the rest of this section can invoke
+`cartesi-machine` with no flash-drive override.
+
+Building the rootfs requires two host-side steps. The first assembles
+the rootfs with
+`docker buildx build --platform=linux/riscv64 --output type=tar`, which
+uses binfmt and QEMU to emulate riscv64 and emits the result as a flat
+tarball. The second converts the tarball into an ext2 image with
+[`xgenext2fs`](https://github.com/cartesi/genext2fs), which must be
+installed on the host (release `v1.5.6` or newer).
+
+> [!NOTE]
+>
+> The fourth stage of the multi-stage Dockerfile runs natively on
+> `riscv64` through `binfmt_misc` and QEMU emulation. Depending on your
+> host platform’s hardware (e.g., building on x86_64 vs. Apple Silicon),
+> emulating RISC-V instructions during package installation and setup
+> can introduce considerable execution overhead, leading to noticeably
+> slower build times.
+
+The Dockerfile below illustrates the approach with a four-stage build.
+The first stage cross-compiles a C17 and a C++23 “Hello world!” program
+using `g++-14-riscv64-linux-gnu` from the Ubuntu archives, and the
+`puppet` libcmt-rollup guest application against the headers and shared
+library shipped by `machine-guest-tools` (downloaded as a tarball
+release artifact and extracted into a sysroot inside the build stage).
+The second stage cross-compiles an equivalent Rust program, using
+`rustup` and the same RISC-V GCC as the linker. The third stage
+cross-compiles an equivalent Go program using the upstream `golang`
+Docker image with `GOARCH=riscv64`. The fourth stage runs natively on
+riscv64 (through binfmt and QEMU), installs the Cartesi
+`machine-guest-tools` Debian package alongside `libstdc++6` and a
+handful of scripting language interpreters, and copies the compiled
+binaries and example scripts into `/home/dapp/`. The C, C++, Rust, and
+`puppet` binaries are dynamically linked against the rootfs’s `libc`.
+The `puppet` binary also dynamically links to `libcmt.so`, which the
+`machine-guest-tools` Debian package installs at `/usr/lib/libcmt.so`
+inside the rootfs. The Go binary is fully static. The scripts depend on
+their interpreters being present.
+
+``` dockerfile
+ARG UBUNTU_TAG=24.04
+ARG UBUNTU_DIGEST=sha256:c4a8d5503dfb2a3eb8ab5f807da5bc69a85730fb49b5cfca2330194ebcc41c7b
+ARG RUST_TAG=1.83-slim
+ARG RUST_DIGEST=sha256:540c902e99c384163b688bbd8b5b8520e94e7731b27f7bd0eaa56ae1960627ab
+ARG GO_TAG=1.23-bookworm
+ARG GO_DIGEST=sha256:167053a2bb901972bf2c1611f8f52c44d5fe7e762e5cab213708d82c421614db
+ARG UBUNTU_SNAPSHOT=20260421T000000Z
+ARG MACHINE_GUEST_TOOLS_VERSION=0.18.0-test4
+ARG MACHINE_GUEST_TOOLS_DEB_SHA256=066ce57d039eada31159dce3a1e0704f3e7518f4828e66339b2a326d73a2e928
+ARG MACHINE_GUEST_TOOLS_TARGZ_SHA256=65b0a076a9b8a362b300eae2636cca0abe9500eeabfaee13e5cfa7723af5a0c0
+ARG DEBIAN_FRONTEND=noninteractive
+
+# Stage 1: cross-compile the C and C++ programs on the host architecture.
+FROM --platform=$BUILDPLATFORM ubuntu:${UBUNTU_TAG}@${UBUNTU_DIGEST} AS c-cpp-builder
+ARG DEBIAN_FRONTEND
+ARG MACHINE_GUEST_TOOLS_VERSION
+ARG MACHINE_GUEST_TOOLS_TARGZ_SHA256
+ARG UBUNTU_SNAPSHOT
+RUN apt-get update && \
+    apt-get install -y --no-install-recommends ca-certificates && \
+    apt-get update --snapshot=${UBUNTU_SNAPSHOT} && \
+    apt-get install -y --no-install-recommends g++-14-riscv64-linux-gnu && \
+    rm -rf /var/lib/apt/lists/*
+ADD --checksum=sha256:${MACHINE_GUEST_TOOLS_TARGZ_SHA256} \
+    https://github.com/cartesi/machine-guest-tools/releases/download/v${MACHINE_GUEST_TOOLS_VERSION}/machine-guest-tools_riscv64.tar.gz \
+    /tmp/machine-guest-tools_riscv64.tar.gz
+RUN mkdir -p /sysroot && \
+    tar -xzf /tmp/machine-guest-tools_riscv64.tar.gz -C /sysroot && \
+    rm -f /tmp/machine-guest-tools_riscv64.tar.gz
+COPY hello/hello.c   /work/hello.c
+COPY hello/hello.cpp /work/hello.cpp
+COPY puppet.c        /work/puppet.c
+RUN riscv64-linux-gnu-gcc-14 -O2 -std=c17   -o /work/hello-c   /work/hello.c && \
+    riscv64-linux-gnu-g++-14 -O2 -std=c++23 -o /work/hello-cpp /work/hello.cpp && \
+    riscv64-linux-gnu-gcc-14 -O2 -std=c17 \
+        -I/sysroot/usr/include -L/sysroot/usr/lib \
+        -o /work/puppet /work/puppet.c -lcmt
+
+# Stage 2: cross-compile the Rust program on the host architecture.
+FROM --platform=$BUILDPLATFORM rust:${RUST_TAG}@${RUST_DIGEST} AS rust-builder
+ARG DEBIAN_FRONTEND
+RUN apt-get update && \
+    apt-get install -y --no-install-recommends gcc-riscv64-linux-gnu libc6-dev-riscv64-cross && \
+    rm -rf /var/lib/apt/lists/* && \
+    rustup target add riscv64gc-unknown-linux-gnu
+WORKDIR /work
+RUN cargo init --name hello-rust --vcs none .
+COPY hello/hello.rs /work/src/main.rs
+ENV CARGO_TARGET_RISCV64GC_UNKNOWN_LINUX_GNU_LINKER=riscv64-linux-gnu-gcc
+RUN cargo build --release --target riscv64gc-unknown-linux-gnu
+
+# Stage 3: cross-compile the Go program on the host architecture.
+FROM --platform=$BUILDPLATFORM golang:${GO_TAG}@${GO_DIGEST} AS go-builder
+WORKDIR /work
+COPY hello/hello.go /work/hello.go
+ENV GOARCH=riscv64 GOOS=linux CGO_ENABLED=0
+RUN go build -ldflags="-s -w" -o /work/hello-go /work/hello.go
+
+# Stage 4: assemble the rootfs by emulating riscv64 through binfmt+QEMU.
+# The platform is set by `--platform=linux/riscv64` on the buildx invocation.
+FROM ubuntu:${UBUNTU_TAG}@${UBUNTU_DIGEST} AS rootfs
+ARG DEBIAN_FRONTEND
+ARG MACHINE_GUEST_TOOLS_VERSION
+ARG MACHINE_GUEST_TOOLS_DEB_SHA256
+ARG UBUNTU_SNAPSHOT
+ADD --checksum=sha256:${MACHINE_GUEST_TOOLS_DEB_SHA256} \
+    https://github.com/cartesi/machine-guest-tools/releases/download/v${MACHINE_GUEST_TOOLS_VERSION}/machine-guest-tools_riscv64.deb \
+    /tmp/
+RUN apt-get update && \
+    apt-get install -y --no-install-recommends ca-certificates && \
+    apt-get update --snapshot=${UBUNTU_SNAPSHOT} && \
+    apt-get install -y --no-install-recommends \
+        /tmp/machine-guest-tools_riscv64.deb \
+        libstdc++6 \
+        bc curl device-tree-compiler gforth jq lua5.4 lua-socket \
+        python3-minimal tcl && \
+    apt-get purge -y --auto-remove ca-certificates && \
+    rm -f /var/cache/ldconfig/aux-cache && \
+    rm -rf /var/log/* && \
+    rm -rf /var/lib/apt/lists/* /tmp/machine-guest-tools_riscv64.deb
+
+# RUN apt-get update && \
+#     apt-get install -y --no-install-recommends nodejs ruby php-cli && \
+#     rm -rf /var/lib/apt/lists/*
+
+COPY --from=c-cpp-builder /work/hello-c                                               /home/dapp/hello-c
+COPY --from=c-cpp-builder /work/hello-cpp                                             /home/dapp/hello-cpp
+COPY --from=c-cpp-builder /work/puppet                                                /home/dapp/puppet
+COPY --from=rust-builder  /work/target/riscv64gc-unknown-linux-gnu/release/hello-rust /home/dapp/hello-rust
+COPY --from=go-builder    /work/hello-go                                              /home/dapp/hello-go
+COPY hello/hello.4th /home/dapp/hello.4th
+COPY hello/hello.awk /home/dapp/hello.awk
+COPY hello/hello.js  /home/dapp/hello.js
+COPY hello/hello.lua /home/dapp/hello.lua
+COPY hello/hello.pl  /home/dapp/hello.pl
+COPY hello/hello.php /home/dapp/hello.php
+COPY hello/hello.py  /home/dapp/hello.py
+COPY hello/hello.rb  /home/dapp/hello.rb
+COPY hello/hello.sh  /home/dapp/hello.sh
+COPY hello/hello.tcl /home/dapp/hello.tcl
+COPY hello/all.sh    /home/dapp/all.sh
+RUN chmod +x /home/dapp/hello-c /home/dapp/hello-cpp /home/dapp/hello-rust /home/dapp/hello-go /home/dapp/puppet /home/dapp/hello.* /home/dapp/all.sh && \
+    chown -R dapp:dapp /home/dapp
+```
+
+The C source compiled in the first stage is the ubiquitous “Hello
+world!” program, printing 5 lines:
+
+``` c
+#include <stdio.h>
+
+int main(void) {
+    for (int i = 1; i <= 5; i++) {
+        printf("%d: Hello world from C!\n", i);
+    }
+}
+```
+
+The C++ counterpart:
+
+``` cpp
+#include <print>
+
+int main() {
+    for (int i = 1; i <= 5; i++) {
+        std::println("{}: Hello world from C++!", i);
+    }
+}
+```
+
+The same stage also cross-compiles `puppet`, the libcmt-rollup guest
+application used in the rolling-machines walk-through. Its source is
+shown under [The libcmt library](#the-libcmt-library).
+
+The second step converts the tarball into an ext2 image:
+
+``` bash
+#!/bin/sh
+set -eu
+
+# Cross-compile the dapp and assemble the rootfs as a flattened tarball.
+docker buildx build --platform=linux/riscv64 \
+    --output type=tar,dest=rootfs-docs.tar \
+    -f Dockerfile.rootfs-docs .
+
+# Convert the tarball into an ext2 image.
+xgenext2fs -fzB 4096 -i 4096 -r +4000 \
+    -a rootfs-docs.tar -L docs rootfs-docs.ext2
+rm -f rootfs-docs.tar
+```
+
+The two additional flags here, relative to the base set introduced
+above, are `-r +4000` (reserve 4000 extra free blocks so the running
+system has room to write into the rootfs) and `-L docs` (ext2 volume
+label).
+
+### Guest “Hello world!”
+
+The C++ program can now be run inside the emulator. (The
+`machine-guest-tools` package post-install script creates the `dapp`
+Unix user, so the compiled binaries and example scripts will reside in
+`/home/dapp/`.)
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    -- /home/dapp/hello-cpp
+```
+
+The output is
+
+``` text
+1: Hello world from C++!
+2: Hello world from C++!
+3: Hello world from C++!
+4: Hello world from C++!
+5: Hello world from C++!
+
+Halted
+Cycles: 55539025
+```
+
+The Dockerfile’s second stage cross-compiles the following Rust program:
+
+``` rust
+fn main() {
+    for i in 1..6 {
+        println!("{}: Hello world from Rust!", i);
+    }
+}
+```
+
+The `rust-builder` stage runs
+`rustup target add riscv64gc-unknown-linux-gnu` and
+`cargo build --release --target riscv64gc-unknown-linux-gnu`, with
+`riscv64-linux-gnu-gcc` (from the `gcc-riscv64-linux-gnu` package) as
+the linker. The resulting binary is placed in `/home/dapp/hello-rust`.
+
+The Dockerfile’s third stage cross-compiles the following Go program:
+
+``` go
+package main
+
+import "fmt"
+
+func main() {
+	for i := 1; i <= 5; i++ {
+		fmt.Printf("%d: Hello world from Go!\n", i)
+	}
+}
+```
+
+The `go-builder` stage builds with
+`GOARCH=riscv64 GOOS=linux CGO_ENABLED=0`, which uses Go’s built-in
+cross-compilation toolchain to produce a fully-static binary. The
+resulting binary is placed in `/home/dapp/hello-go`.
+
+The rootfs also includes a selection of scripting language interpreters
+from the Ubuntu archives, so the same “Hello world!” can be realized in
+any of them:
+
+``` forth
+: main 6 1 do i 0 .r ." : Hello world from Forth!" cr loop ;
+main bye
+```
+
+``` awk
+#!/usr/bin/awk -f
+BEGIN {
+    for (i = 1; i <= 5; i++) {
+        printf "%d: Hello world from AWK!\n", i
+    }
+}
+```
+
+``` js
+#!/usr/bin/env node
+
+for (var i = 0; i < 5; i++) {
+    console.log((i+1) + ": Hello world from JavaScript!")
+}
+```
+
+``` lua
+#!/usr/bin/env lua5.4
+
+for i = 1, 5 do
+    print(i .. ": Hello world from Lua!")
+end
+```
+
+``` perl
+#!/usr/bin/env perl
+
+for my $i (1..5){
+	print("$i: Hello world from Perl!\n");
+}
+```
+
+``` php
+#!/usr/bin/env php
+<?php
+for ($i = 1; $i <= 5; $i++) {
+    print "$i: Hello world from PHP!\n";
+}
+?>
+```
+
+``` python
+#!/usr/bin/env python3
+
+for i in range(0,5):
+    print("{}: Hello world from Python3".format(i+1))
+```
+
+``` ruby
+#!/usr/bin/env ruby
+
+for i in 1..5 do
+    puts "%d: Hello world from Ruby!" % i
+end
+```
+
+``` bash
+#!/bin/sh
+
+for i in $(seq 1 5); do
+    echo "$i: Hello world from sh!"
+done
+```
+
+``` tcl
+#!/usr/bin/env tclsh
+
+for {set i 1} {$i <= 5} {incr i} {
+    puts "$i: Hello world from TCL!"
+}
+```
+
+The following shell script runs the examples one after another. In order
+not to bloat our example image, the heaviest interpreters were left out
+(Node.js, Ruby, and PHP). To add them back, uncomment the corresponding
+lines in the Dockerfile and in the `all.sh` script.
+
+``` bash
+#!/bin/sh
+
+cd $(dirname $0)
+
+./hello-c
+./hello-cpp
+./hello-rust
+./hello-go
+gforth hello.4th
+./hello.awk
+./hello.lua
+./hello.pl
+./hello.py
+./hello.sh
+./hello.tcl
+#./hello.js
+#./hello.rb
+#./hello.php
+```
+
+Running it inside the custom rootfs:
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    -- /home/dapp/all.sh
+```
+
+The output is
+
+``` text
+1: Hello world from C!
+2: Hello world from C!
+3: Hello world from C!
+4: Hello world from C!
+5: Hello world from C!
+1: Hello world from C++!
+2: Hello world from C++!
+3: Hello world from C++!
+4: Hello world from C++!
+5: Hello world from C++!
+1: Hello world from Rust!
+2: Hello world from Rust!
+3: Hello world from Rust!
+4: Hello world from Rust!
+5: Hello world from Rust!
+1: Hello world from Go!
+2: Hello world from Go!
+3: Hello world from Go!
+4: Hello world from Go!
+5: Hello world from Go!
+1: Hello world from Forth!
+2: Hello world from Forth!
+3: Hello world from Forth!
+4: Hello world from Forth!
+5: Hello world from Forth!
+1: Hello world from AWK!
+2: Hello world from AWK!
+3: Hello world from AWK!
+4: Hello world from AWK!
+5: Hello world from AWK!
+1: Hello world from Lua!
+2: Hello world from Lua!
+3: Hello world from Lua!
+4: Hello world from Lua!
+5: Hello world from Lua!
+1: Hello world from Perl!
+2: Hello world from Perl!
+3: Hello world from Perl!
+4: Hello world from Perl!
+5: Hello world from Perl!
+1: Hello world from Python3
+2: Hello world from Python3
+3: Hello world from Python3
+4: Hello world from Python3
+5: Hello world from Python3
+1: Hello world from sh!
+2: Hello world from sh!
+3: Hello world from sh!
+4: Hello world from sh!
+5: Hello world from sh!
+1: Hello world from TCL!
+2: Hello world from TCL!
+3: Hello world from TCL!
+4: Hello world from TCL!
+5: Hello world from TCL!
+
+Halted
+Cycles: 188033613
+```
+
+The take-away message is that developers can use the tools they are most
+familiar with to accomplish the task at hand.
+
+### Flash drives and NVRAMs
+
+Flash drives and NVRAMs are simply regions of physical memory accessible
+to the guest through different Linux drivers.
+
+Flash drives use the persistent-memory block-device driver
+`pmem-region`, which makes them accessible as block devices `/dev/pmem0`
+to `/dev/pmem7`. The initialization script added by `cartesi-machine` to
+the `machine_config` field `dtb.init` mounts any labeled flash drive
+containing a valid file-system at `/mnt/<label>`. In this fashion,
+file-systems present in all flash drives become available for use.
+
+The default kernel command-line parameter contains the substring
+`root=/dev/pmem0 rw`, which declares that the root file-system resides
+in device `/dev/pmem0`, i.e., flash drive 0, and that it should be
+mounted read-write.
+
+NVRAMs are raw byte buffers for guest code that needs unstructured
+memory without a file-system layer. They are backed by UIO devices,
+through driver `generic-uio`, and are accessible inside the guest as
+`/dev/uio0` to `/dev/uio7`. Unlike with flash drives, there is no page
+cache between the guest and the underlying memory range.
+
+Custom labels for flash drives and NVRAMs are published in the DTB
+`/aliases` node. The node also carries the auto-assigned aliases
+`flashdrive0` to `flashdrive7` and `nvram0` to `nvram7`. The `root`
+label is added by the `cartesi-machine` command-line utility as the
+custom label for `/dev/pmem0`. The command-line utilities `flashdrive`,
+`nvram`, and `memoryrange`, installed by `machine-guest-tools`, can
+translate these labels to the corresponding devices and their extents in
+physical memory.
+
+A flash drive or NVRAM holds whatever data is made available by the
+emulator in the corresponding guest physical memory region. The data can
+come from an image file specified during machine instantiation, from an
+image file specified after instantiation via
+`machine:replace_memory_range(<memory_range_config>)`, or through the
+external state access method `machine:write_memory()`. Additionally, the
+`readmmap` and `writemmap` utilities can read and write NVRAM or
+flash-drive ranges by label.
+
+Some scripting languages, like the Lua programming language, have
+packing and unpacking libraries that can be very helpful for structured
+data.
+
+For example, the previously discussed [arbitrary-precision calculator
+Cartesi Machine](#cartesi-machine-templates) is given the entrypoint
+
+``` bash
+$'readmmap input | lua5.4 -e \'print((string.unpack("z", io.read("a"))))\' | bc | writemmap output'
+```
+
+The input is a null-terminated string containing the expression to be
+evaluated. This string is stored inside an NVRAM with label `input`. The
+output is once again a null-terminated string with the result, this time
+stored inside an NVRAM with label `output`.
+
+The `readmmap input` command therefore reads the entire 4KiB of the
+input NVRAM and sends it to the standard output. The second command,
+`lua5.4 -e 'print((string.unpack("z", io.read("a"))))'` extracts the
+first null-terminated string and prints it to standard out. This is the
+meaning of the `"z"` format argument to the `string.unpack()` function.
+There are a variety of other formats available, including reading
+integers of different sizes, big- or little-endian etc. Please see the
+[documentation for the
+`string.unpack()`](https://www.lua.org/manual/5.4/manual.html#6.4.2)
+function for more details. The string is received by the `bc`
+command-line utility. In the example, that string is
+`6*2^1024 + 3*2^512\n`. The `bc` command-line utility computes the value
+of the expression and sends it to standard out. This is finally received
+by `writemmap output`, which writes it to the output NVRAM. (No need to
+null-terminate, since the NVRAM is already completely filled with
+zeros.)
+
+### Initialization
+
+Earlier versions of the emulator booted from a `rom.bin` image whose
+main purpose was to build, inside the guest itself, a [device
+tree](https://www.devicetree.org/) describing the hardware. Starting
+with version 0.16, the emulator builds the device tree in the host, at
+instantiation, derived from the machine configuration, and stores it in
+the DTB memory range immediately below RAM. The hart starts execution
+directly at the beginning of RAM (address `0x80000000`), where the RAM
+image is loaded. The start address of the DTB memory range
+(`0x7ff00000`) is pre-loaded in register `a1`, per the conventional
+RISC-V boot ABI.
+
+The Cartesi-provided `linux.bin` image is an OpenSBI `fw_payload`
+bundle, a small machine-mode firmware that exposes the Supervisor Binary
+Interface to Linux, linked together with the kernel. The firmware
+occupies the first 512KiB of RAM, declared as a no-map region in the
+device tree so the kernel does not touch it. OpenSBI initializes itself,
+then hands control to the kernel, passing along the address it received
+in `a1`. The kernel reads the device tree, loads drivers, and finishes
+its own initialization.
+
+When kernel initialization is complete, the kernel mounts the device
+named by the `root=` parameter, by default `/dev/pmem0`. It then
+executes the program named by `init=`, by default
+`/usr/sbin/cartesi-init`.
+
+The Cartesi-provided `cartesi-init` program sets up a basic Linux
+environment on which applications can run. It mounts `/proc`,
+`/dev/pts`, `/dev/shm`, `/sys`, `/tmp`, and `/run`, and sources any
+drop-in scripts under `/etc/cartesi-init.d/`. Next, it sources (as
+`root`) the script it reads from the device-tree node
+`/cartesi-machine/init`, which the emulator has filled from the contents
+of the `machine_config` at `dtb.init`. (The `cartesi-machine` utility
+adds there a script to mount each labeled flash drive carrying a
+recognized file-system at `/mnt/<label>`.) Finally, `cartesi-init` reads
+the entrypoint string from the device tree at
+`/cartesi-machine/entrypoint`, which the emulator fills from
+`machine_config` at `dtb.entrypoint`, and executes it in a shell, by
+default as user `dapp`. (This is where `cartesi-machine` puts the
+commands it finds after the `--` separator in the command-line.)
+
+Given a proper rootfs and an appropriate entrypoint, applications can
+run any general computation, consuming input from flash drives or NVRAMs
+and writing outputs to flash drives or NVRAMs, or run a Rolling Cartesi
+Machine loop that uses the `/dev/cmio` device to read inputs and write
+outputs (see below). When the application exits, control returns to
+`cartesi-init`, which unmounts file-systems and gracefully halts the
+machine.
+
+### Communication between guest and host
+
+Guest applications inside a Cartesi Machine drive the rollups model by
+issuing requests to the yield sub-device of HTIF, the Cartesi Machine’s
+host-guest communication device. HTIF itself and its yield sub-device
+are described later, under the System architecture chapter. The
+Cartesi-extended Linux kernel produced by
+[`machine-linux-image`](https://github.com/cartesi/machine-linux-image)
+exposes the rollups communication protocol to user-space through a
+single character device file, `/dev/cmio`.
+
+Guest applications interact with `/dev/cmio` through one of four layers,
+in decreasing order of convenience. When available, the preferred path
+is a language binding of the `libcmt` library included in
+[`machine-guest-tools`](https://github.com/cartesi/machine-guest-tools).
+C and C++ can use libcmt directly. In the future, other language
+ecosystems (Rust, Go, JavaScript, Python, Lua, and so on) will wrap
+libcmt and expose the rollups interface idiomatically. In the meantime,
+applications written in languages without a libcmt binding talk to the
+device through the `/usr/bin/rollup-http-server` daemon, which
+translates HTTP requests into libcmt operations. For shell-driven
+workflows, `machine-guest-tools` also includes the `/usr/bin/rollup`
+command-line utility, a libcmt consumer that exposes single libcmt
+operations on standard input and standard output. And for the
+adventurous, or for tooling that needs to talk to the device directly
+for testing or debugging, the raw `/dev/cmio` `ioctl` interface itself
+is documented at the bottom of this section, alongside the lower-level
+`/usr/bin/yield` command-line utility.
+
+When the application yields, the emulator returns control to the host.
+The host either provides a new input to the guest application, or
+processes an output generated by it. Manual yields require the host to
+reset the `iflags_Y` register before the machine can resume. Automatic
+yields briefly set the `iflags_X` register, which the emulator clears on
+the next instruction.
+
+#### The libcmt library
+
+The libcmt library comes with the `machine-guest-tools` package,
+installed in the rootfs as `/usr/lib/libcmt.{so,a}` with public headers
+under `/usr/include/libcmt/`. The high-level rollups loop lives in
+`rollup.h`. The supporting headers (`abi.h`, `buf.h`, `io.h`,
+`keccak.h`, `merkle.h`, `util.h`) exist mostly to back it.
+
+The `rollup.h` API mirrors the lifecycle of a guest application.
+`cmt_rollup_init()` opens `/dev/cmio` and maps the receive and transmit
+buffers. `cmt_rollup_finish()` accepts or rejects the previous request
+and blocks until the next one arrives. A field in the returned
+`cmt_rollup_finish_t` indicates whether the new request is an
+`HTIF_YIELD_REASON_ADVANCE_STATE` or an
+`HTIF_YIELD_REASON_INSPECT_STATE`. For an advance,
+`cmt_rollup_read_advance_state()` decodes the ABI-encoded
+`EvmAdvance(uint256 chainId, address appContract, address msgSender, uint256 blockNumber, uint256 blockTimestamp, uint256 prevRandao, uint256 index, bytes payload)`
+calldata blob from the CMIO RX buffer into a `cmt_rollup_advance_t`
+struct with one field per parameter. For an inspect,
+`cmt_rollup_read_inspect_state()` returns just the payload.
+
+While processing a request, the application emits zero or more outputs.
+`cmt_rollup_emit_voucher()`, `cmt_rollup_emit_delegate_call_voucher()`,
+`cmt_rollup_emit_notice()`, `cmt_rollup_emit_report()`, and
+`cmt_rollup_emit_exception()` emit the named output.
+`cmt_rollup_progress()` reports a per-mille progress value as an
+automatic yield. The rules of the request/response protocol and the
+meaning of each output type are spelled out under Rolling Cartesi
+Machines, in the host-side chapter. Finally, `cmt_rollup_fini()` tears
+down the mappings and closes the device.
+
+The `puppet` guest application is a small libcmt rollup loop whose
+advance-state payloads are commands. In roughly fifty lines, it exercises
+the notice, report, voucher, and exception emit calls of `rollup.h`.
+
+``` c
+/* Puppet: a libcmt rollup target driven by its inputs.
+ *
+ * Each advance-state payload is a command of the form "verb:data" (or
+ * a bare verb without a colon).  The verb selects the libcmt call; the
+ * data after the colon is the bytes the call receives.
+ *
+ *   notice:<data>     -> cmt_rollup_emit_notice(data), accept
+ *   report:<data>     -> cmt_rollup_emit_report(data), accept
+ *   voucher:<data>    -> cmt_rollup_emit_voucher(msg_sender, 0, data),
+ *                        accept
+ *   exception:<data>  -> cmt_rollup_emit_exception(data); halts
+ *   exit              -> break out of the loop and return from main;
+ *                        the machine halts on its own
+ *   <anything else>   -> reject the advance; the host rolls the state
+ *                        back
+ *
+ * An inspect-state query is echoed back as a single report, accepted.
+ */
+
+#include <string.h>
+#include "libcmt/rollup.h"
+
+static int verb_match(const cmt_abi_bytes_t *payload, const char *verb, cmt_abi_bytes_t *data) {
+    size_t verb_len = strlen(verb);
+    if (payload->length < verb_len) return 0;
+    if (memcmp(payload->data, verb, verb_len) != 0) return 0;
+    if (payload->length == verb_len) {
+        data->data = NULL;
+        data->length = 0;
+        return 1;
+    }
+    if (((const char *) payload->data)[verb_len] != ':') return 0;
+    data->data = (char *) payload->data + verb_len + 1;
+    data->length = payload->length - verb_len - 1;
+    return 1;
+}
+
+int main(void) {
+    cmt_rollup_t rollup;
+    if (cmt_rollup_init(&rollup) < 0) return 1;
+
+    cmt_rollup_finish_t finish = { .accept_previous_request = true };
+    if (cmt_rollup_finish(&rollup, &finish) < 0) return 1;
+
+    for (;;) {
+        bool accept = true;
+        bool should_exit = false;
+        if (finish.next_request_type == HTIF_YIELD_REASON_ADVANCE_STATE) {
+            cmt_rollup_advance_t advance;
+            if (cmt_rollup_read_advance_state(&rollup, &advance) < 0) break;
+            cmt_abi_bytes_t data;
+            if (verb_match(&advance.payload, "notice", &data)) {
+                cmt_rollup_emit_notice(&rollup, &data, NULL);
+            } else if (verb_match(&advance.payload, "report", &data)) {
+                cmt_rollup_emit_report(&rollup, &data);
+            } else if (verb_match(&advance.payload, "voucher", &data)) {
+                cmt_abi_u256_t value = {{0}};
+                cmt_rollup_emit_voucher(&rollup, &advance.msg_sender, &value, &data, NULL);
+            } else if (verb_match(&advance.payload, "exception", &data)) {
+                cmt_rollup_emit_exception(&rollup, &data);
+            } else if (verb_match(&advance.payload, "exit", &data) && data.length == 0) {
+                should_exit = true;
+            } else {
+                accept = false;
+            }
+        } else if (finish.next_request_type == HTIF_YIELD_REASON_INSPECT_STATE) {
+            cmt_rollup_inspect_t inspect;
+            if (cmt_rollup_read_inspect_state(&rollup, &inspect) < 0) break;
+            cmt_rollup_emit_report(&rollup, &inspect.payload);
+        }
+        if (should_exit) break;
+        finish.accept_previous_request = accept;
+        if (cmt_rollup_finish(&rollup, &finish) < 0) break;
+    }
+
+    cmt_rollup_fini(&rollup);
+    return 0;
+}
+```
+
+After `cmt_rollup_init` opens the device, the program makes the first
+call to `cmt_rollup_finish` with `accept_previous_request = true`, which
+signals that the guest is ready and blocks for the first request. The
+accept here is not optional: the alternative would have
+`cmt_rollup_finish` ask the host to revert the machine state, which has
+no meaning before any request has been processed. Each subsequent
+advance-state payload is a verb (`notice`, `report`, `voucher`,
+`exception`, or `exit`) optionally followed by `:` and arbitrary data.
+The verb selects a libcmt call to make with that data. `notice:<data>`,
+`report:<data>`, and `voucher:<data>` emit the named output and accept
+the request. `exception:<data>` emits an exception, halting the machine.
+`exit` breaks out of the loop and returns from `main`, and the machine
+halts when `cartesi-init` reaps the process. Any payload that does not
+match a known verb causes the advance-state request to be rejected, so
+the host rolls the state back. For inspect-state requests, the program
+emits a single report echoing the query and accepts. The loop also exits
+when `cmt_rollup_finish` or a `cmt_rollup_read_*` call fails, which is what
+happens when the host signals end of input by halting the machine.
+
+We can drive `puppet` through the same command-line harness used earlier
+for the calculator under [Rolling Cartesi
+Machines](#rolling-cartesi-machines). First, encode two advance-state
+requests and one inspect-state query:
+
+``` bash
+cartesi-rollup-data.lua encode advance > input-1.bin <<EOF
+{
+  "chain_id": 0,
+  "app_contract": "0x0000000000000000000000000000000000000000",
+  "msg_sender": "$(printf '0x%040d' 1)",
+  "block_number": 0,
+  "block_timestamp": 0,
+  "prev_randao": "0x0000000000000000000000000000000000000000000000000000000000000000",
+  "index": 1,
+  "payload": "$(printf 'notice:hello from input 1' | hex --encode)"
+}
+EOF
+cartesi-rollup-data.lua encode advance > input-2.bin <<EOF
+{
+  "chain_id": 0,
+  "app_contract": "0x0000000000000000000000000000000000000000",
+  "msg_sender": "$(printf '0x%040d' 2)",
+  "block_number": 0,
+  "block_timestamp": 0,
+  "prev_randao": "0x0000000000000000000000000000000000000000000000000000000000000000",
+  "index": 2,
+  "payload": "$(printf 'something the puppet does not understand' | hex --encode)"
+}
+EOF
+cartesi-rollup-data.lua encode inspect > query.bin <<EOF
+{
+  "payload": "$(printf 'hello from query!' | hex --encode)"
+}
+EOF
+```
+
+Then run the server and client, instantiating the machine directly from
+`/home/dapp/puppet`:
+
+``` bash
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8086
+```
+
+From a different shell into the same container, run the client
+
+``` bash
+while ! cartesi-machine \
+    --remote-address=127.0.0.1:8086 \
+    --remote-health-check 2>/dev/null; do sleep 1; done
+cartesi-machine \
+    --no-init-splash \
+    --remote-address=127.0.0.1:8086 \
+    --remote-shutdown \
+    --cmio-advance-state=input_index_begin:1,input_index_end:3,hashes \
+    --cmio-inspect-state=hashes \
+    --final-hash \
+    -- /home/dapp/puppet
+```
+
+The payload of `input-1.bin` is `notice:hello from input 1`, so the
+`puppet` emits a single notice and accepts. The payload of `input-2.bin`
+does not match any known verb, so the `puppet` rejects the advance-state
+request and the client rolls the machine state back, discarding any
+side-effects from its processing. The contents of `query.bin` are echoed
+back as a report, and once again the state of the machine reverts after
+the inspect-state request is processed.
+
+The client shell shows
+
+``` text
+Connected to JSONRPC remote cartesi machine at '127.0.0.1:8086'
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 48382220
+
+Before input 1
+48382220: a77e53c14250fc58194d41ada3c0764782d2c1511104dcd241e4880c69989cfd
+48382220: 3a86c464780f438ec0b8cbb566c2dc5db3b381c388afa009b1b282b3726e0e1f
+
+Automatic yield tx-output (2) (0x000064 data)
+Cycles: 48400392
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 50514472
+Storing output-0-input-1.bin
+Storing input-1-output-hashes-root-hash.bin
+Storing input-1-output-hashes-root-hash-proof.lua
+
+Before input 2
+50514472: 77cdb2b3d03a6634f8ada5ae224a86c736a4950dbd13250afcfb495bee44ee7d
+50514472: 10b205e055092cbe69b6ff0bbf953cab6566eaa1261d54605ab0198061429f8e
+
+Manual yield rx-rejected (2) (0x000000 data)
+Cycles: 50518421
+Storing output-0-input-1-proof.lua
+
+Before query
+50514472: 77cdb2b3d03a6634f8ada5ae224a86c736a4950dbd13250afcfb495bee44ee7d
+50514472: 8edc853d7b97dafa37f77b9c7d0d134d7567e99a971f7c0316cc9c5092a034d4
+
+Automatic yield tx-report (4) (0x000011 data)
+Cycles: 50515684
+Storing query-report-0.bin
+
+Manual yield rx-accepted (1) (0x000020 data)
+Cycles: 50516774
+
+After query
+50514472: 77cdb2b3d03a6634f8ada5ae224a86c736a4950dbd13250afcfb495bee44ee7d
+Shutdown JSONRPC remote cartesi machine at '127.0.0.1:8086'
+```
+
+As expected, the yields and state hashes shown here follow the same
+pattern detailed for the calculator under [Rolling Cartesi
+Machines](#rolling-cartesi-machines).
+
+The `cartesi-rollup-data.lua` utility decodes the records the run
+produced. The advance-state request carries the command `puppet` acted
+on
+
+``` bash
+cartesi-rollup-data.lua decode advance < input-1.bin
+```
+
+``` js
+{
+  "chain_id":0,
+  "app_contract":"0x0000000000000000000000000000000000000000",
+  "msg_sender":"0x0000000000000000000000000000000000000001",
+  "block_number":0,
+  "block_timestamp":0,
+  "prev_randao":"0x0000000000000000000000000000000000000000000000000000000000000000",
+  "index":1,
+  "payload":"0x6e6f746963653a68656c6c6f2066726f6d20696e7075742031"
+}
+```
+
+The payload field carries the hex encoding of the bytes
+`notice:hello from input 1`, which the `puppet` parsed as a command to
+emit a notice with payload `hello from input 1`.
+
+Notices and reports carry only a payload, which we recover with
+
+``` bash
+cartesi-rollup-data.lua decode notice < output-0-input-1.bin | jq -j .payload | hex --decode
+```
+
+``` text
+hello from input 1
+```
+
+``` bash
+cartesi-rollup-data.lua decode report < query-report-0.bin | jq -j .payload | hex --decode
+```
+
+``` text
+hello from query!
+```
+
+#### The rollup HTTP server
+
+For guest applications written in languages that have no libcmt binding,
+the `/usr/bin/rollup-http-server` daemon is the practical bridge to
+`/dev/cmio`. The daemon listens on a local HTTP port and translates each
+request it receives into a libcmt operation. The guest application’s
+request/response loop runs in its own language and issues HTTP calls to
+the daemon to advance state, emit outputs, and finish requests.
+
+#### The rollup command-line utility
+
+The `/usr/bin/rollup` utility is a thin libcmt wrapper that exposes
+single libcmt operations on the command line, reading and writing JSON
+on standard input and standard output. It is intended for shell-driven
+demos and tests. Production applications should use either a libcmt
+language binding or `/usr/bin/rollup-http-server` instead. The
+[calculator that evaluates `bc` expressions](#rolling-cartesi-machines)
+earlier in this document drives a `rollup`-based loop from a shell
+script.
+
+For reference, the help text of the `rollup` utility is
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --quiet \
+    -- rollup --help
+```
+
+``` text
+Usage:
+    rollup [command]
+
+  where [command] is one of
+
+    voucher
+      emit a voucher read from stdin as a JSON object in the format
+        {"destination": <address>, "value": <hex-uint256>, "payload": <hex-data>}
+      where
+        <address> contains a 20-byte EVM address in hex,
+        <hex-uint256> contains a big-endian 32-byte unsigned integer in hex, and
+        <hex-data> contains arbitrary data in hex
+      if successful, prints to stdout a JSON object in the format
+        {"index": <number> }
+      where field "index" is the index allocated for the voucher
+
+    delegate-call-voucher
+      emit a delegate call voucher read from stdin as a JSON object in the format
+        {"destination": <address>, "payload": <hex-data>}
+      where
+        <address> contains a 20-byte EVM address in hex,
+        <hex-data> contains arbitrary data in hex
+      if successful, prints to stdout a JSON object in the format
+        {"index": <number> }
+      where field "index" is the index allocated for the voucher
+
+    notice
+      emit a notice read from stdin as a JSON object in the format
+        {"payload": <hex-data> }
+      where
+        <hex-data> contains arbitrary data in hex
+      if successful, prints to stdout a JSON object in the format
+        {"index": <number> }
+      where field "index" is the index allocated for the notice
+
+    report
+      emit a report read from stdin as a JSON object in the format
+        {"payload": <hex-data> }
+      where
+        <hex-data> contains arbitrary data in hex
+
+    finish
+      accept or reject the previous request based on a JSON object
+      read from stdin in the format
+        {"status": <string> }
+      where "status" is either "accept" or "reject".
+
+      print the next request to stdout as a JSON object in the format
+        {"request_type": <request-type>, "data": <request-data>}
+
+      when field "request_type" contains "advance_state",
+      field "data" contains a JSON object in the format
+        {
+          "chain_id": <number>,
+          "app_contract": <address>,
+          "msg_sender": <address>,
+          "block_number": <number>,
+          "block_timestamp": <number>
+          "prev_randao": <hex-uint256>,
+          "index": <number>,
+          "payload": <hex-data>
+        },
+      where
+        <address> contains a 20-byte EVM address in hex,
+        <hex-uint256> contains a big-endian 32-byte unsigned integer in hex, and
+        <hex-data> contains arbitrary data in hex
+
+      when field "request_type" contains "inspect_state",
+      field "data" contains a JSON object in the format
+        {"payload": <hex-data> }
+      where
+        <hex-data> contains arbitrary data in hex
+
+    accept
+      a shortcut for finish with implied input
+        {"status": "accept" }
+      no input is read from stdin
+
+    reject
+      a shortcut for finish with implied input
+        {"status": "reject" }
+      no input is read from stdin
+
+    exception
+      throw an exception read from stdin as a JSON object in the format
+        {"payload": <hex-data> }
+      where
+        <hex-data> contains arbitrary data in hex
+
+    gio
+      performs a generic IO operation request based on a JSON object
+      read from stdin in the format
+        { "domain": <number>, "id": <hex-data> }
+      if successful, prints to stdout a JSON object in the format
+        { "code": <number>, "data": <hex-data> }
+      where
+        <hex-data> contains arbitrary data in hex
+```
+
+#### The /dev/cmio device
+
+The raw `/dev/cmio` character device file is the kernel-level interface
+to the HTIF yield sub-device. Most users should not interact with it
+directly. Language bindings should be built on top of libcmt rather than
+`/dev/cmio` directly, because libcmt does more than carry traffic
+through the device. It also maintains the output hashes tree that
+Cartesi Rollups relies on to validate the application’s outputs. The
+information that follows is useful for the curious and for tooling that
+needs to talk to the device directly for testing or debugging.
+
+The kernel UAPI header is `<linux/cartesi/cmio.h>`, whose struct
+definitions are the source of truth. The device exposes two `ioctl`
+requests. `IOCTL_CMIO_SETUP` takes a `struct cmio_setup` argument and
+fills it with descriptors for the receive and transmit buffers. The
+caller `mmap`s those buffers once, at startup, and accesses them
+directly thereafter. `IOCTL_CMIO_YIELD` takes a `struct cmio_yield`
+argument and yields control to the host, encoding the yield kind in the
+struct’s fields. The two arguments are roughly
+
+``` c
+struct cmio_setup {
+    struct { uint64_t data; uint64_t length; } tx, rx;
+};
+
+struct cmio_yield {
+    uint8_t  dev;     /* HTIF_DEVICE_YIELD */
+    uint8_t  cmd;     /* HTIF_YIELD_CMD_AUTOMATIC or HTIF_YIELD_CMD_MANUAL */
+    uint16_t reason;
+    uint32_t data;
+};
+```
+
+The `dev` field identifies the HTIF sub-device targeted by the request.
+HTIF distinguishes three sub-devices internally: halt, console, and
+yield. `/dev/cmio` carries only yield-class traffic, so the `dev` field
+must be `HTIF_DEVICE_YIELD`. The `cmd` field selects between an
+automatic yield, where the host resumes the machine without further
+action, and a manual yield, where the host must reset `iflags_Y` before
+the machine can resume. The `reason` field carries one of the constants
+below, and the `data` field carries an auxiliary 32-bit value whose
+meaning is reason-specific.
+
+The reasons paired with `HTIF_YIELD_CMD_AUTOMATIC` are
+`HTIF_YIELD_AUTOMATIC_REASON_PROGRESS` (the `data` field carries a
+per-mille progress value), `HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT` (a
+voucher, delegate-call voucher, or notice has been written to the
+transmit buffer), and `HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT` (a report
+has been written to the transmit buffer).
+
+The reasons paired with `HTIF_YIELD_CMD_MANUAL` are
+`HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED` (the application has accepted the
+previous request and is ready for the next, and the host sets the `reason`
+field on resume to `HTIF_YIELD_REASON_ADVANCE_STATE` or
+`HTIF_YIELD_REASON_INSPECT_STATE` to indicate the type of the freshly
+loaded input in the receive buffer, with its length in the `data` field),
+`HTIF_YIELD_MANUAL_REASON_RX_REJECTED` (the application has rejected the
+previous request, and the host reverts the machine state and replies
+with the next request as above), and
+`HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION` (the application has emitted an
+exception payload to the transmit buffer and the machine cannot
+continue).
+
+For convenience, `machine-guest-tools` also includes a `/usr/bin/yield`
+utility that sends a single yield request from the shell, useful for
+tests and one-off demos. It is a direct wrapper for `IOCTL_CMIO_YIELD`
+and only supports yield-class requests, so it does not send halt or
+console requests to HTIF. Its usage is
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --quiet \
+    -- yield
+```
+
+``` text
+Usage: yield <mode> <reason> [<data>]
+Where: 
+  <mode>       "manual" or "automatic"
+  <reason>     "progress", "rx-accepted", "rx-rejected",
+               "tx-voucher", "tx-notice", "tx-exception" or
+               "tx-report"
+  <data>       32-bit unsigned integer (decimal, default 0)
+```
+
+## System architecture
+
+The RISC-V ISA consists of a minimal integer instruction set to which
+several extensions can be added. The standard defines a privileged
+architecture with features commonly used by modern operating systems,
+such as multiple privilege levels, page-based virtual memory, timers,
+interrupts, exceptions and traps, etc. Implementations are free to
+select the combination of extensions that best suits their needs.
+
+The Cartesi Machine architecture can be separated into a main processor,
+a board, and a microarchitecture (uarch). The processor performs the
+computations, executing the traditional fetch-execute loop while
+maintaining a variety of registers. The board defines the surrounding
+environment with an assortment of memories (RAM, flash drives, NVRAMs,
+CMIO buffers, etc.) and a number of devices. The uarch includes its own
+smaller processor and memory, invisible to the main processor, with full
+access into its inner workings. It can drive the main processor at a
+finer granularity that is suitable for dispute resolution in the context
+of blockchains.
+
+The Cartesi Machine maps its entire state to the physical address space
+in a well-defined way. This includes the internal states of the main
+processor, of the uarch processor, of all attached devices, and the
+contents of all memories. This state completely defines the Cartesi
+Machine.
+
+A full description of the RISC-V ISA is out of the scope of this
+documentation. (See volumes [1 and
+2](https://riscv.org/technical/specifications/) of the ISA specification
+for details.) This section describes the RISC-V architecture of the main
+processor and uarch, the modifications made to support verification, the
+devices supported by the emulator, and the process the machine follows
+to boot the Linux kernel.
+
+### The main processor
+
+Following RISC-V terminology, the Cartesi Machine’s main processor
+implements the `RV64IMAFDCZicsr_Zifencei` ISA. The letters after RV
+specify the extension set. This selection corresponds to a 64-bit
+machine, integer arithmetic with multiplication and division, atomic
+operations, single- and double-precision floating-point arithmetic, and
+compressed instructions, as well as the optional supervisor and user
+privilege levels. In addition, Cartesi Machines support the Sv39 mode of
+address translation and memory protection. Sv39 provides a 39-bit
+protected virtual address space, divided into 4KiB pages, organized by a
+three-level page table. This set of features creates a balanced
+compromise between the simplicity demanded by a blockchain
+implementation and the flexibility expected from off-chain computations.
+
+Even so, the instruction set remains compact. Most instructions are very
+simple and can be emulated in a few lines of high-level code. In
+contrast, the x86 ISA defines at least 2000 (potentially complex)
+instructions. In fact, the only complex operation in RISC-V is the
+virtual-to-physical address translation. Instruction decoding is
+particularly simple due to the reduced number of formats taking 32 or 16
+bits.
+
+The entire processor state fits within 848 bytes, divided into 106
+registers, each holding 64 bits. It consists of 32 general-purpose
+integer registers (`x0`…`x31`), 32 floating-point registers
+(`f0`…`f31`), and 42 standard or Cartesi-specific control registers. The
+last 8 of those control registers persist the externally-visible state
+of the board’s CLINT, PLIC, and HTIF subsystems, which is otherwise also
+reachable through the device-mapped addresses described in the next
+section. The processor makes its entire state available, externally and
+read-only, by mapping every register to the start of the physical
+address space (in the <i>processor shadow</i>, a 4KiB range). The
+mapping is given in the following table:
+
+| Offset  | Register  | Offset  | Register     | Offset  | Register        | Offset  | Register         |
+|---------|-----------|---------|--------------|---------|-----------------|---------|------------------|
+| `0x000` | `x0`      | `0x228` | `mtvec`      | `0x290` | `marchid`       | `0x2f8` | `iflags_X`       |
+| `0x008` | `x1`      | `0x230` | `mscratch`   | `0x298` | `mimpid`        | `0x300` | `iflags_Y`       |
+| `...`   | `...`     | `0x238` | `mepc`       | `0x2a0` | `stvec`         | `0x308` | `iflags_H`       |
+| `0x0f8` | `x31`     | `0x240` | `mcause`     | `0x2a8` | `sscratch`      | `0x310` | `clint_mtimecmp` |
+| `0x100` | `mcycle`  | `0x248` | `mtval`      | `0x2b0` | `sepc`          | `0x318` | `plic_girqpend`  |
+| `0x108` | `pc`      | `0x250` | `misa`       | `0x2b8` | `scause`        | `0x320` | `plic_girqsrvd`  |
+| `0x110` | `fcsr`    | `0x258` | `mie`        | `0x2c0` | `stval`         | `0x328` | `htif_tohost`    |
+| `0x118` | `f0`      | `0x260` | `mip`        | `0x2c8` | `satp`          | `0x330` | `htif_fromhost`  |
+| `0x120` | `f1`      | `0x268` | `medeleg`    | `0x2d0` | `scounteren`    | `0x338` | `htif_ihalt`     |
+| `...`   | `...`     | `0x270` | `mideleg`    | `0x2d8` | `senvcfg`       | `0x340` | `htif_iconsole`  |
+| `0x210` | `f31`     | `0x278` | `mcounteren` | `0x2e0` | `ilrsc`         | `0x348` | `htif_iyield`    |
+| `0x218` | `iprv`    | `0x280` | `menvcfg`    | `0x2e8` | `icycleinstret` |         |                  |
+| `0x220` | `mstatus` | `0x288` | `mvendorid`  | `0x2f0` | `iunrep`        |         |                  |
+
+The only generally relevant standard register is `mcycle`. Since its
+value is advanced at every CPU cycle, it can be used to identify a
+particular step in the computation being performed by a Cartesi Machine.
+This is a key component of the verification process, and can also be
+used to bound the amount of computation.
+
+The registers whose names start with “`i`” are Cartesi additions, and
+have the following semantics:
+
+- Register `iprv` holds the current privilege level (0 for User, 1 for
+  Supervisor, and 3 for Machine).
+- Register `iflags_X` is set to 1 when the processor has yielded
+  automatic. The emulator clears it again as soon as the machine
+  resumes.
+- Register `iflags_Y` is set to 1 when the processor has yielded manual.
+  It remains set until the host clears it (either directly, or as a side
+  effect of `send_cmio_response`).
+- Register `iflags_H` is set to 1 to signal the processor has been
+  permanently halted.
+- Register `ilrsc` holds the reservation address for the LR/SC atomic
+  memory operations.
+- Register `icycleinstret` holds the difference between `mcycle` and the
+  architectural instruction count.
+- Register `iunrep` is non-zero in machines configured as
+  unreproducible, a creation-time mode that enables host VirtIO devices
+  in exchange for giving up state-hash verifiability.
+
+### The microarchitecture
+
+In normal execution (i.e., via `machine:run(<max_mcycle>)`), the Cartesi
+Machine emulator runs programs in an *interpreter* that has been
+compiled to run natively on the host computer. The execution of this
+program modifies the registers and memories and interacts with the
+devices accessible to the main processor. The Cartesi Machine uarch can
+be seen as a lower-level emulator. The uarch is not visible to the main
+processor, but code running in the uarch has access to the entire state
+of the Cartesi Machine, including the main processor and the entire
+board. The same interpreter source-code for the Cartesi Machine that
+runs on the host can also be compiled to a `uarch.bin` binary that runs
+exactly one fetch-execute iteration of the main processor and then halts
+the uarch. In its pristine state, the uarch memory is loaded with this
+`uarch.bin`. Therefore, executing the uarch until it halts, and then
+resetting the uarch to its pristine state, is equivalent to executing
+one instruction of the main processor. This finer granularity enables
+state-transition proofs in architectures, such as blockchains, that lack
+sufficient computation power to reliably verify complex main-processor
+instructions (e.g., floating-point division and square-root,
+virtual-memory page-walks, TLB invalidations, etc.). It also greatly
+reduces the number and complexity of the instructions the blockchain
+must be taught to simulate. See [State-transition
+proofs](#state-transition-proofs) for details.
+
+In contrast to the main processor, the uarch processor implements the
+much more restricted RV64I set. This includes only 52 instructions, the
+implementation of which can be directly translated to run in any
+programmable blockchain. It has 32 general-purpose integer registers
+(`uarch_x0`…`uarch_x31`), a program counter (`uarch_pc`), a cycle
+counter (`uarch_cycle`), and a halt flag (`uarch_halt_flag`). Like the
+main processor, the uarch makes its entire state available, externally
+and read-only, by mapping every register to its own 4KiB <i>uarch
+shadow</i> range. The mapping is given in the following table:
+
+| Offset     | Register          | Offset     | Register    |
+|------------|-------------------|------------|-------------|
+| `0x400000` | `uarch_halt_flag` | `0x400018` | `uarch_x0`  |
+| `0x400008` | `uarch_cycle`     | `0x400020` | `uarch_x1`  |
+| `0x400010` | `uarch_pc`        | `...`      | `...`       |
+|            |                   | `0x400110` | `uarch_x31` |
+
+In addition to being able to access all memory ranges and devices
+visible to the main processor, the uarch includes a private 2MiB of RAM.
+
+### The board
+
+The interaction between board and processor happens through interrupts
+and the memory bus. Devices are mapped to the processor’s physical
+address space. The mapping can be seen in the following table:
+
+| Physical address                                     | Mapping                                    |
+|------------------------------------------------------|--------------------------------------------|
+| `0x00000000-0x00000fff`                              | Processor and board shadow                 |
+| `0x00001000-0x00006fff`                              | Shadow TLB                                 |
+| `0x00010000-0x00010fff`                              | PMA Array                                  |
+| `0x00400000-0x00400fff`                              | Uarch shadow                               |
+| `0x00600000-0x007fffff`                              | Uarch RAM                                  |
+| `0x02000000-0x020bffff`                              | Core Local Interruptor (CLINT)             |
+| `0x40008000-0x40008fff`                              | Host-Target Interface (HTIF)               |
+| `0x40010000-0x4001ffff` (*unreproducible mode only*) | VirtIO devices                             |
+| `0x40100000-0x404fffff`                              | Platform-Level Interrupt Controller (PLIC) |
+| `0x60000000-0x601fffff`                              | CMIO RX buffer                             |
+| `0x60800000-0x609fffff`                              | CMIO TX buffer                             |
+| `0x7ff00000-0x7fffffff`                              | Device tree (DTB)                          |
+| `0x80000000`-`0x80000000`+`ram.length`-1             | RAM                                        |
+| *configurable with constraints*                      | Flash drive or NVRAM 0                     |
+| …                                                    | …                                          |
+| *configurable with constraints*                      | Flash drive or NVRAM 7                     |
+
+Execution starts at the beginning of RAM, where the bootloader (an
+OpenSBI `fw_payload` bundle that wraps the Linux kernel) is loaded from
+`linux.bin`. The amount of RAM is user-configurable, but always starts
+at address `0x80000000`. The DTB occupies a fixed region immediately
+below RAM and carries the kernel command line, the description of every
+other range, and the init/entrypoint scripts.
+
+Flash drives must start after `0x80000000`+`ram.length`-1, end before
+`0x80000000`+64TiB, and be aligned to 2MiB.
+
+NVRAMs have much lighter requirements. Their start and length must be
+aligned to 4KiB page boundaries, but they can otherwise start and end
+anywhere below the 2<sup>56</sup> limit as long as their length is less
+than 128TiB.
+
+> [!NOTE]
+>
+> For the relentlessly curious, here are the reasons for these
+> constraints:
+>
+> Flash drives are exposed via the persistent-memory block-device driver
+> `pmem-region`. The kernel adds this memory to its physical memory map
+> and reaches it through the direct linear mapping, a dedicated region
+> of the kernel’s virtual address space where physical memory is mapped
+> continuously using fixed offsets rather than page-table traversals.
+> Both buffered I/O through the page cache and direct access (DAX) rely
+> on this mapping, so the constraints below hold regardless of how a
+> drive is accessed.
+>
+> The linear mapping begins where RAM begins, at `0x80000000`. A Cartesi
+> Machine fixes RAM at this address because it is the standard RISC-V
+> layout, the 2GiB DRAM base used by QEMU’s `virt` board and expected by
+> firmware such as OpenSBI, with the lower 2GiB reserved for boot and
+> memory-mapped devices. Since those lower addresses are not
+> general-purpose memory, a flash drive must start at `0x80000000` or
+> higher. The kernel caps the mapping at 64TiB, reserving the rest of
+> the Sv48 address space for other kernel subsystems, so a drive must
+> end no later than `0x80000000`+64TiB-1. Finally, a flash drive’s start
+> and length must be multiples of 2MiB, because the kernel brings
+> persistent-memory regions online only in 2MiB subsections and cannot
+> map a region whose start or end falls off that boundary. This is a
+> generic Linux requirement, not something specific to RISC-V or to the
+> Cartesi Machine.
+>
+> UIO devices exposed via the `generic-uio` driver allow user-space
+> applications to directly interact with hardware, bypassing the page
+> cache and the direct linear mapping. The kernel dynamically creates
+> isolated virtual memory mappings for device registers and memory.
+>
+> UIO devices map directly to hardware addresses, so they must start and
+> end below the 2<sup>56</sup> limit, the maximum physical address space
+> supported by Sv48. Their dynamic mappings must align with 4KiB page
+> boundaries, which establishes valid page table entries without
+> altering access permissions for adjacent physical memory. (The Cartesi
+> Machine itself imposes the same alignment constraint.) The maximum
+> contiguous virtual memory available for user-space processes is
+> 128TiB, half of the total 256TiB Sv48 virtual address space. (The
+> limit for kernel-space mappings managed by the `vmalloc` and `ioremap`
+> subsystems is even smaller, 32TiB, reserving the remaining kernel
+> virtual address space for the direct linear mapping and fixed
+> structures.)
+
+The board also maps non-memory devices to the physical address space:
+CLINT, HTIF, PLIC, and (in unreproducible machines only) one or more
+VirtIO devices.
+
+#### CLINT
+
+The Core Local Interruptor (or CLINT) controls the timer interrupt. The
+active addresses are `0x0200bff8` (`mtime`)
+and `0x02004000` (`mtimecmp`). The CLINT issues a hardware interrupt
+whenever `mtime` reaches or exceeds `mtimecmp`. Since Cartesi Machines must ensure
+reproducibility, the processor’s clock and the timer are locked by a
+constant frequency divisor of `8192`. In other words, `mtime` is
+incremented once for every `8192` increments of `mcycle`. There is no
+notion of wall-clock time.
+
+#### HTIF
+
+The Host-Target Interface (HTIF) mediates communication with the
+external world. It is mapped to physical memory starting at
+`0x40008000`, where registers can be accessed at the following offsets:
+
+| Offset  | Register   |
+|---------|------------|
+| `0x000` | `tohost`   |
+| `0x008` | `fromhost` |
+| `0x010` | `ihalt`    |
+| `0x018` | `iconsole` |
+| `0x020` | `iyield`   |
+| `0x028` | *Reserved* |
+| `...`   | `...`      |
+| `0x218` | *Reserved* |
+
+The format of CSRs `tohost` and `fromhost` is as follows:
+<p>
+</p>
+
+| Bits  | `63-56` | `55-48` | `47-32`  | `31-0` |
+|-------|---------|---------|----------|--------|
+| Field | `DEV`   | `CMD`   | `REASON` | `DATA` |
+
+Interactions with Cartesi’s HTIF device adhere to the following protocol:
+
+1.  start by writing 0 to `fromhost`;
+2.  write the <i>request</i> to `tohost`;
+3.  read the <i>response</i> from `fromhost`.
+
+Cartesi’s HTIF supports 3 subdevices: Halt, Console, and Yield. These
+are identified by the following values for the field `DEV`.
+
+| Name               | `DEV` |
+|--------------------|-------|
+| `HTIF_DEV_HALT`    | `0`   |
+| `HTIF_DEV_CONSOLE` | `1`   |
+| `HTIF_DEV_YIELD`   | `2`   |
+
+Registers `ihalt`, `iconsole`, and `iyield` are bit masks specifying the
+commands that are available for the respective devices. Unavailable
+commands are silently ignored by the machine.
+
+##### Halt
+
+| Name                 | `CMD` |
+|----------------------|-------|
+| `HTIF_HALT_CMD_HALT` | `0`   |
+
+The Halt device (`DEV=HTIF_DEV_HALT`) is used to halt the machine. This
+will permanently set register `iflags_H` to 1 and return control back to
+the host.
+
+Send request `CMD=HTIF_HALT_CMD_HALT` with bit 0 of the 32-bit `DATA`
+field (bits 31–0) set to 1. The remaining bits 31–1 of `DATA` carry an
+arbitrary exit code, read as `DATA >> 1`, following the convention used
+by the RISC-V test framework. The `cartesi-machine` utility reports this
+value as the machine’s exit code.
+
+##### Console
+
+| Name                       | `CMD` |
+|----------------------------|-------|
+| `HTIF_CONSOLE_CMD_GETCHAR` | `0`   |
+| `HTIF_CONSOLE_CMD_PUTCHAR` | `1`   |
+
+The Console device (`DEV=HTIF_DEV_CONSOLE`) can be used to input/output
+characters.
+
+To input a character from console (in interactive sessions), request
+`CMD=HTIF_CONSOLE_CMD_GETCHAR`, `DATA=0`, then read response
+`CMD=HTIF_CONSOLE_CMD_GETCHAR`, `DATA=<ch>+1` (`DATA=0` means no
+character was available).
+
+To output a character `<ch>` to console, request
+`CMD=HTIF_CONSOLE_CMD_PUTCHAR`, with `DATA=<ch>`.
+
+##### Yield
+
+The Yield device can be used to return control to the host. There are
+two types of yield: *automatic* and *manual*.
+
+| Name                       | `CMD` |
+|----------------------------|-------|
+| `HTIF_YIELD_CMD_AUTOMATIC` | `0`   |
+| `HTIF_YIELD_CMD_MANUAL`    | `1`   |
+
+To issue an automatic yield, request `CMD=HTIF_YIELD_CMD_AUTOMATIC`. An
+automatic yield sets register `iflags_X` to 1 and returns control back
+to the host. There are currently 3 supported reasons for automatic
+yields:
+
+| Name                                    | `REASON` |
+|-----------------------------------------|----------|
+| `HTIF_YIELD_AUTOMATIC_REASON_PROGRESS`  | `1`      |
+| `HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT` | `2`      |
+| `HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT` | `4`      |
+
+To report `progress`, set `REASON=HTIF_YIELD_AUTOMATIC_REASON_PROGRESS`,
+and `DATA=<permil>`, where `<permil>` gives the progress in per-mille.
+The other reasons for automatic yield signal the production of Cartesi
+Rollups responses. `REASON=HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT`
+denotes the production of an output (a voucher, delegate-call voucher,
+or notice) and `REASON=HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT` denotes
+the production of a report. In both cases, the guest writes the payload
+to the CMIO TX buffer and `DATA` carries the payload length in bytes.
+
+To issue a manual yield, request `CMD=HTIF_YIELD_CMD_MANUAL`. A manual
+yield sets register `iflags_Y` to 1 and returns control back to the
+host. There are currently 3 supported reasons for manual yields, all
+used with Cartesi Rollups:
+
+| Name                                    | `REASON` |
+|-----------------------------------------|----------|
+| `HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED`  | `1`      |
+| `HTIF_YIELD_MANUAL_REASON_RX_REJECTED`  | `2`      |
+| `HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION` | `4`      |
+
+To accept or reject the previous request, set
+`REASON=HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED` or
+`REASON=HTIF_YIELD_MANUAL_REASON_RX_REJECTED`, respectively. On accept,
+the guest writes the root hash of the output hashes tree to the CMIO TX
+buffer, and `DATA` in `tohost` carries the length of that hash in bytes.
+On reject, `DATA` is ignored. Upon return, the host has loaded the next
+request into the CMIO RX buffer. The `REASON` field in `fromhost`
+carries the request type, and the `DATA` field carries the request
+length in bytes.
+
+| Name                              | `REASON` in response |
+|-----------------------------------|----------------------|
+| `HTIF_YIELD_REASON_ADVANCE_STATE` | `0`                  |
+| `HTIF_YIELD_REASON_INSPECT_STATE` | `1`                  |
+
+To signal the throwing of a rollup exception, set
+`REASON=HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION`. The guest writes the
+exception payload to the CMIO TX buffer and `DATA` in `tohost` carries
+the payload length in bytes.
+
+Before resuming the emulator after a manual yield, the host must
+manually reset register `iflags_Y` to 0. Otherwise, the emulator will
+immediately return with no changes to its state.
+
+#### Rollup
+
+In order to interact with Cartesi Rollups, the host application
+controlling the emulator and the guest application running inside the
+emulator must follow an agreed-upon protocol, mediated by the HTIF Yield
+device.
+
+The low-level view of what happens inside the machine is as follows:
+
+    Initialize
+    `reason` = HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED
+    `length` = 0
+    Repeat
+        Yield manual with `reason` as `REASON` and `length` as `DATA` in `tohost`
+        If `REASON` in `fromhost` is HTIF_YIELD_REASON_ADVANCE_STATE
+            Read ABI-encoded EvmAdvance(...) from CMIO RX buffer
+            Process advance-state request
+            For each output to emit (voucher, delegate-call voucher, or notice)
+                Write ABI-encoded output to CMIO TX buffer and its length to `length`
+                Add output hash to output hashes tree
+                Yield automatic with HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT as `REASON` and `length` as `DATA` in `tohost`
+            End
+            For each report to emit
+                Write raw report data to CMIO TX buffer and its length to `length`
+                Yield automatic with HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT as `REASON` and `length` as `DATA` in `tohost`
+            End
+            If exception to emit
+                Write raw exception data to CMIO TX buffer and its length to `length`
+                `reason` = HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION
+            ElseIf input rejected
+                `length` = 0
+                `reason` = HTIF_YIELD_MANUAL_REASON_RX_REJECTED
+            Else
+                Write output hashes root hash to CMIO TX buffer
+                `length` = hash size
+                `reason` = HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED
+            End
+        ElseIf `REASON` in `fromhost` is HTIF_YIELD_REASON_INSPECT_STATE
+            Read raw query from CMIO RX buffer
+            Process inspect-state request
+            For each report to emit
+                Write raw report data to CMIO TX buffer and its length to `length`
+                Yield automatic with HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT as `REASON` and `length` as `DATA` in `tohost`
+            End
+            If exception to emit
+                Write raw exception data to CMIO TX buffer and its length to `length`
+                `reason` = HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION
+            Else
+                `length` = 0
+                `reason` = HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED
+            End
+        Else
+            `length` = 0
+            `reason` = HTIF_YIELD_MANUAL_REASON_RX_REJECTED
+        End
+    End
+
+At a higher level, the guest application running inside the emulator is
+supported by the libcmt library or by even higher-level interfaces based
+on it, such as the `/usr/bin/rollup` command-line utility, the HTTP API
+exposed by the `/usr/bin/rollup-http-server` command-line utility, or a
+language-specific framework. The libcmt library handles ABI encoding and
+decoding, maintains the output hashes tree in userspace, and uses the
+`/dev/cmio` device driver to move data to and from the CMIO buffers and
+perform the required yields. See [The libcmt
+library](#the-libcmt-library), [The /dev/cmio
+device](#the-devcmio-device), [The rollup command-line
+utility](#the-rollup-command-line-utility), and [The rollup HTTP
+server](#the-rollup-http-server) for the corresponding interfaces.
+
+There are two types of request: advance-state requests and inspect-state
+requests. The loop processes one request per iteration. To transition
+between requests, the application accepts the previous request, rejects
+it, or throws an exception. The return from the accept yield defines the
+type of the next request.
+
+When the application identifies an advance-state request, it reads the
+ABI-encoded input from the CMIO RX buffer. While processing
+advance-state requests, the application can emit outputs (vouchers,
+delegate-call vouchers, or notices) and reports, in any order. Outputs
+and reports are written to the CMIO TX buffer. Outputs contribute to the
+output hashes tree maintained by libcmt. When the application is ready
+to accept the next input, libcmt writes the current output hashes root
+hash to the CMIO TX buffer as part of the accept yield.
+
+When an application identifies an inspect-state request, it reads the
+raw query from the CMIO RX buffer. While processing inspect-state
+requests, the application can emit reports. Reports are written to the
+CMIO TX buffer and do not affect the output hashes tree.
+
+Instead of accepting or rejecting a request, the application can emit an
+exception to signal some unrecoverable error. The exception is also
+written to the CMIO TX buffer.
+
+Inputs and outputs exchanged through the CMIO buffers follow the Solidity
+ABI specification. Advance-state inputs arrive in the CMIO RX buffer as
+`EvmAdvance(uint256 chainId, address appContract, address msgSender, uint256 blockNumber, uint256 blockTimestamp, uint256 prevRandao, uint256 index, bytes payload)`.
+Vouchers are encoded as
+`Voucher(address destination, uint256 value, bytes payload)`.
+Delegate-call vouchers are encoded as
+`DelegateCallVoucher(address destination, bytes payload)`. Notices are
+encoded as `Notice(bytes payload)`. Reports, inspect queries, and
+exceptions travel as raw bytes.
+
+In the host, the loop is as follows:
+
+    Save fresh fork of machine as a snapshot
+    Repeat
+        Obtain the next request from an external source
+        If advance-state request
+            Write the current state hash to the state at AR_SHADOW_REVERT_ROOT_HASH_START
+            Write ABI-encoded EvmAdvance(...) to CMIO RX buffer and its length to `length`
+            Write HTIF_YIELD_REASON_ADVANCE_STATE to `REASON` and `length` as `DATA` in `fromhost`
+            Reset register `iflags_Y` to 0
+            While register `iflags_H` is 0 and register `iflags_Y` is 0 (neither halted nor manual yield)
+                Resume machine
+                If register `iflags_X` is set (automatic yield)
+                    If `REASON` in `tohost` is HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT
+                        `length` = `DATA` from `tohost`
+                        Read ABI-encoded output from CMIO TX buffer using `length`
+                    End
+                    If `REASON` in `tohost` is HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT
+                        `length` = `DATA` from `tohost`
+                        Read raw report data from CMIO TX buffer using `length`
+                    End
+                End
+            End
+            If register `iflags_Y` is not 0 (machine yielded manual)
+                If `REASON` in `tohost` is HTIF_YIELD_MANUAL_REASON_RX_REJECTED
+                    Replace machine with fresh fork of snapshot
+                End
+                If `REASON` in `tohost` is HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED
+                    `length` = `DATA` from `tohost` (length of hash)
+                    Read output hashes root hash from CMIO TX buffer using `length`
+                    Replace snapshot with fresh fork of machine
+                End
+                If `REASON` in `tohost` is HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION
+                    `length` = `DATA` from `tohost`
+                    Read raw exception data from CMIO TX buffer using `length`
+                    Abort
+                End
+            End
+            If register `iflags_H` is not 0 (machine is halted)
+                Abort
+            End
+        End
+        If inspect-state request
+            Write raw query to CMIO RX buffer and its length to `length`
+            Write HTIF_YIELD_REASON_INSPECT_STATE to `REASON` and `length` as `DATA` in `fromhost`
+            Reset register `iflags_Y` to 0
+            While register `iflags_H` is 0 and register `iflags_Y` is 0 (neither halted nor manual yield)
+                Resume machine
+                If register `iflags_X` is set (automatic yield)
+                    If `REASON` in `tohost` is HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT
+                        `length` = `DATA` from `tohost`
+                        Read raw report data from CMIO TX buffer using `length`
+                    End
+                End
+            End
+            Replace machine with fresh fork of snapshot
+        End
+    End
+
+The host controls the emulator via the C, Lua, or JSON-RPC APIs. It
+loops obtaining requests from an external source. Processing requests
+modifies the state of the machine. However, at the end of a request, the
+host may have to revert these changes. Therefore, the host keeps a
+snapshot of the state of the machine before any request is processed.
+
+For an advance-state request, the host sends the request with
+`machine:send_cmio_response()`, passing the current state hash for the
+machine to record. (This, of course, changes the state so its hash is
+not what has just been written, but this is expected.) The call also
+writes the request to the CMIO RX buffer and its type and length to the
+HTIF register `fromhost`, and unblocks the machine by clearing its
+`iflags_Y` register. The machine is now ready to be resumed. The host
+loops resuming the machine and collecting its outputs or reports every
+time it yields automatic. The guest application is eventually done with
+the input. If it rejects the input, the host drops the current machine
+and replaces it with a copy of the snapshot. If it accepts the input,
+the host replaces the snapshot with a copy of the current machine, and
+collects the new output hashes root hash. If it threw an exception or
+halted, the host aborts.
+
+For an inspect-state request, the loop is very similar. The differences
+are that only reports are collected (outputs are ignored), and that the
+machine is always reverted back to a copy of its snapshot.
+
+#### Address ranges
+
+A Cartesi Machine contains many address ranges. The address ranges
+visible to the main processor are mapped at fixed positions in its
+64-bit physical address space. These are the ranges listed in the [board
+mapping table](#the-board) at the start of this chapter, exposed to Lua
+via the `cartesi.AR_*` constants, and discoverable at runtime via the
+[PMA array](#pmas) described in the next subsection.
+
+The uarch has its own private address ranges, which are not accessible
+to the main processor:
+
+| Physical address        | Mapping                  |
+|-------------------------|--------------------------|
+| `0x00400000-0x00400fff` | Microarchitecture shadow |
+| `0x00600000-0x007fffff` | Microarchitecture RAM    |
+
+The uarch shadow holds the uarch processor state. The uarch RAM holds
+the uarch program that decodes and executes one main processor
+instruction per uarch run before halting.
+
+#### PMAs
+
+Each address range visible to the main processor is described by an
+entry in the array of Physical Memory Attribute records (PMAs). The PMA
+array occupies `0x00010000-0x00010fff` and starts at address `0x10000`
+(exposed as `cartesi.AR_PMAS_START`). This is how the RISC-V interpreter
+discovers the available ranges at runtime, regardless of whether it is
+compiled to run directly on the host or inside a ZK prover. The
+microarchitecture’s private ranges are not visible to the main processor
+and have no PMA entries, though a driver id is reserved for the uarch
+shadow state for consistency.
+
+Each PMA consists of 2 64-bit words. The first word gives the start of a
+range and the second word its length. These words are readable both
+internally and externally. Since the ranges must be aligned to 4KiB page
+boundaries, the lowest 12 bits of each word are available for
+attributes. The meaning of each attribute field is as follows.
+
+First word:
+
+| Bits  | `63-12` | `11-8` | `7`  | `6`  | `5` | `4` | `3` | `2` | `1`  | `0` |
+|-------|---------|--------|------|------|-----|-----|-----|-----|------|-----|
+| Field | `start` | `DID`  | `IW` | `IR` | `X` | `W` | `R` | `E` | `IO` | `M` |
+
+The `M`, `IO`, and `E` bits are mutually exclusive, and respectively
+mark the range as memory, I/O mapped, or excluded. Bits `R`, `W`,
+and `X` mark read, write, and execute permissions, respectively. The
+`IR` and `IW` bits mark the range as idempotent for reads and writes,
+respectively. Finally, the `DID` gives the driver id, which can have the
+following values:
+
+| Name                         | Value |
+|------------------------------|-------|
+| `PMA_EMPTY_DID`              | `0`   |
+| `PMA_MEMORY_DID`             | `1`   |
+| `PMA_SHADOW_STATE_DID`       | `2`   |
+| `PMA_FLASH_DRIVE_DID`        | `3`   |
+| `PMA_CLINT_DID`              | `4`   |
+| `PMA_HTIF_DID`               | `5`   |
+| `PMA_PLIC_DID`               | `6`   |
+| `PMA_CMIO_RX_BUFFER_DID`     | `7`   |
+| `PMA_CMIO_TX_BUFFER_DID`     | `8`   |
+| `PMA_SHADOW_UARCH_STATE_DID` | `9`   |
+| `PMA_VIRTIO_DID`             | `10`  |
+| `PMA_NVRAM_DID`              | `11`  |
+
+Second word:
+
+| Bits  | `63-12`  | `11-0`          |
+|-------|----------|-----------------|
+| Field | `length` | *Reserved (=0)* |
+
+The list of PMA records ends with an invalid PMA entry for which
+`length=0`.
+
+### Linux setup
+
+By default, `pc` starts at the beginning of RAM (address `0x80000000`),
+where the RAM image is loaded. The emulator builds a
+[<i>devicetree</i>](https://www.devicetree.org/) describing the hardware
+at instantiation time, derived from the machine configuration, and
+writes it into the DTB memory range immediately below RAM. The start
+address of the DTB (`0x7ff00000`) is pre-loaded in register `a1`, per
+the conventional RISC-V boot ABI.
+
+The `dtc` command-line utility can be used to inspect the devicetree:
+
+``` bash
+cartesi-machine \
+    --no-init-splash \
+    --quiet \
+    --user=root \
+    -- "dtc -I dtb -O dts /sys/firmware/fdt"
+```
+
+The result is
+
+``` text
+/dts-v1/;
+
+/ {
+	#address-cells = <0x02>;
+	#size-cells = <0x02>;
+	compatible = "ucbbar,riscvemu-bar_dev";
+	model = "ucbbar,riscvemu-bare";
+
+	chosen {
+		bootargs = "quiet earlycon=sbi console=hvc0 uio_pdrv_genirq.of_id=generic-uio root=/dev/pmem0 rw init=/usr/sbin/cartesi-init";
+	};
+
+	cartesi-machine {
+		version = "0.20";
+		init = [55 53 45 52 3d 72 6f 6f 74 0a];
+		entrypoint = [64 74 63 20 2d 49 20 64 74 62 20 2d 4f 20 64 74 73 20 2f 73 79 73 2f 66 69 72 6d 77 61 72 65 2f 66 64 74];
+	};
+
+	cpus {
+		#address-cells = <0x01>;
+		#size-cells = <0x00>;
+		timebase-frequency = <0x3d09>;
+
+		cpu@0 {
+			device_type = "cpu";
+			reg = <0x00>;
+			status = "okay";
+			compatible = "riscv";
+			riscv,isa = "rv64acdfimsu";
+			mmu-type = "riscv,sv39";
+			clock-frequency = <0x7a12000>;
+
+			interrupt-controller {
+				#address-cells = <0x00>;
+				#interrupt-cells = <0x01>;
+				interrupt-controller;
+				compatible = "riscv,cpu-intc";
+				phandle = <0x01>;
+			};
+		};
+	};
+
+	soc {
+		#address-cells = <0x02>;
+		#size-cells = <0x02>;
+		compatible = "ucbbar,riscvemu-bar-soc\0simple-bus";
+		ranges;
+
+		clint@2000000 {
+			compatible = "riscv,clint0";
+			reg = <0x00 0x2000000 0x00 0xc0000>;
+			interrupts-extended = <0x01 0x03 0x01 0x07>;
+		};
+
+		plic@40100000 {
+			#interrupt-cells = <0x01>;
+			interrupt-controller;
+			compatible = "riscv,plic0";
+			riscv,ndev = <0x1f>;
+			reg = <0x00 0x40100000 0x00 0x400000>;
+			interrupts-extended = <0x01 0x09 0x01 0xffffffff>;
+			phandle = <0x02>;
+		};
+
+		htif@40008000 {
+			compatible = "ucb,htif0";
+			reg = <0x00 0x40008000 0x00 0x1000>;
+			interrupts-extended = <0x01 0x0d>;
+		};
+	};
+
+	memory@80000000 {
+		device_type = "memory";
+		reg = <0x00 0x80000000 0x00 0x8000000>;
+	};
+
+	reserved-memory {
+		#address-cells = <0x02>;
+		#size-cells = <0x02>;
+		ranges;
+
+		fw_resv@80000000 {
+			reg = <0x00 0x80000000 0x00 0x80000>;
+			no-map;
+		};
+	};
+
+	pmem@90000000 {
+		compatible = "pmem-region";
+		reg = <0x00 0x90000000 0x00 0x94e6000>;
+		volatile;
+	};
+
+	aliases {
+		flashdrive0 = "/pmem@90000000";
+		root = "/pmem@90000000";
+	};
+
+	cmio {
+		#address-cells = <0x02>;
+		#size-cells = <0x02>;
+		compatible = "ctsi-cmio";
+
+		rx_buffer@60000000 {
+			reg = <0x00 0x60000000 0x00 0x200000>;
+		};
+
+		tx_buffer@60800000 {
+			reg = <0x00 0x60800000 0x00 0x200000>;
+		};
+	};
+
+	yield {
+		compatible = "ctsi-yield";
+		manual;
+		automatic;
+	};
+};
+```
+
+The `memory@80000000` section describes 128MiB of RAM starting at address
+`0x80000000`. The `pmem@90000000` section describes flash drive 0: a
+memory region starting at address `0x90000000`, with compatible string
+`pmem-region`. This will eventually become available as `/dev/pmem0`.
+The `cmio` section specifies the starts and lengths of the CMIO memory
+ranges. The `yield` section specifies that the machine will process
+automatic and manual yields. Finally, section `chosen` includes the
+`bootargs` string that will be used as the kernel command-line
+parameters. Notice the specification of the root file-system as
+`root=/dev/pmem0` in the bootargs, and the `root` alias in `aliases`
+pointing to the `pmem` node. Also notice the command
+`dtc -I dtb -O dts /sys/firmware/fdt` coming directly from the
+`cartesi-machine` command line.
+
+Linux support for RISC-V is upstream in the [Linux kernel
+archives](https://www.kernel.org/). The kernel runs in supervisor mode,
+on top of a Supervisor Binary Interface (SBI) provided by a machine-mode
+shim: a [Cartesi fork](https://github.com/cartesi/opensbi) of
+[OpenSBI](https://github.com/riscv-software-src/opensbi), with
+Cartesi-specific extensions used by the kernel to talk to HTIF.
+Cartesi’s RAM image `linux.bin` is an OpenSBI `fw_payload` bundle, with
+the kernel embedded as the payload, built from the
+[`machine-linux-image`](https://github.com/cartesi/machine-linux-image)
+repository. OpenSBI occupies the first 512KiB of RAM, declared as a
+no-map region in the device tree so the kernel does not touch it. After
+self-initialization, OpenSBI switches to supervisor mode and cedes
+control to the kernel entry point.
+
+After completing its own initialization, the kernel mounts the root
+file-system (by default `root=/dev/pmem0 rw`) and cedes control to the
+program named by the `init=` parameter (by default
+`init=/usr/sbin/cartesi-init`). Cartesi’s root file-system `rootfs.ext2`
+is built from the
+[`machine-guest-tools`](https://github.com/cartesi/machine-guest-tools)
+repository, which also installs `cartesi-init` and the rollups
+user-space tooling. See [Initialization](#initialization-1) under the
+Guest perspective for what `cartesi-init` does after the kernel hands
+off.
+
+# The blockchain perspective
+
+This section describes the Cartesi Machine from the perspective of the
+blockchain. Using the Cartesi platform, smart contracts gain a new
+ability. They can get their users to agree on the results of
+computations that cannot be performed natively as smart contracts:
+computations that either involve too much data, are too computationally
+demanding, or require a sophisticated software infrastructure that is
+simply not available for use on-chain.
+
+Users that have a stake in a given computation are represented off-chain
+by Cartesi Nodes under their control. Cartesi Nodes react to
+Cartesi-enabled smart contracts and instantiate Cartesi Machines to
+perform the required computations and post the result back to the
+blockchain. Since Cartesi Machines are self-contained and reproducible,
+the results of off-chain computations performed by honest users will
+agree. The smart contract can then make decisions of consequence that
+depend on these results.
+
+When the Cartesi Node representing an honest user identifies an
+incorrect result posted by a dishonest user, it disputes the result. The
+opposing Cartesi Nodes then engage in an automatic dispute resolution
+protocol presided over by the blockchain, which results in the dishonest
+user being proven wrong. The smart contract that commanded the
+computation can then punish the dishonest user and reward the honest
+one.
+
+The Cartesi Machine emulator is one of a kind. It doesn’t simply emulate
+the RISC-V ISA to the extent that it can boot a performant operating
+system based on Linux. It does so in a way that allows smart contracts
+to specify computations, replace their inputs, inspect their outputs,
+and direct the dispute resolution protocol.
+
+## Hash-view of state
+
+One of the key goals of moving computations off-chain is to allow them
+to manipulate vast amounts of data: so much data that it becomes
+economically prohibitive to explicitly store them in the blockchain.
+Nevertheless, for smart contracts to delegate computations off-chain,
+they must be able to specify the computations, their inputs, and then
+reason over their outputs. The key to solving these seemingly
+contradictory goals is the clever use of cryptographic hashes.
+
+Cartesi Machines are transparent in the sense that their entire state is
+exposed for external inspection. This includes the RAM, all flash drives
+and NVRAMs, general purpose registers, control and status registers, and
+even the internal state of all devices. In fact, the entire machine
+state is mapped into the 64-bit physical memory address space of the
+Cartesi Machine. (The exact mapping is given in the [system
+architecture](#system-architecture) section of the guest perspective.)
+This means that, right before a machine is executed, a cryptographic
+hash of its entire state can be generated. A cryptographic hash of the
+state of a Cartesi Machine “completely” specifies the computation it is
+about to perform. This is because a given state always evolves in
+exactly the same way (because Cartesi Machines are self-contained and
+reproducible) and it is infeasible to find a different machine state
+that produces the same cryptographic state hash. By the same token, once
+the machine is done, the state hash “completely” specifies the result of
+the computation, wherever it may reside within the address space.
+
+> [!NOTE]
+>
+> The same caveat applies to “completely” here as to “only” earlier (see
+> [State hashes](#state-hashes)). There are vastly more possible machine
+> states than 256-bit state hashes, so collisions must exist, but
+> finding one is infeasible for a cryptographic hash function such as
+> Keccak-256.
+
+The state hash of a Cartesi Machine is the root hash of a Merkle tree.
+Merkle trees are binary trees where a leaf node is labeled with the hash
+of a data block and an inner node is labeled with the hash of the
+concatenated labels of its two child nodes. In the case of Cartesi
+Machines, a block is simply one of the 2<sup>59</sup> aligned 32-byte
+blocks in the machine’s physical memory address space. The root hash can
+be obtained from the `machine:get_root_hash()` method. In the
+command-line, the options `--initial-hash` and `--final-hash` of the
+`cartesi-machine` utility cause it to output the root hash of the Merkle
+tree as it is before the emulator starts running and after it is done
+running, respectively.
+
+The machine can be configured to use the `"keccak256"` hash function
+(for use with the uarch) or the `"sha256"` hash function (for use with
+ZK). In theory, the Merkle tree of the entire machine state could be
+built from these primitives and [external state
+access](#external-state-access) to the machine instance. In practice,
+most of the state is unused and implicitly filled with zeros, and this
+allows the Merkle tree computation to skip large swaths of the state by
+using precomputed hashes for subtrees that span zeroed out regions of
+all power-of-2 sizes. The computation is also smart enough to only
+update the parts of the tree that changed between invocations.
+
+<picture>
+<source media="(prefers-color-scheme: dark)" srcset="images/state-tree-dark.svg">
+<img alt="A machine's state hash-tree over its address space" src="images/state-tree-light.svg">
+</picture>
+
+The figure above shows the state Merkle tree of a machine, drawn over
+its 64-bit address space. Each memory range is a complete subtree, shown
+as a blue triangle rooted at one tree node. The address space between
+ranges is pristine, shown as pale triangles, and a single pristine gap
+may take more than one subtree to span. A tree node is blue when
+everything below it is a memory range, pale when all of it is pristine,
+and gray when it mixes the two. The state hash is the root, at the far
+left.
+
+Tree hashes are used instead of linear hashes because they support a
+variety of operations that are unavailable from linear hashes.
+
+### Slicing and splicing
+
+In the Merkle tree of a Cartesi Machine state, the labels of each of the
+2<sup>D</sup> nodes at a depth *D* can be seen as the root hashes for
+Merkle *subtrees* corresponding to adjacent intervals of *2<sup>L</sup>*
+bytes in the address space, where *L=64-D*. Each of these nodes can be
+identified by an address *A* and the log *L* of the length of the
+interval it spans, where *A* is aligned to a *2<sup>L</sup>* boundary.
+
+Consider a scenario in which a smart contract knows *only* the state
+hash *M* for a certain Cartesi Machine. Using Merkle trees makes the
+following key operations possible:
+
+1. *Slicing* — A user with access to the Merkle tree of *M* can provide
+   data the blockchain can use to prove that the word at a given address
+   has a given value. More generally, the user can provide data the
+   blockchain can use to prove that a node with a given address and
+   length in the tree has a given label.
+2. *Splicing* — A user with access to the Merkle tree of *M* can provide
+   data the blockchain can use to prove that writing a given word at a
+   given address results in a Cartesi Machine with a given state hash
+   *M’*. More generally, the user can provide data the blockchain can
+   use to prove that replacing a node of given length at a given address
+   with another node of equal length and a given label results in a
+   Cartesi Machine with a given state hash *M’*.
+
+To understand how the slicing proof works, notice that the path from the
+Merkle tree node at depth *D\>0* (i.e., with log length *L=64-D*) and
+address *A* goes through *D* nodes: *n<sub>D</sub>*, *n<sub>D-1</sub>*,
+…, *n<sub>1</sub>* until it reaches the root *n<sub>0</sub>*. The labels
+associated to all these nodes can be produced as follows. If
+*n<sub>D</sub>* is a leaf node, its `32`-byte contents must be provided
+and the label is the hash of those bytes. Otherwise, if it is a general
+node, its label must be provided. The label of *n<sub>D-1</sub>* can
+then be obtained by hashing together the label of node *n<sub>D</sub>*
+and the label of its sibling. The order between these two siblings is
+available from the *D*th most significant bit in address *A*. If it is
+clear, *n<sub>D</sub>*’s label comes first, otherwise, its sibling’s
+label comes first. It should be obvious that, when labels for *all
+siblings* in the path from the target node to the root are provided,
+this process can be repeated until the label of *n<sub>0</sub>* itself
+is obtained. This must match the value *M* known to the smart contract.
+In fact, due to the properties of cryptographic hashes, it is infeasible
+for the label so obtained to match *M* *unless all the data provided is
+true*.
+
+The data needed for the proofs can be produced by the
+`machine:get_proof(<address>, <log2_target_size>[, <log2_root_size>])`
+method of a Cartesi Machine instance. The contents of the proof returned
+are described in the [Lua interface](#state-value-proofs-1). That
+section uses the same small `hash-tree` module, whose three helpers are
+shown alongside the prose below.
+
+The workhorse is `roll_hash_up_tree(<proof>, <new_target_hash>)`:
+
+``` lua
+-- Recomputes the root hash implied by `proof`, starting from `target_hash`
+-- at the target node and combining it with one sibling hash per level.
+-- Reads `log2_target_size`, `log2_root_size`, `target_address` and
+-- `sibling_hashes` from `proof`. Returns the resulting hash; fails with
+-- "too few siblings" when `sibling_hashes` has no entry for some level.
+local function roll_hash_up_tree(proof, target_hash)
+    local hash = target_hash
+    -- One iteration per level, from the target node up to just below the root.
+    for log2_size = proof.log2_target_size, proof.log2_root_size - 1 do
+        -- `sibling_hashes` is indexed from 1, starting with the target node's own sibling.
+        local sibling = assert(proof.sibling_hashes[log2_size - proof.log2_target_size + 1], "too few siblings")
+        -- A set address bit at this level means the sibling comes before the current node.
+        local bit = (proof.target_address & (1 << log2_size)) ~= 0
+        local first, second
+        if bit then
+            first, second = sibling, hash
+        else
+            first, second = hash, sibling
+        end
+        -- The parent's hash is the hash of the two children, in address order.
+        hash = cartesi.keccak256(first, second)
+    end
+    return hash
+end
+```
+
+In the first iteration of the loop, the function uses the bit with value
+2<sup>`proof.log2_target_size`</sup> in `proof.target_address` to
+determine if the sibling of the target node comes before or after it in
+the address space of the Cartesi Machine. It then computes the hash of
+the concatenation of the target node’s hash and its sibling’s hash (in
+the correct order). To do so, it uses the
+`cartesi.keccak256(<hash1>, <hash2>)` function. The result must be the
+hash of the parent node to the target and its sibling. The loop then
+goes up the `proof.sibling_hashes` array, and obtains the sibling of
+this parent node. This is again concatenated with the just-calculated
+hash of the parent node (in the correct order) to obtain what must be
+the hash of the grandparent node. This process is repeated until the
+hash of what must be the root node is found and returned. Function
+`verify_slice(<proof>)` then compares this to `proof.root_hash`. If they
+match, the proof passes. Otherwise, something is amiss.
+
+The slicing check `verify_slice` wires this walk into the proof
+structure returned by `machine:get_proof()`:
+
+``` lua
+-- Asserts that rolling `proof.target_hash` up the tree reproduces
+-- `proof.root_hash`; fails with "target node not in tree" otherwise.
+-- Only the proof's internal consistency is checked here.
+local function verify_slice(proof)
+    assert(roll_hash_up_tree(proof, proof.target_hash) == proof.root_hash, "target node not in tree")
+end
+```
+
+To verify a slicing operation, the code uses `roll_hash_up_tree` to
+recompute the root hash from the target node’s hash and the sibling
+hashes on the path to the root, and compares the result against the root
+hash found in the proof. Any mismatch triggers an assertion. Checking
+that the root hash in the proof is the expected state hash *M* is left
+to the caller.
+
+Verifying a splicing operation is just as easy. First, the code verifies
+that the slicing operation is valid. This ensures that the sibling
+hashes are correct. Then, it uses `roll_hash_up_tree` to compute the
+root hash from the path between the target node and root. Only this time
+it starts from the new target node hash. The resulting root hash is the
+hash of a tree with the old node replaced by the new. This is exactly
+what `verify_splice` does:
+
+``` lua
+-- Asserts that replacing the proof's target node with one whose hash is
+-- `new_target_hash` yields a tree whose root hash is `new_root_hash`.
+-- Fails with an assertion error on any mismatch.
+local function verify_splice(proof, new_target_hash, new_root_hash)
+    -- Validate the proof as given first, so the sibling hashes reused below
+    -- are known to be consistent with `proof.root_hash`.
+    verify_slice(proof)
+    -- Same walk up the tree, this time starting from the replacement hash.
+    assert(roll_hash_up_tree(proof, new_target_hash) == new_root_hash, "target node not in tree")
+end
+```
+
+### Template instantiation
+
+The most important use for the splicing operation is template
+instantiation. From the blockchain perspective, a [Cartesi Machine
+template](#cartesi-machine-templates) is simply a state hash *M*.
+Instantiating the Cartesi Machine with a given input is simply the
+process of obtaining the state hash *M’* that results from replacing one
+or more of its input NVRAMs. Each replacement is the result of a
+splicing operation as described above. The splicing operation is
+particularly convenient if the input range length is a power of 2 and
+its start is aligned according to its length. This is why, by default,
+the Cartesi Machine positions flash drives and NVRAMs respecting these
+constraints.
+
+The following script performs the same operation in two distinct ways,
+an off-chain way and a blockchain way, and checks that the two agree.
+Off-chain, it instantiates the `calculator-template` concretely,
+modifies its input NVRAM with the contents of a mathematical expression,
+and then asks for the state hash *M’* of the modified machine.
+
+``` lua
+-- Load the Cartesi module and the helper modules used below
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+local hash_tree = require("cartesi.hash-tree")
+
+-- Obtain input expression from the command line (first argument, required)
+local input_expr = assert(arg[1], "missing input expression")
+
+-- Off-chain way: get instantiated template hash concretely
+
+-- Load machine from template
+local machine = cartesi.machine("calculator-template")
+
+-- Find input NVRAM by label
+local input_nvram = assert(util.find_drive(machine:get_initial_config(), "nvram", "input"))
+
+-- Write input expression, followed by a newline, to the start of the input NVRAM
+machine:write_memory(input_nvram.start, input_expr .. "\n")
+
+-- Get root hash of instantiated template
+local instantiated_template_hash = machine:get_root_hash()
+
+-- Blockchain way: verify instantiated template hash using proofs
+
+-- Load input proof (must be a whole-machine proof)
+local template_input_proof = require("pristine-input-proof")
+assert(template_input_proof.log2_root_size == cartesi.HASH_TREE_LOG2_ROOT_SIZE, "proof depth mismatch")
+
+-- Compute the root hash of the new input NVRAM contents
+-- (must be given exactly the bytes written to the machine above)
+local input_hash = hash_tree.get_root_hash(input_expr .. "\n", input_nvram.log2_size)
+
+-- Check that instantiated template hash can be obtained directly from input proof and new input hash
+-- (verify_splice raises an error on mismatch, so reaching the print means success)
+hash_tree.verify_splice(template_input_proof, input_hash, instantiated_template_hash)
+print("Instantiation by proof works!")
+```
+
+On chain, instantiating the machine like this would be impossible.
+Nevertheless, the script can obtain the same state hash *M’* using
+proofs. For this, it needs only the pristine input proof and the root
+hash of the modified input NVRAM. The splicing operation bubbles that
+root hash up the tree to recover the state hash, which the script then
+compares against the one obtained off-chain.
+
+Since the input NVRAM starts completely filled with zeros, only the
+mathematical expression is needed to describe its modified contents. Its
+root hash is computed by
+`hash_tree.get_root_hash(<data>, <log2_root_size>)`, which lays `<data>`
+at the base of a 2<sup>`<log2_root_size>`</sup>-byte subtree and returns its root.
+
+``` lua
+-- Computes the root hash of a subtree spanning 2^log2_root_size bytes that
+-- holds `data` at its base, with every byte past the end of `data` taken
+-- to be zero.
+--   data:           string with the non-zero prefix of the range
+--   log2_root_size: log2 of the size, in bytes, of the range
+-- Returns the root hash. Fails with "data does not fit in the tree" when
+-- `data` is longer than the range. Empty `data` yields the pristine root
+-- hash for the range.
+local function get_root_hash(data, log2_root_size)
+    assert(#data <= (1 << log2_root_size), "data does not fit in the tree")
+    -- Level zero is one hash per word, a trailing partial word zero-padded after the loop.
+    local level = {}
+    local full = #data - #data % WORD_LENGTH
+    for i = 1, full, WORD_LENGTH do
+        level[#level + 1] = cartesi.keccak256(data:sub(i, i + WORD_LENGTH - 1))
+    end
+    if full < #data then
+        local word = data:sub(full + 1)
+        level[#level + 1] = cartesi.keccak256(word .. string.rep("\0", WORD_LENGTH - #word))
+    end
+    -- Pair upward to the root, the pristine hash standing in for every node the data misses.
+    local pristine = cartesi.keccak256(string.rep("\0", WORD_LENGTH))
+    for _ = WORD_LOG2_SIZE, log2_root_size - 1 do
+        local parents = {}
+        for i = 1, #level, 2 do
+            parents[#parents + 1] = cartesi.keccak256(level[i], level[i + 1] or pristine)
+        end
+        -- Move one level up; the pristine hash doubles its span along with it.
+        level, pristine = parents, cartesi.keccak256(pristine, pristine)
+    end
+    -- With empty data no level ever gets a node, so the whole range is
+    -- pristine; by now `pristine` is the pristine hash at the root level.
+    return level[1] or pristine
+end
+```
+
+The leaves are the 32-byte words of `<data>`, each hashed with
+`cartesi.keccak256`, and a trailing partial word is zero-padded. Each
+inner node is the hash of its two children. Every node that `<data>`
+does not reach takes its level’s pristine hash, the root of an all-zero
+subtree, obtained by hashing the previous level’s pristine hash with
+itself. In this way, the function recovers the drive’s root hash
+efficiently, without ever accessing its unmodified regions.
+
+Running the script with the command-line
+
+``` bash
+lua5.4 splice-calculator-with-new-drive.lua "6*2^1024 + 3*2^512"
+```
+
+produces the output
+
+``` text
+Instantiation by proof works!
+```
+
+### Result extraction
+
+The most important use for the slicing operation is retrieving
+computation results. In a typical scenario, a user posts the final state
+hash of an instantiated Cartesi Machine that has been run until it
+halted. When the other users agree with this final state hash, slicing
+operations can be used to convince the blockchain of the contents of the
+halted Cartesi Machine’s state. This can be the value of a single word
+in an output flash drive or NVRAM, or it can be the Merkle tree root for
+its entire contents.
+
+The following script performs the same operation in two distinct ways,
+an off-chain way and a blockchain way, and checks that the two agree.
+Off-chain, it instantiates the `calculator-template` concretely, writes
+a mathematical expression into its input NVRAM, runs the machine until
+it halts, reads the result string from its output NVRAM, and saves the
+state hash *M’* of the halted machine.
+
+``` lua
+-- Load the Cartesi module and the helper modules used below
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+local hash_tree = require("cartesi.hash-tree")
+
+-- Obtain input expression from the command line (first argument, required)
+local input_expr = assert(arg[1], "missing input expression")
+
+-- Off-chain way: get the result and the halted state hash concretely
+
+-- Load machine from template, silencing its console output
+local machine = cartesi.machine("calculator-template", { console = { output_destination = "to_null" } })
+local config = machine:get_initial_config()
+
+-- Write input expression, followed by a newline, to the start of the input NVRAM
+local input_nvram = assert(util.find_drive(config, "nvram", "input"))
+machine:write_memory(input_nvram.start, input_expr .. "\n")
+
+-- Run machine until it halts or yields manual
+-- (any other break reason simply resumes the machine)
+repeat
+    local break_reason = machine:run(math.maxinteger)
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+
+-- Read result string from output NVRAM and save the halted state hash
+-- (the "z" format keeps only the bytes before the first zero byte)
+local output_nvram = assert(util.find_drive(config, "nvram", "output"))
+local result = string.unpack("z", machine:read_memory(output_nvram.start, output_nvram.length))
+local halted_state_hash = machine:get_root_hash()
+
+-- Blockchain way: verify the result against the output proof
+
+-- Load output proof (must be a whole-machine proof)
+local output_proof = require("output-proof")
+assert(output_proof.log2_root_size == cartesi.HASH_TREE_LOG2_ROOT_SIZE, "proof depth mismatch")
+
+-- Reconstruct the root hash of the output NVRAM from the result alone
+local output_hash = hash_tree.get_root_hash(result, output_nvram.log2_size)
+
+-- Splicing the reconstructed output drive into the proof must reproduce the agreed machine hash
+-- (verify_splice raises an error on mismatch, so reaching the prints means success)
+hash_tree.verify_splice(output_proof, output_hash, halted_state_hash)
+print("Extraction by proof works!")
+print(result)
+```
+
+On chain, the blockchain wants to verify the result of the computation.
+This is possible when all interested parties agree on the final state
+hash *M’* of the Cartesi Machine they ran off-chain. Assuming this to be
+the case, and in possession of the output proof and the result, the
+blockchain reconstructs the root hash of the output NVRAM from the
+result with `hash_tree.get_root_hash`, the same function the previous
+example used for the input drive. It then passes the output proof, this
+reconstructed hash, and the agreed hash *M’* to `verify_splice`, which
+confirms that an output NVRAM with exactly this content sits in the
+machine whose state hash is *M’*. In other words, once everyone agrees
+on *M’*, the result really is there.
+
+Running the script with the command-line
+
+``` bash
+lua5.4 slice-calculator-output.lua "6*2^1024 + 3*2^512"
+```
+
+produces the output
+
+``` text
+Extraction by proof works!
+10786158809173895446375831144734148401707861873653839436405804869463\
+96054833005778796250863934445216126720683279228360145952738612886499\
+73495708458383684478649003115037698421037988831222501494715481595948\
+96901677837132352593468675094844090688678579236903861342030923488978\
+36036892526733668721977278692363075584
+```
+
+### The output hashes tree
+
+The operations so far concern the word-leaf tree of the machine state.
+The same slicing idea applies to another Merkle tree the project uses,
+the *output hashes tree*, introduced under [Rolling Cartesi Machines and
+Cartesi Rollups](#rolling-cartesi-machines-and-cartesi-rollups). Its
+leaves are output hashes, each one `cartesi.keccak256` of a single
+output, rather than the bytes of a fixed address range. Its height is
+fixed at 63, so it can hold up to 2<sup>63</sup> outputs. A leaf for an
+output not yet produced is pristine, literally 32 zero bytes, rather
+than the hash of a pristine word. A Rolling Cartesi Machine grows this
+one tree from genesis, across all of its epochs, one output at a time.
+
+Every operation the output hashes tree needs can be carried out from a
+compact summary of it, called a *frontier*, without ever materializing
+the whole tree. This matters at both ends of the system. Inside the
+Cartesi Machine, outputs accumulate across an unbounded number of
+epochs, so holding the complete tree would eventually exhaust the memory
+available to the guest. Outside, as we will see, even the output proofs
+can be generated holding only the frontier. The outputs themselves and
+their proofs are kept outside the machine, by the Cartesi Node. The
+machine state commits to them through the output hashes root hash alone.
+
+The frontier after *c* outputs captures the complete left subtrees
+standing over the leaves in the range \[0, *c*), each by its root hash.
+Writing *c* in binary, such a subtree spans 2<sup>*l*</sup> leaves and
+is present exactly when bit *l* of *c* is set. These subtrees tile the
+leaves left to right, largest first, so the frontier holds one root hash
+per set bit of *c*, and *c* itself can be read back from which entries
+are present. The module stores it as a fixed-length array with one slot
+per level, holding that level’s subtree root hash, or `false` where its
+bit is clear.
+
+The accessor `frontier_node` reads the hash of a node at one level from
+three regions that sit left to right in the tree, the frontier, an
+active region of nodes being worked on, and pristine padding:
+
+``` lua
+local function frontier_node(frontier_entry, base, active, pristine_entry, index) -- hash of the node at `index` in one level
+    local lo, hi = base, base + #active - 1 -- first and last positions covered by the active region
+    if index < lo then
+        return frontier_entry -- fell left: a complete left subtree from the frontier
+    elseif index > hi then
+        return pristine_entry -- fell right: an all-pristine subtree
+    else
+        return active[index - lo + 1] -- inside the active region (active is a 1-based array)
+    end
+end
+```
+
+A node index that falls to the left of the active region is supplied by
+the frontier, a complete left subtree’s root hash. One that falls to the
+right is the root hash of an all-pristine subtree. One inside is taken
+straight from the active region. In the excerpt, `<index>` is the node’s
+position within the level, `<base>` is where the active region begins
+and `<active>` holds its nodes, and `<frontier_entry>` and
+`<pristine_entry>` are that level’s frontier and pristine subtree roots.
+Both maintaining the frontier and emitting proofs go through this
+accessor.
+
+<figure>
+<img src="images/outputs-tree.svg"
+alt="Output hashes tree partitioned into frontier, active region, and pristine padding" />
+<figcaption aria-hidden="true">Output hashes tree partitioned into
+frontier, active region, and pristine padding</figcaption>
+</figure>
+
+The figure shows the tree mid-stream, scaled down to height four while
+the real output hashes tree has height 63. Six earlier outputs sit to
+the left under the frontier, which holds them as two complete subtrees,
+one of four leaves and one of two, filled blue at their roots. The three
+new outputs of this epoch form the active region in the middle, filled
+green. The seven leaves to the right are pristine padding, held as a
+four-leaf, a two-leaf, and a single-leaf subtree, filled gray at their
+roots. Only the hashes actually held are filled, so every node below a
+frontier or pristine root is left empty, outlined in its subtree’s
+color, because the frontier keeps each whole subtree as that one root
+hash and never materializes the leaves under it.
+
+The function `frontier_push_back` folds one new output leaf into the
+frontier:
+
+``` lua
+local function frontier_push_back(frontier, hash) -- folds one new leaf hash into the frontier, in place
+    local right = hash -- right-hand operand of the next merge, starting as the new leaf
+    local level = 1
+    while frontier[level] do -- an occupied level holds a left subtree to merge with
+        right = cartesi.keccak256(frontier[level], right)
+        frontier[level] = false -- the merged entry moves up, like a binary carry
+        level = level + 1
+    end
+    frontier[level] = right -- the first empty level receives the combined subtree root
+end
+```
+
+Adding an output advances the leaf count from *c* to *c*+1. In binary
+that clears a run of low set bits and sets the next one up, an ordinary
+carry. The function mirrors the carry, combining the new leaf with the
+present low levels from the bottom up to the first empty one, clearing
+each, and storing the resulting hash at that first empty level. It is
+the root of the subtree covering exactly the leaves ending at the new
+output, the frontier entry the carry creates. A level is combined only
+once every 2<sup>*l*</sup> outputs, so a long run of outputs costs
+constant work each, amortized.
+
+The function `frontier_get_root_hash` returns the root hash of the tree,
+padded with zero leaves to completion:
+
+``` lua
+local function frontier_get_root_hash(frontier) -- root hash of the tree, with every unfilled leaf pristine
+    local root = pristine_leaf -- node on the path of the next free leaf, starting at that (pristine) leaf
+    local pristine = pristine_leaf -- root of an all-pristine subtree at the current level
+    for level = 1, #frontier do
+        if frontier[level] then
+            root = cartesi.keccak256(frontier[level], root) -- the frontier entry is the left sibling
+        else
+            root = cartesi.keccak256(root, pristine) -- no entry here: pad on the right with a pristine subtree
+        end
+        pristine = cartesi.keccak256(pristine, pristine) -- all-pristine subtree one level up
+    end
+    return root
+end
+```
+
+Every leaf the outputs have not reached is pristine. The function climbs
+level by level, combining each present frontier entry on the left with
+pristine padding on the right. The [Output proofs](#output-proofs)
+example uses these two together while processing an epoch, pushing each
+accepted output and then rooting the frontier to check it against the
+output hashes root hash the guest reported.
+
+The constructor is `frontier`, which produces the frontier an epoch
+begins from:
+
+``` lua
+local function frontier(log2_max_leaves_or_last_proof) -- genesis frontier from a height, or one rebuilt from a last-output proof
+    if is_proof(log2_max_leaves_or_last_proof) then
+        local proof = log2_max_leaves_or_last_proof
+        local log2_max_leaves = proof.log2_root_size
+        local f = frontier_genesis(log2_max_leaves)
+        local leaf_count = proof.target_address + 1 -- the proof targets the last leaf, at index leaf_count - 1
+        local lowest_complete_level = 1 -- will become the level of leaf_count's lowest set bit (level = bit + 1)
+        while leaf_count & (1 << (lowest_complete_level - 1)) == 0 do
+            lowest_complete_level = lowest_complete_level + 1
+        end
+        -- Above the lowest complete level, where the leaf count's bit at that level is set, the last leaf
+        -- is a right child, so its proof sibling there is exactly the complete left subtree we need.
+        for level = lowest_complete_level + 1, log2_max_leaves do
+            local bit = level - 1
+            if leaf_count & (1 << bit) ~= 0 then f[level] = proof.sibling_hashes[level] end
+        end
+        -- At the lowest complete level, the last leaf is a right child at every lower level, so rolling it
+        -- up through the siblings below rebuilds that level's complete left subtree, which ends at the leaf
+        -- count.
+        local hash = proof.target_hash
+        for level = 1, lowest_complete_level - 1 do
+            hash = cartesi.keccak256(proof.sibling_hashes[level], hash) -- sibling on the left, running hash on the right
+        end
+        f[lowest_complete_level] = hash
+        return f
+    end
+    return frontier_genesis(log2_max_leaves_or_last_proof) -- not a proof: the argument is passed on as the tree height
+end
+```
+
+It distinguishes two cases with `is_proof`, which checks whether the
+argument is a proof table rather than a height. Given the tree height,
+it returns the empty frontier of a genesis epoch, the all-`false`
+frontier for the given height. Given the previous epoch’s last output
+proof instead, it rebuilds the frontier as it stood after that output.
+The last output is the rightmost leaf in the range \[0, *c*), so at every
+set bit of *c* above the lowest that leaf is a right child, and its proof
+sibling there is exactly the root hash the frontier stores for that
+level. The entry for the lowest set bit is recovered by rolling the leaf up
+through its siblings below. A single proof, the one already saved for an
+epoch’s last output, is therefore all the next epoch needs to resume the
+same genesis-rooted tree.
+
+Finally, `frontier_next_proofs` produces an epoch’s output proofs:
+
+``` lua
+local function frontier_next_proofs(frontier, next_output_hashes) -- one proof per new output hash, all against the same root
+    local log2_max_leaves = #frontier -- the frontier array length is used as the tree height
+    local next_output_count = #next_output_hashes
+    if next_output_count == 0 then return {} end -- nothing new to prove
+    local leaf_count = frontier_leaf_count(frontier) -- presumably the number of leaves already in the tree; helper not shown
+    -- siblings[i] is the i-th new output's sibling array.
+    local siblings = {}
+    for i = 1, next_output_count do
+        siblings[i] = {}
+    end
+    -- active holds the node hashes covering global indices [base, base + #active - 1] at the
+    -- current level; start at the leaves over [leaf_count, leaf_count + next_output_count).
+    local active = next_output_hashes
+    local base = leaf_count
+    local pristine = pristine_leaf -- the all-pristine subtree at the current level
+    for level = 1, log2_max_leaves do
+        local bit = level - 1
+        local frontier_entry = frontier[level]
+        -- Each output's proof sibling at this level is its node's neighbour (toggle the low bit).
+        for i = 1, next_output_count do
+            local node = (leaf_count + i - 1) >> bit -- ancestor of the i-th new leaf at this level
+            siblings[i][level] = frontier_node(frontier_entry, base, active, pristine, node ~ 1)
+        end
+        -- Climb one level: parent p has children 2p and 2p+1; the leftmost index halves.
+        local parents = {}
+        local parents_base = base >> 1
+        for p = parents_base, (base + #active - 1) >> 1 do
+            local left = frontier_node(frontier_entry, base, active, pristine, 2 * p)
+            local right = frontier_node(frontier_entry, base, active, pristine, 2 * p + 1)
+            parents[p - parents_base + 1] = cartesi.keccak256(left, right)
+        end
+        active, base = parents, parents_base
+        pristine = cartesi.keccak256(pristine, pristine) -- all-pristine subtree one level up
+    end
+    local root_hash = active[1] -- after the last level the single active node is the root
+    local proofs = {}
+    for i = 1, next_output_count do
+        proofs[i] = {
+            target_address = leaf_count + i - 1, -- leaf index of the i-th new output
+            log2_target_size = 0,
+            log2_root_size = log2_max_leaves,
+            target_hash = next_output_hashes[i],
+            root_hash = root_hash,
+            sibling_hashes = siblings[i],
+        }
+    end
+    return proofs
+end
+```
+
+Given the starting frontier and the output hashes accepted during the
+epoch, in order, it returns one proof per new output, all against the
+single final root. The only thing a new output’s proof needs from the
+earlier leaves in the range \[0, *c*) is the frontier. A left sibling on
+a new leaf’s path to the root always ends at an aligned boundary at or
+before *c*, so it is a complete subtree whose root hash the frontier
+already holds, never an individual old leaf. The function sweeps the new
+leaves up one level at a time, reading each proof sibling through
+`frontier_node`, which supplies a frontier entry or pristine padding at
+the boundaries. The proofs are built together, in one batch at the end
+of the epoch, because an early output’s low siblings are later outputs
+of the same epoch. Note that proofs issued for outputs in previous
+epochs were produced and stored by the Cartesi Node as soon as those
+epochs were finalized. They are checked against the state hash (and
+output hashes root hash) finalized then, not against what gets finalized
+in later epochs.
+
+Generating these proofs is shown in the Lua [Output
+proofs](#output-proofs) section. Checking an output against them, from a
+settled machine state hash alone, is shown under [Output
+verification](#output-verification) below.
+
+### Output verification
+
+The slicing and splicing operations above extract a result from a halted
+machine, whose entire output occupies a single NVRAM. A Rolling Cartesi
+Machine instead emits outputs one at a time and keeps running. The
+analogous operation is to verify the contents of a given output it
+produced. This is possible between epochs, once the state hash of the
+machine is agreed upon. From that state hash, a slicing operation
+recovers the output hashes root hash from the machine’s CMIO tx buffer.
+As described under [Output proofs](#output-proofs), this is the root of
+a Merkle tree. Its leaves are the hashes of all outputs ever produced,
+in order. A second slicing operation, in that tree, then proves the
+output’s hash is one of its leaves.
+
+When the [Rolling Cartesi Machine calculator](#rolling-cartesi-machines)
+processed its first epoch, it saved more than the outputs themselves.
+For each accepted input, it saved a proof that the output hashes root
+hash occupied the CMIO tx buffer. For each output, it saved an output
+proof. Through `--final-hash`, it also saved the machine state hash the
+epoch settled on. The output proofs are built against the epoch’s final
+output hashes root hash. They therefore pair with the output hashes root
+hash proof from the last accepted input, input 3. The following script
+verifies output 0 from the settled state hash and those artifacts alone,
+without instantiating any machine.
+
+``` lua
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+local hash_tree = require("cartesi.hash-tree")
+
+-- Read a proof saved as a Lua chunk
+local function read_proof(name)
+    return assert(loadfile(name, "t", {}))() -- text chunks only, run with an empty environment
+end
+
+-- The settled machine state hash, the two proofs, and the output to verify against them
+local machine_hash = util.read_file(assert(arg[1], "missing machine state hash")) -- compared as-is with root_hash below
+local output_hashes_root_hash_proof = read_proof(assert(arg[2], "missing output hashes root hash proof"))
+local output_proof = read_proof(assert(arg[3], "missing output proof"))
+local output = util.read_file(assert(arg[4], "missing output"))
+
+-- The output hashes root hash proof must be rooted at the agreed machine state hash
+assert(output_hashes_root_hash_proof.root_hash == machine_hash, "proof not rooted at the machine state hash")
+hash_tree.verify_slice(output_hashes_root_hash_proof) -- presumably raises on an invalid proof; confirm in hash-tree
+
+-- The output proof's root is the output hashes root hash, the value the tx-buffer word holds
+assert(
+    cartesi.keccak256(output_proof.root_hash) == output_hashes_root_hash_proof.target_hash,
+    "tx buffer holds another value"
+)
+hash_tree.verify_slice(output_proof)
+
+-- The output proof's target must be the hash of the output itself
+assert(cartesi.keccak256(output) == output_proof.target_hash, "output does not match the proof")
+
+print(string.format("output %d verified against the machine state hash", output_proof.target_address))
+```
+
+The script first checks that the output hashes root hash proof is rooted
+at the settled state hash. It then confirms the output proof’s root is the
+value that proof locates in the tx-buffer word, joining the two trees.
+Finally, it hashes the output’s bytes and matches the hash against the
+leaf the output proof locates, pinning down this exact output.
+
+Running the script over the artifacts the Rolling Cartesi Machine
+calculator saved
+
+``` bash
+lua5.4 verify-output-proof.lua \
+    epoch-1-state-hash.bin \
+    input-3-output-hashes-root-hash-proof.lua \
+    output-0-input-1-proof.lua \
+    output-0-input-1.bin
+```
+
+produces the output
+
+``` text
+output 0 verified against the machine state hash
+```
+
+## Verification game
+
+The question now becomes how the blockchain can identify the honest
+party when there are two opinions on the final state hash of a Cartesi
+Machine, for a computation the blockchain itself is unable to perform.
+This is the role of the verification game, an [established
+technique](https://doi.org/10.1016/j.ic.2013.03.003) on which our
+original [whitepaper](https://cartesi.io/cartesi_whitepaper.pdf) builds.
+It rests on one assumption, that at least one of the two parties is
+honest.
+
+The `verification-game.lua` recipe is a self-contained model of it. A
+referee, standing in for the Cartesi contracts deployed on the
+blockchain, mediates a dispute between two players, each standing in for
+a Cartesi Node that ran the computation off-chain. The three are
+separate processes that communicate over the network, which here stands
+in for blockchain transactions. The referee never trusts a player. The
+two players run identical code and differ only in the machine they hold.
+One is honest, the other cheats past a chosen point by switching to a
+machine that ran a different expression.
+
+The game opens with each player committing the final state hash of its
+machine, obtained by running it until it halts. If the two hashes agree
+there is no dispute and the result can be extracted directly. When they
+disagree the referee settles the dispute before accepting the result.
+
+``` lua
+local function run_referee(referee, dapp_contract) -- collect commitments, settle any dispute, then accept a result
+    local players = wait_for_commitments()
+
+    local winner = players[1] -- when the hashes match, either player's hash stands
+    if players[1].final_hash ~= players[2].final_hash then
+        winner = adjudicate_dispute(players, referee.initial_hash)
+    end
+
+    wait_for_result(dapp_contract, players, winner.final_hash)
+end
+```
+
+### Settling a dispute
+
+The dispute is settled in two bisections. The first ranges over `mcycle`
+and isolates the disputed main processor instruction, the second ranges
+over `uarch_cycle` and isolates the single uarch step within it.
+
+``` lua
+local function adjudicate_dispute(players, initial_hash) -- returns the player whose final hash survives the dispute
+    local state = { last_agreed_hash = initial_hash, hash_after = players[1].final_hash, branch = "start" }
+
+    -- Bisect to the disputed main-processor instruction.
+    bisect_level(players, "mcycle", cartesi.MCYCLE_MAX, state)
+    -- Narrow down to the microarchitecture instruction.
+    bisect_level(players, "uarch_cycle", cartesi.UARCH_CYCLE_MAX, state)
+
+    -- A converged cycle of UARCH_CYCLE_MAX-1 means the disputed transition is the reset, else a step.
+    phase("verdict")
+    local log = wait_for_log(players[1], state.branch, state.lo) -- player 1 supplies the log for the transition out of state.lo
+    eventf("Player 1 posted log")
+
+    -- Player 1 won if its log verifies against the agreed before-hash, otherwise player 2 is honest.
+    local winner = verify_state_transition(state.lo, state.last_agreed_hash, log, state.hash_after) and players[1]
+        or players[2]
+    eventf("Player %d wins! Final state hash is %s.", winner.index, short_hash(winner.final_hash))
+    return winner
+end
+```
+
+### One bisection level
+
+Each bisection narrows the disagreement to the single transition
+responsible for it, repeatedly asking both players for the state hash at
+the midpoint of an interval of cycles and keeping the half where they
+still disagree.
+
+``` lua
+local function bisect_level(players, level, hi, state) -- narrows [0, hi] to one disputed transition; stores its start in state.lo
+    phase("bisect_" .. level)
+    local lo, round = 0, 0
+    while math.ult(1, hi - lo) do -- unsigned compare: loop while the interval is wider than one cycle
+        local mid = lo + ((hi - lo) >> 1) -- midpoint; the logical shift treats the width as unsigned
+        local hash = wait_for_bisection(players, state.branch, level, mid)
+        if hash[1] == hash[2] then
+            lo, state.last_agreed_hash, state.branch = mid, hash[1], "agree" -- agreement at mid: keep the upper half
+        else
+            hi, state.hash_after, state.branch = mid, hash[1], "disagree" -- keep the lower half, with player 1's hash at mid
+        end
+        round = round + 1
+        eventf("%s bisection round %d, interval of disagreement is [0x%x, 0x%x]", level, round, lo, hi)
+    end
+    state.lo = lo
+end
+```
+
+The main processor has a fixed-point property once the machine halts.
+Running it for more `mcycle`s leaves the state, and therefore the hash,
+unchanged. Likewise, the uarch has a fixed-point property once it halts.
+Running it for more `uarch_cycle`s leaves the state unchanged, until a
+reset begins the next main processor instruction. This is what lets each
+bisection range over the full cycle ceiling without knowing in advance
+where either machine halts. A midpoint past a halt simply repeats the
+final hash, and the disagreement is still found at the cycle where the
+two computations diverge.
+
+### Verifying the state transition
+
+Once a single `uarch_cycle` is in dispute, the referee asks the first
+player for the access log of the transition out of that agreed cycle,
+and verifies that log without ever instantiating a machine. This stands
+for a Cartesi contract that can verify such logs directly on the
+blockchain. The transition is either an ordinary uarch step or the
+terminal reset that begins the next main processor instruction. Which
+one it is depends only on the agreed cycle, since the only transition
+out of `cartesi.UARCH_CYCLE_MAX - 1` is the reset, so the referee checks
+the log with `verify_reset_uarch` at that boundary and
+`verify_step_uarch` everywhere else. If the log proves that the agreed
+before-hash advances to the player’s committed after-hash, that player
+was honest, otherwise the other one is assumed to be.
+
+``` lua
+local function verify_state_transition(uarch_cycle, state_hash_before, log, state_hash_after) -- true when the log verifies
+    local pass
+    if uarch_cycle == cartesi.UARCH_CYCLE_MAX - 1 then -- the transition out of the last uarch cycle is the reset
+        eventf("Verifying uarch reset log!")
+        pass = pcall(cartesi.machine.verify_reset_uarch, cartesi.machine, state_hash_before, log, state_hash_after)
+    else
+        eventf("Verifying uarch step log!")
+        pass = pcall(cartesi.machine.verify_step_uarch, cartesi.machine, state_hash_before, log, state_hash_after)
+    end
+    eventf("Log is %s!", pass and "valid" or "invalid") -- pass is pcall's status: false if the verifier raised
+    return pass
+end
+```
+
+### Verifying the result
+
+Naming the winner settles which final state hash is the true one. The
+referee asks both players for a result and accepts the first that
+verifies against that hash.
+
+``` lua
+local function wait_for_result(dapp_contract, players, final_hash) -- loops until a posted result verifies against final_hash
+    phase("output")
+    while true do
+        local output = wait_for_output(players)
+        if verify_output(dapp_contract, output, final_hash) then
+            eventf("Result posted:\n%sAccepted!", output.target_value)
+            return -- the first result that verifies ends the phase
+        end
+        eventf("Result posted:\n%sRejected!", output.target_value) -- keep waiting for another posting
+    end
+end
+```
+
+A posted result verifies, by the same slicing operation shown earlier,
+only if its bytes hash to the proof’s target, the target sits at the
+output drive’s address, and the proof rolls up to the winner’s final
+hash.
+
+``` lua
+local function verify_output(dapp_contract, output, final_hash) -- true only when every check below passes
+    return output.proof.root_hash == final_hash -- proof is rooted at the settled final hash
+        and output.proof.log2_root_size == cartesi.HASH_TREE_LOG2_ROOT_SIZE
+        and output.proof.target_address == dapp_contract.output.start -- target sits at the output drive's address
+        and output.proof.log2_target_size == dapp_contract.output.log2_size
+        and hash_tree.get_root_hash(output.target_value, dapp_contract.output.log2_size) == output.proof.target_hash
+        and pcall(hash_tree.verify_slice, output.proof) -- the proof itself must verify without raising
+end
+```
+
+A result that does not, from the dishonest player or anyone else, is
+rejected. This keeps the result phase decoupled from the dispute: the
+parties who settle it need not be the parties who later rely on the
+finalized hash to prove the result.
+
+### Running the game
+
+To run the whole game, start the referee, the server the players connect
+to:
+
+``` bash
+lua5.4 verification-game.lua referee 127.0.0.1:8087 "6*2^1024 + 3*2^512"
+```
+
+then the honest player, which evaluates the public expression:
+
+``` bash
+lua5.4 verification-game.lua honest 127.0.0.1:8087 "6*2^1024 + 3*2^512"
+```
+
+and the dishonest player, which cheats at an early cycle into a
+different expression:
+
+``` bash
+lua5.4 verification-game.lua dishonest 127.0.0.1:8087 "6*2^1024 + 3*2^512" 25 7 "2+2"
+```
+
+The referee narrates the dispute from start to finish:
+
+``` text
+Player 1 posted final state hash 0xa7fdb74d....
+Player 2 posted final state hash 0xdbece74e....
+mcycle bisection round 1, interval of disagreement is [0x0, 0x7fffffffffffffff]
+mcycle bisection round 2, interval of disagreement is [0x0, 0x3fffffffffffffff]
+mcycle bisection round 3, interval of disagreement is [0x0, 0x1fffffffffffffff]
+...
+mcycle bisection round 62, interval of disagreement is [0x17, 0x1b]
+mcycle bisection round 63, interval of disagreement is [0x19, 0x1b]
+mcycle bisection round 64, interval of disagreement is [0x19, 0x1a]
+uarch_cycle bisection round 1, interval of disagreement is [0x0, 0x80000]
+uarch_cycle bisection round 2, interval of disagreement is [0x0, 0x40000]
+uarch_cycle bisection round 3, interval of disagreement is [0x0, 0x20000]
+...
+uarch_cycle bisection round 18, interval of disagreement is [0x4, 0x8]
+uarch_cycle bisection round 19, interval of disagreement is [0x6, 0x8]
+uarch_cycle bisection round 20, interval of disagreement is [0x7, 0x8]
+Player 1 posted log
+Verifying uarch step log!
+Log is valid!
+Player 1 wins! Final state hash is 0xa7fdb74d....
+Result posted:
+4
+Rejected!
+Result posted:
+10786158809173895446375831144734148401707861873653839436405804869463\
+96054833005778796250863934445216126720683279228360145952738612886499\
+73495708458383684478649003115037698421037988831222501494715481595948\
+96901677837132352593468675094844090688678579236903861342030923488978\
+36036892526733668721977278692363075584
+Accepted!
+```
+
+The bisection converges on the cheat point, the disputed step verifies
+in the honest player’s favor, and the cheater’s result is rejected
+before the true one is accepted.
+
+That dispute resolved on an ordinary uarch step, since the cheat point
+fell early in the disputed instruction’s uarch cycles. Cheating instead
+at the last uarch cycle, `cartesi.UARCH_CYCLE_MAX - 1`, moves the
+disagreement onto the terminal reset that begins the next instruction,
+the case the referee checks with `verify_reset_uarch`:
+
+``` bash
+lua5.4 verification-game.lua dishonest 127.0.0.1:8088 "6*2^1024 + 3*2^512" 25 "$last_uarch_cycle" "2+2"
+```
+
+This time the uarch bisection climbs to the reset boundary and the
+honest player’s reset log verifies just the same:
+
+``` text
+uarch_cycle bisection round 1, interval of disagreement is [0x80000, 0x100000]
+uarch_cycle bisection round 2, interval of disagreement is [0xc0000, 0x100000]
+uarch_cycle bisection round 3, interval of disagreement is [0xe0000, 0x100000]
+...
+uarch_cycle bisection round 18, interval of disagreement is [0xffffc, 0x100000]
+uarch_cycle bisection round 19, interval of disagreement is [0xffffe, 0x100000]
+uarch_cycle bisection round 20, interval of disagreement is [0xfffff, 0x100000]
+Player 1 posted log
+Verifying uarch reset log!
+Log is valid!
+Player 1 wins! Final state hash is 0xa7fdb74d....
+```
+
+For simplicity this model uses only two players, but the same idea is
+the basis for efficient algorithms that resolve disputes among many
+players. Our implementation has since moved on to use our
+[Permissionless Refereed Tournaments](https://arxiv.org/abs/2212.12439).
+For an even better algorithm, see our [Dave: A Decentralized, Secure,
+and Lively Fraud-Proof Algorithm](https://doi.org/10.1145/3734698).
diff --git a/doc/README.md.template b/doc/README.md.template
new file mode 100644
index 000000000..25e0eeaed
--- /dev/null
+++ b/doc/README.md.template
@@ -0,0 +1,4673 @@
+---
+title: Cartesi Machine
+include-before: |
+    # Table of contents
+---
+
+# Introduction
+
+The Cartesi Machine is Cartesi's solution for verifiable computation.
+It was designed to bring mainstream scalability to decentralized applications and mainstream productivity to their developers.
+
+## Scalability
+
+Applications running exclusively on smart contracts face severe constraints on the amount of data they can manipulate and on the complexity of computations they can perform.
+These limitations manifest themselves as exorbitant transaction costs and, even if such costs could somehow be overcome, as extremely long computation times.
+
+In comparison, applications running inside Cartesi Machines can process practically unlimited amounts of data, and at a pace orders of magnitude faster.
+This is possible because Cartesi Machines run off-chain, free of the overhead imposed by the consensus mechanisms used by blockchains.
+
+In a typical scenario, one of the parties involved in an application will execute the Cartesi Machine off-chain and report its results to the blockchain.
+Different parties do not need to trust each other because the Cartesi platform includes an automatic dispute mechanism for Cartesi Machines.
+All interested parties repeat the computation off-chain and, if their results do not agree, they enter into a dispute, which the mechanism guarantees to be always won by an honest party against any number of dishonest parties.
+
+To enable this dispute mechanism, Cartesi Machines are executed inside a special emulator that has three unique properties:
+
+- Cartesi Machines are _self-contained_ &mdash; They run in isolation from any external influence on the computation;
+- Cartesi Machines are _reproducible_ &mdash; Two parties performing the same computation always obtain exactly the same results;
+- Cartesi Machines are _transparent_ &mdash; They expose their entire state for external inspection.
+
+From the point of view of the blockchain, the disputes require only a tiny fraction of the amount of computation performed by the Cartesi Machine.
+Dispute resolution thus becomes an ordinary task and dishonest parties are generally expected to be exposed, which discourages the posting of incorrect results and further increases the efficiency of the platform.
+
+Cartesi Machines allow decentralized applications to take advantage of vastly increased computing capabilities off-chain, while enjoying the same security guarantees offered by code that runs natively as smart contracts.
+This is what Cartesi means by scalability.
+
+## Productivity
+
+Scalability is not the only impediment to widespread blockchain adoption.
+Another serious limiting factor is the reduced developer productivity.
+
+Modern software development involves the combination of dozens of off-the-shelf software components.
+Creating these components took the concerted effort of an active worldwide community over the course of several decades.
+They have all been developed and tested using well-established toolchains (programming languages, compilers, linkers, profilers, debuggers, etc.), and rely on multiple services provided by modern operating systems (memory management, multi-tasking, file systems, networking, etc.).
+
+Smart contracts are developed using ad-hoc toolchains, and run directly on top of custom virtual machines, without the support of an underlying operating system.
+This arrangement deprives developers of the tools of their trade, severely reduces their expressive power, and consequently decimates their productivity.
+
+In contrast, Cartesi Machines are based on a proven platform: [RISC-V](https://riscv.org/).
+RISC-V was born of research in academia at UC Berkeley.
+It is now maintained by its own independent foundation.
+It is important to keep in mind that, unlike many of its academic counterparts, RISC-V is not a toy architecture.
+It is suitable for direct native hardware implementation, which is indeed currently commercialized by a large (and ever-increasing) number of [vendors](https://en.wikipedia.org/wiki/RISC-V#Implementations).
+This means that, in the future, Cartesi will not be limited to emulation or binary translation off-chain.
+The RISC-V platform is supported by a vibrant community of developers.
+Their efforts have produced an extensive software infrastructure, most notably ports of the Linux Operating System and the GNU toolchain.
+
+By moving key parts of their application logic to run inside Cartesi Machines, but on top of the Linux Operating System, developers are isolated not only from the limitations and idiosyncrasies of specific blockchains, but also from irrelevant details of the Cartesi Machine architecture itself.
+They regain access to all the tools they have come to rely on when writing applications.
+
+This is Cartesi's contribution to empowering application developers to express their creativity unimpeded, and to boost their productivity.
+
+## What's in a machine
+
+The key components of a Cartesi Machine are its main processor and a board.
+The processor that performs the computations, executing the traditional fetch-execute loop while maintaining a variety of registers, implements a generous set of RISC-V extensions.
+The board defines the surrounding environment with an assortment of memories (RAM, flash drives, NVRAMs, etc.) and a number of devices.
+Memories and devices are mapped to the 64-bit physical address space of the Cartesi Machine.
+The amount of RAM, as well as the number, length, and position of the flash drives and NVRAMs in the address space can be chosen according to the needs of each particular application.
+The Cartesi Machine emulator is a program that carefully implements the Cartesi Machine architecture so that its execution is reproducible in production.
+During development, a variety of convenient devices can be added to the Cartesi Machine that make prototyping more ergonomic.
+The emulator can be built from the [`cartesi/machine-emulator`](https://github.com/cartesi/machine-emulator) repository.
+
+The Cartesi Machine also includes a microarchitecture (uarch) that can drive the main processor using a much-reduced RISC-V ISA.
+This is necessary to enable verifiability in architectures that, due to computational limitations, cannot emulate a main-processor instruction, such as blockchains.
+Running the uarch until it halts, and then resetting the uarch to its pristine state, is equivalent to executing one instruction of the main processor.
+See [the microarchitecture section](#the-microarchitecture) for details.
+
+The initialization of a Cartesi Machine typically loads the Linux kernel into RAM, and a Linux root file-system (as a flash drive) from regular files in the host file-system.
+The Linux kernel `linux.bin` is built by the [`cartesi/machine-linux-image`](https://github.com/cartesi/machine-linux-image) repository.
+After it is done with its own initialization, the Linux kernel cedes control to the `/usr/sbin/cartesi-init` program in the root file-system.
+The root file-system `rootfs.ext2` contains all the data files and programs that make up the Linux distribution.
+It is built by the [`cartesi/machine-rootfs-image`](https://github.com/cartesi/machine-rootfs-image) repository.
+The components of the guest application can reside in the root file-system itself, or in their own, separate file-systems.
+The emulator can be instructed to execute whatever command is necessary to start the guest application.
+For a complete description of the Cartesi Machine architecture and the boot process, see the documentation for [the guest perspective](#the-guest-perspective).
+
+There are two distinct modes of operation.
+In the first mode, a Cartesi Machine is initialized and tasked to run a guest application until the machine _halts_.
+Inputs for the guest application can be provided as additional flash drives with file-systems, or NVRAMs with raw data.
+Outputs are only available to the host after the machine halts.
+Once it halts, the machine cannot perform any additional computations.
+
+In the second mode of operation, the guest application runs in a loop.
+In each iteration, it obtains a request carrying an input, performs any necessary computations to service the request, and produces a number of responses.
+Indeed, this is much like a server in which the guest application can interact with the outside world.
+We say that a Cartesi Machine operating in this mode is a _Rolling Cartesi Machine_.
+
+### Rolling Cartesi Machines and Cartesi Rollups
+
+Rolling Cartesi Machines accept two types of requests: advance-state requests and inspect-state requests.
+Advance-state requests can create persistent changes to the state of the underlying Cartesi Machine.
+In contrast, inspect-state requests leave the state unchanged.
+
+Both types of request are serviced by the guest application, which modifies the state of the Cartesi Machine while doing so.
+When servicing an advance-state request, the guest application ultimately either accepts or rejects it.
+The resulting modifications are kept only when the request is accepted, and reverted when it is rejected.
+State modifications are always reverted after inspect-state requests are serviced.
+
+The stringent demands of reproducibility prevent a Cartesi Machine from communicating _directly_ with the outside world.
+Indeed, if two parties were to run the same Cartesi Machine and then disagree on the data each instance independently obtained from a network connection, there would be no way to settle a dispute between them.
+Instead, Rolling Cartesi Machines communicate with the outside world under controlled conditions, through _Cartesi Rollups_.
+
+In a nutshell, Cartesi Rollups uses the blockchain to maintain a public record of advance-state requests targeting each Rolling Cartesi Machine.
+Both the order and the inputs carried by these requests are recorded and made available in an indisputable fashion.
+Since Cartesi Machines are deterministic, and since the inputs are agreed upon, the state of a Rolling Cartesi Machine can be advanced in a well-defined way, always producing the same set of responses, no matter who runs it.
+
+After producing each response to a request, the guest application asks the machine to _yield_ control back to the host.
+The host extracts the response and _resumes_ the machine.
+When done with a given input, the guest application once again asks the machine to yield control back to the host.
+At the same time, it notifies the host whether the input was accepted or rejected.
+The host then prepares the input for the next request, and _resumes_ either the modified machine or a backup copy, so the guest application can service the next request in a new iteration of its loop.
+Inputs and responses are transferred in special memory ranges (_CMIO_ memory ranges).
+
+Advancing the state of a Rolling Cartesi Machine can produce four types of response: _vouchers_, _notices_, _reports_, and _exceptions_.
+Vouchers allow a Rolling Cartesi Machine to interact back with the blockchain.
+A voucher issued by the guest application may, for example, grant a user the right to withdraw tokens locked into a custodial smart contract.
+Notices are used to register noteworthy changes to the state of the guest application.
+A notice may be issued, for example, announcing the demise of a character in a game or some other relevant state transition.
+Disputes over the fact that a voucher or notice has been generated while advancing the state of a Rolling Cartesi Machine can be settled by Cartesi Rollups.
+Reports, in contrast, are used to output any data that is irrelevant to the blockchain.
+A report may, for example, provide diagnostic information on the reasons why an input has been rejected.
+
+_Rejecting an input not only reverts the state, but also cancels all vouchers and notices emitted while the request was serviced._
+
+The advance-state requests serviced by a Rolling Cartesi Machine are grouped into _epochs_.
+At the end of an epoch, the state of the machine is finalized, so its state hash becomes known.
+From the finalized state one can read the _output hashes root hash_, a single hash that commits to every voucher and notice the machine has ever emitted.
+This hash is the root of a Merkle tree maintained inside the machine, where each leaf is the hash of one of the outputs, in the order they are emitted.
+(The index of an output is its leaf position.)
+Given the contents of an output, and a proof that its hash is the leaf at that index in the tree, it is therefore possible to verify that the machine has in fact produced that output.
+This is how Cartesi Rollups settles disputes over the vouchers and notices a Rolling Cartesi Machine produces.
+
+Between state advances, it is possible to inspect the state of a Rolling Cartesi Machine.
+This works by sending a query for processing inside the Cartesi Machine.
+State inspection produces only reports and exceptions.
+_All modifications to the state due to servicing queries are reverted after the responses are collected._
+
+An exception, which either kind of request may produce, signals an irrecoverable error encountered by the guest application.
+
+## Documentation
+
+Cartesi Machines can be seen from three different perspectives:
+
+- _The host perspective_ &mdash;
+  This is the environment right outside the Cartesi Machine emulator.
+  It is most relevant to developers setting up Cartesi Machines, running them, or manipulating their contents.
+  It includes the emulator's API in all its flavors: C, C++, Lua, JSON-RPC, and the command-line interface;
+- _The guest perspective_ &mdash;
+  This is the environment inside the Cartesi Machine.
+  It encompasses Cartesi's particular flavor of the RISC-V architecture, as well as the organization of the Linux Operating System that runs on top of it.
+  It is most relevant to programmers responsible for the application components that run off-chain but must be verifiable.
+  The cross-compiling toolchain, and the tools used to build the Linux kernel and the Linux root file-systems are also important from this perspective, even though they are used in the host;
+- _The blockchain perspective_ &mdash;
+  This is the view smart contracts have of Cartesi Machines.
+  It consists almost exclusively of the manipulation of cryptographic hashes of the state of Cartesi Machines and parts thereof.
+  In particular, using only hash operations, the blockchain can verify assertions concerning the contents of the state, and can obtain the state hash that results from modifications to the state.
+  Notably, this includes direct verification by the blockchain of RISC-V instructions performed by the uarch, and ZK proofs of batches of RISC-V instructions performed by the main processor.
+
+As with every computer, the level of knowledge required to interact with Cartesi Machines depends on the nature of the application being created.
+Simple applications make only modest demands of each kind of developer. Guest developers code a few scripts invoking pre-installed software components. Host developers fill out a configuration file specifying the location of the components needed to build a Cartesi Machine. Blockchain developers instantiate one of the high-level contracts provided by Cartesi.
+At the other extreme are the developers contributing to the Cartesi ecosystem, who regularly write, build, and deploy custom software components to run in the guest, or even change the Linux kernel to support Cartesi-specific devices. Additionally, these developers programmatically control the creation and execution of Cartesi Machines in the host, and must also understand and use the hash-based state manipulation primitives the blockchain needs.
+
+Although Cartesi's goal is to shield platform users from as much complexity as possible, there is value in making information available to the greatest extent possible. To that end, this documentation of Cartesi Machines aims to provide enough information to cover all three perspectives, at all depths of understanding.
+
+# The host perspective
+
+Cartesi's reference off-chain implementation of a Cartesi Machine is based on software emulation.
+The emulator is written in C++23 with well-insulated POSIX dependencies.
+The [`cartesi/machine-emulator`](https://github.com/cartesi/machine-emulator) repository can be used to build and install the Cartesi Machine emulator.
+The emulator is implemented by a C++ class that can be accessed in a variety of different ways.
+
+When linked to a C++ application, the emulator can be controlled directly via the interface of the `cartesi::machine` class.
+C applications can control the emulator in a similar way, by means of a matching C API defined in the include file `cm.h`.
+The C API is stable and complete.
+It is the basis for the creation of bindings in other programming languages, most notably the Lua programming language.
+The emulator can be accessed via a `cartesi` module that exposes a `cartesi.machine` interface to Lua programs.
+Additionally, Cartesi provides a JSON-RPC server that can run a Cartesi Machine instance that is controlled remotely.
+The server supports JSON-RPC discovery so client libraries can be generated automatically.
+Finally, there is a command-line utility (written in Lua) that can configure and run Cartesi Machines for rapid prototyping.
+The C, C++, and Lua APIs, as well as the command-line utility, can seamlessly instantiate local emulators or connect to remote JSON-RPC servers.
+
+The documentation starts from the command-line utility, `cartesi-machine`.
+This utility is used for most prototyping tasks.
+The documentation then covers the Lua interface of `cartesi.machine`.
+The C, C++, and JSON-RPC interfaces closely mirror the Lua interface documented here, so this document does not cover them separately.
+The C API is defined in the `cm.h` header.
+The JSON-RPC API supports discovery, so client bindings can be generated from a running server.
+
+## Machine playground
+
+The setup of a new development environment is often a time-consuming task.
+This is particularly true in the case of cross-development environments (i.e., when the development happens in a host platform but software runs in a different target platform).
+With this in mind, the Cartesi team provides the `cartesi/machine-emulator-docs` Docker image for use while reading this documentation.
+The Docker image enables immediate experimentation with Cartesi Machines, as well as the generation of the documentation itself.
+It comes with a pre-built emulator and Lua interpreter accessible within the command-line, as well as a pre-built RAM image and root file-system.
+It also comes with the cross-compiler for the RISC-V architecture on which the Cartesi Machine is based.
+
+To enter the playground, open a terminal, download the Docker image from Cartesi's repository, and run it adequately mapping the current user and group information, as well as making the host's current directory available inside the container:
+
+```{.bash key=docker_pull replace=source vars=image->globals/docs_image}
+docker pull $image
+```
+
+```{.bash key=docker_run replace=source vars=image->globals/docs_image}
+docker run \
+    --hostname playground \
+    --name playground \
+    --rm \
+    -e USER=$(id -u -n) \
+    -e GROUP=$(id -g -n) \
+    -e UID=$(id -u) \
+    -e GID=$(id -g) \
+    -v "$(pwd)":/work \
+    -w /work \
+    -it \
+    $image \
+    /bin/bash
+```
+
+Once inside, you can execute the `cartesi-machine` utility as follows:
+
+```{.bash key=cli_help replace=source}
+set +o pipefail
+# docs:begin
+cartesi-machine --help | head -n 40
+# docs:end
+echo ...
+```
+
+```{.text replace=cli_help}
+```
+
+A final check can also be performed to verify if the contents inside the container are as expected:
+
+```{.bash key=linux_sha replace=source}
+sha256sum /usr/share/cartesi-machine/images/linux.bin
+```
+
+```{.text replace=linux_sha}
+```
+
+```{.bash key=rootfs_sha replace=source}
+sha256sum /usr/share/cartesi-machine/images/rootfs.ext2
+```
+
+```{.text replace=rootfs_sha}
+```
+
+Note that, if the hashes of the files you are using do not match the ones above, then when you attempt to replicate the examples in the documentation, you will obtain different hashes.
+Moreover, the cycle counts and outputs may also differ.
+
+## Command-line interface
+
+In the simplest usage scenario, the `cartesi-machine` command-line utility can be used to define a Cartesi Machine and run it until it halts.
+The command-line utility, however, is very versatile.
+It was designed to simplify the most common prototyping tasks.
+
+The simplest invocation takes no arguments
+```{.bash key=nothing_to_do outputs=config-nothing-to-do.lua replace=source}
+# docs:begin null
+cartesi-machine --max-mcycle=0 --store-config=config-nothing-to-do.lua
+# docs:end null
+cartesi-machine
+```
+and produces the output
+```{replace=nothing_to_do}
+```
+The utility instantiates a default Cartesi Machine and runs it until it halts.
+The Linux kernel boots, the Cartesi-provided `cartesi-init` script prints the ASCII-art splash and reports there is nothing to do, then gracefully halts the machine.
+This takes many millions of cycles to complete: time mostly spent initializing the Linux kernel.
+The utility regains control from the emulator, and prints the `Halted` message and the cycle count.
+
+### Initialization
+
+The following command instructs `cartesi-machine` to build a Cartesi Machine.
+The machine has 128MiB of RAM, uses `linux.bin` as the RAM image, and uses `rootfs.ext2` as the root file-system.
+(`linux.bin` is generated by [machine-linux-image](https://github.com/cartesi/machine-linux-image) and `rootfs.ext2` is generated by [machine-rootfs-image](https://github.com/cartesi/machine-rootfs-image). Sample files are available in the `cartesi/machine-emulator-docs` Docker image, which can be built from the `doc/` directory of the [machine-emulator](https://github.com/cartesi/machine-emulator) repository.)
+Once initialization is complete, the machine executes the command `ls /bin` and exits.
+
+```bash
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    --ram-length=128Mi \
+    --ram-image="/usr/share/cartesi-machine/images/linux.bin" \
+    --flash-drive="label:root,data_filename:/usr/share/cartesi-machine/images/rootfs.ext2" \
+    -- ls /bin
+```
+The `--quiet` option suppresses the output of `cartesi-machine.lua` itself, leaving visible only what is produced inside the machine.
+The command-line option `--no-init-splash` instructs the utility to skip the splash, keeping the output focused on the example at hand.
+The `--ram-image`, `--ram-length`, and `--flash-drive` command-line options have the values in the example as default, so these options can be omitted.
+To remove the default RAM image and the default root flash drive, use the command-line options `--no-ram-image` and `--no-root-flash-drive`, respectively.
+
+The simplified command-line is
+```{.bash key=ls_bin outputs=config-ls-bin.lua replace=source}
+{
+# docs:begin
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+# docs:begin null
+    --store-config=config-ls-bin.lua \
+# docs:end null
+    -- ls /bin
+# docs:end
+} | head
+echo ...
+```
+The output is
+```{replace=ls_bin}
+```
+
+It shows the listing of directory `/bin/` inside the root file-system.
+The listing was produced by the entrypoint command that follows the `--` separator in the command line.
+By a method explained in great detail later on (see [The guest perspective initialization](#initialization-1)) the entrypoint is picked up by the Cartesi-provided `/usr/sbin/cartesi-init`, which executes it before gracefully halting the machine.
+
+:::note
+In many of the documentation examples, the utilities invoked from the command-line executed by a Cartesi Machine are in the default search path for executables. (This is set up by the Cartesi-provided `/usr/sbin/cartesi-init` script itself.)
+When in doubt, or when using your own executables installed in custom locations, make sure to invoke them by using their full paths (e.g., `/bin/ls` or `/bin/sh` instead of simply `ls` and `sh`).
+:::
+
+### Interactive sessions
+
+By default, the `cartesi-machine` utility executes the Cartesi Machine in non-interactive mode.
+Verifiable computations must always be run in non-interactive sessions.
+User interaction with a Cartesi Machine via the console is, after all, not reproducible.
+Nevertheless, during development, it is often convenient to directly interact with the emulator, as if using a computer console.
+
+The command-line option `-i` (short for `--htif-console-getchar`) instructs the emulator to monitor the console for input, and to make this input available to the Linux kernel.
+Typically, this option will be used in conjunction with the `--` separator and the command `sh`, causing the Cartesi-provided `/usr/sbin/cartesi-init` script to drop into an interactive shell.
+Interaction with the shell enables the exploration of the Linux distribution from the inside.
+Exiting the shell returns control back to `/usr/sbin/cartesi-init`, which then gracefully halts the machine.
+
+For example, if an interactive session is started with the following command
+```{.bash key=cmdline_interactive_ls_shown replace=source}
+cartesi-machine \
+    --no-init-splash \
+    -i \
+    -- sh
+```
+it drops into the shell.
+Running the command `ls /bin` causes the listing of directory `/bin` to appear.
+Pressing Ctrl+D at the prompt then causes the shell to exit.
+The output is
+```{key=cmdline_interactive_ls replace=both}
+# The user-facing command is shown in the bash block above. Here we feed
+# the session non-interactively by piping `ls /bin` followed by the VEOF
+# character (^D, byte 0x04) into the emulator. The guest TTY's line
+# discipline turns ^D into a 0-byte read, so the shell exits cleanly
+# without an `exit` command, and ^D itself is not echoed. input_fd:0
+# routes the pipe to the console; /usr/sbin/cartesi-init halts the machine when the
+# user shell exits.
+printf 'ls /bin\n\x04' | cartesi-machine \
+    --no-init-splash \
+    -i \
+    --quiet \
+    --console-io=input_fd:0 \
+    -- sh | head
+echo ...
+```
+:::note
+When running in interactive mode, not even the final cycle count is reproducible.
+To avoid busy-waiting for new interactive input, the emulator sleeps from one Cartesi Machine timer interrupt to the next, skipping Cartesi Machine cycles forward so programs running inside stay _roughly_ in sync with wall-clock time outside.
+This dynamic balancing act is sure to vary between executions and across different computers.
+:::
+
+### Flash drives
+
+The command-line option `--flash-drive=label:<label>,data_filename:<filename>` can be used to add between 1 and 8 flash drives to the Cartesi Machine.
+Here, the string `<label>` is the *label* for the flash drive, and `<filename>` points to an *image file* with the initial contents of the flash drive.
+When the image file contains a valid file-system, the `cartesi-machine` command-line utility instructs `/usr/sbin/cartesi-init` to mount it at `/mnt/<label>`.
+
+To enable transparency, Cartesi Machine flash drives are mapped into the machine's 64-bit address space.
+The start and length are set, respectively, by the `start:<number>` and `length:<number>` parameters to `--flash-drive`.
+
+When the `length` parameter is omitted, the `cartesi-machine` utility automatically sets the size of a flash drive to match the size of its image file.
+Because RISC-V uses 4KiB pages, image files must have a size that is a multiple of 4KiB.
+(The `truncate` utility can be used to pad a file with zeros so its size is a multiple of 4KiB.)
+
+For convenience, numbers can be specified in decimal or hexadecimal (e.g., `4096` or `0x1000`) and may include a suffix multiplier (i.e., `Ki` to multiply by 2<sup>10</sup>, `Mi` to multiply by 2<sup>20</sup>, and `Gi` to multiply by 2<sup>30</sup>).
+They can also use the C programming language *shift left* notation to multiply by arbitrary powers of 2 (e.g. `1 << 24` meaning 2<sup>24</sup>).
+
+When the `length` of a drive is specified, the `data_filename` parameter can be omitted.
+In that case, the drive starts in a *pristine* state: i.e., filled with zeros.
+If, however, both `length` and `data_filename` are specified, then the `length` must exactly match the size of the image file referred to by the `data_filename` parameter.
+
+The positioning of memory ranges in the machine's address space has implications on certain operations, discussed in detail under [the blockchain perspective](#hash-view-of-state), that involve the manipulation of hashes of the Cartesi Machine state.
+First, memory ranges cannot overlap with each other.
+Second, memory ranges must start at positions that are aligned to their lengths.
+Finally, the lengths used to restrict the starts and to detect overlaps are rounded up to the next power of 2.
+
+When the `start` of a drive is omitted, the emulator automatically places it following this rule.
+The first drive is placed past the RAM, and each remaining drive is placed past the previous one.
+
+The preferred file-system type is `ext2`.
+This is because `ext2` image files can be easily created with the `xgenext2fs` command-line utility (a Cartesi fork of `genext2fs`) and manipulated with `e2ls`, `e2cp`, `e2rm`, etc.
+All of these utilities come pre-installed in the `cartesi/machine-emulator-docs` Docker image (the `e2tools` package also provides `e2ls`, `e2cp`, and `e2rm` individually for Ubuntu hosts).
+Support for `ext4` is also enabled by default in the kernel.
+(Support for additional file-systems can be enabled by modifying the configuration that [`cartesi/machine-linux-image`](https://github.com/cartesi/machine-linux-image) uses to produce `linux.bin`.)
+
+For example,
+```{.bash key=foo_ext2 outputs=foo.ext2 replace=source}
+trap 'rm -rf foo foo.tar' EXIT
+rm -rf foo
+# docs:begin
+mkdir foo
+echo "Hello world!" > foo/bar.txt
+tar \
+    --sort=name \
+    --mtime="2022-01-01" \
+    --owner=1000 \
+    --group=1000 \
+    --numeric-owner \
+    -cf foo.tar \
+    --directory=foo .
+xgenext2fs \
+    -fzB 4096 \
+    -i 4096 \
+    -a foo.tar \
+    foo.ext2
+# docs:end
+```
+
+:::note
+The flags above are the base set used in all `xgenext2fs` examples in this documentation.
+The `-a foo.tar` flag tells `xgenext2fs` to populate the image from a `tar` archive rather than from a directory tree.
+The `-f` (faketime) flag zeros the modification times that `xgenext2fs` would otherwise read from the inputs.
+The `-z` flag writes a sparse file, leaving unwritten blocks as holes on disk.
+The `-B 4096` flag sets the block size to 4096 bytes.
+The `-i 4096` flag requests one inode per 4096 bytes of data.
+
+The tar detour is what makes the output reproducible.
+Running `xgenext2fs` directly on a directory tree would record modification times and user and group IDs, and would traverse the directory in an unspecified order.
+The `-f` flag fixes the timestamp problem, but does nothing about the rest.
+The `tar` invocation above pins the file order (`--sort=name`), the timestamps (`--mtime`), and the user and group IDs (`--owner`, `--group`, `--numeric-owner`).
+`xgenext2fs` then walks the archive in deterministic order and emits a byte-identical file-system on every run.
+:::
+
+The image can be loaded as a flash drive:
+```{.bash key=cat_foo_bar vars=foo_ext2->foo_ext2/foo.ext2/path outputs=config-cat-foo-bar.lua replace=source}
+ln -sf "$foo_ext2" .
+# docs:begin
+cartesi-machine \
+    --no-init-splash \
+    --flash-drive="label:foo,data_filename:foo.ext2" \
+# docs:begin null
+    --store-config=config-cat-foo-bar.lua \
+# docs:end null
+    -- "cat /mnt/foo/bar.txt"
+# docs:end
+```
+Here, a flash drive with label `foo` is initialized with the contents of an `ext2` file-system in the image file `foo.ext2`.
+The Cartesi-provided `/usr/sbin/cartesi-init` mounts this as `/mnt/foo`.
+The command executed in the machine simply copies the contents of `/mnt/foo/bar.txt` to the terminal.
+The output is
+```{replace=cat_foo_bar}
+```
+
+### Persistent flash drives and NVRAMs
+
+By default, the emulator does *not* modify the image files associated to any of its memory ranges (such as the RAM, flash drives, and NVRAMs).
+However, since these image files can be very large, the emulator does not pre-allocate any host memory for them.
+Instead, it uses the operating system's memory mapping capabilities.
+The operating system reads to host memory only those pages from the image file that are actually read by code executing in the guest.
+(Naturally, when a state hash is requested, all image files are read from disk in their entirety and processed. See below.)
+These image files are mapped to host memory in a *copy-on-write* fashion.
+When code running in the guest causes the emulator to write to a mapped image file, the operating system makes a copy of the page before modification and replaces the mapping to point to the fresh copy.
+The image files are never written to.
+(The `--dump-memory-ranges` command-line option can be used to inspect the modified copies for debugging purposes. See below.)
+
+:::note
+The entrypoint commands executed by the Cartesi-provided `/usr/sbin/cartesi-init` run as the unprivileged user `dapp`.
+By default, every flash drive is mounted with the ownership and permissions baked into its image file, which typically means its root directory is owned by `root`.
+As a result, `dapp` can read the drive but cannot write to it.
+To allow writes, pass `user:dapp` to the `--flash-drive` command-line option so the emulator changes the owner of the drive's mount point to `dapp` after mounting.
+The same is true of NVRAMs: by default, they are only writeable by `root`.
+Alternatively, the `--user=root` command-line option causes `/usr/sbin/cartesi-init` to run commands as `root`, which can write to the drive without any ownership changes.
+For safety, running as `dapp` is preferred.
+:::
+
+For example, running the machine
+```{.bash key=not_shared_flash vars=foo_ext2->foo_ext2/foo.ext2/path replace=source}
+ln -sf "$foo_ext2" .
+# docs:begin
+cartesi-machine \
+    --no-init-splash \
+    --flash-drive="label:foo,data_filename:foo.ext2,user:dapp" \
+    -- "ls /mnt/foo/*.txt && cp /mnt/foo/bar.txt /mnt/foo/baz.txt && ls /mnt/foo/*.txt"
+# docs:end
+```
+produces the output
+```{replace=not_shared_flash}
+```
+indicating that the file-system was modified, at least from the perspective of the guest.
+However, inspecting the `foo.ext2` image file from outside the emulator shows it is unchanged.
+```{.bash key=e2ls_not_shared_foo_ext2 replace=source vars=foo_ext2->foo_ext2/foo.ext2/path}
+ln -fs "$foo_ext2" .
+# docs:begin
+e2ls -aln foo.ext2:*.txt
+# docs:end
+```
+
+```{.text replace=e2ls_not_shared_foo_ext2}
+```
+
+This behavior is appropriate when the flash drives will only be used as inputs.
+For output flash drives, guest changes to the drives must reflect on the associated image files.
+For that purpose, the parameter `shared` can be passed to command-line option `--flash-drive`, causing the image files to be mapped to host memory in a *shared* fashion.
+For example,
+```{.bash key=shared_flash replace=source vars=foo_ext2->foo_ext2/foo.ext2/path outputs=foo.ext2}
+cp -f "$foo_ext2" .
+# docs:begin
+cartesi-machine \
+    --no-init-splash \
+    --flash-drive="label:foo,data_filename:foo.ext2,shared,user:dapp" \
+    -- "ls /mnt/foo/*.txt && cp /mnt/foo/bar.txt /mnt/foo/baz.txt && ls /mnt/foo/*.txt"
+# docs:end
+```
+produces exactly the same output as before.
+However, `e2ls` now shows the image file `foo.ext2` has indeed been modified.
+```{.bash key=e2ls_shared_foo_ext2 replace=source vars=foo_ext2->shared_flash/foo.ext2/path}
+ln -sf "$foo_ext2" .
+# docs:begin
+e2ls -aln foo.ext2:*.txt
+# docs:end
+```
+
+```{.text replace=e2ls_shared_foo_ext2/both}
+```
+
+### Limiting execution
+
+The machine's processor includes a control and status register (CSR), named `mcycle`, that starts at 0 and is incremented after every instruction cycle.
+By default, the `cartesi-machine` utility only returns when the machine halts (or performs a manual yield), as the [introductory example](#command-line-interface) showed.
+The maximum cycle can be specified with the command-line option `--max-mcycle=<number>`.
+
+```{.bash key=cycles_htif_putchar vars=config->nothing_to_do/config-nothing-to-do.lua/path replace=null}
+ln -sf "$config" .
+lua5.4 $RECIPES_DIR/find-htif-putchar.lua > /dev/null
+```
+
+For example, running
+```{.bash key=limit_exec replace=source vars=cycles->cycles_htif_putchar}
+cartesi-machine --max-mcycle=$cycles
+```
+produces the output
+```{replace=limit_exec}
+```
+Note the execution was interrupted before the splash screen was even completed.
+The ability to limit computation to an arbitrary number of cycles is fundamental to the verifiability of Cartesi Machines, as is explained in detail under the [blockchain perspective](#verification-game).
+
+### State hashes
+
+The `cartesi-machine` utility can also be used to print Cartesi Machine state hashes.
+State hashes are Merkle tree root hashes of the entire 64-bit address space of the Cartesi Machine, where the leaves are aligned 256-bit words.
+(See [Hash-view of state](#hash-view-of-state) for an explanation of Merkle trees.)
+Since Cartesi Machines are transparent, the contents of this address space encompass the entire machine state, including all processor CSRs and general-purpose registers, the contents of RAM, of all flash drives and NVRAMs, and of all other devices connected to the board, and even the state of the uarch.
+State hashes therefore work as cryptographic signatures of the machine, and implicitly of the computation they are about to execute.
+
+To obtain the state hash right before execution starts, use the command-line option `--initial-hash`.
+Conversely, to obtain the state hash right after execution is done, use the option `--final-hash`.
+For example,
+
+```{.bash key=state_hashes_limit_exec vars=cycles->cycles_htif_putchar replace=source}
+cartesi-machine \
+    --max-mcycle=$cycles \
+    --initial-hash \
+    --final-hash
+```
+produces the output
+```{key=reorder_state_hashes_limit_exec vars=err->state_hashes_limit_exec/stderr/path,out->state_hashes_limit_exec/stdout/path replace=stdout}
+# stderr comes mixed with stdout in an unfortunate order, so we reorder them
+cat $err | head -n 1
+cat $out
+echo
+cat $err | tail -n +2
+```
+
+```{.bash key=state_hashes_initial vars=hashes->state_hashes_limit_exec/stderr/path replace=null}
+cat $hashes \
+    | $RECIPES_DIR/find-hash.sh 0 \
+    | $RECIPES_DIR/trunc8.sh
+```
+The initial state hash [...]{replace=state_hashes_initial} is the Merkle tree root hash for the initial Cartesi Machine state.
+Since Cartesi Machines are reproducible, the initial state hash also works as a *promise* on the result of the entire computation.
+
+```{.bash key=state_hashes_final_limit_exec vars=cycles->cycles_htif_putchar,log->state_hashes_limit_exec/both/path replace=null}
+cat $log \
+    | $RECIPES_DIR/find-hash.sh "$cycles" \
+    | $RECIPES_DIR/trunc8.sh
+```
+In other words, the &ldquo;final state hash&rdquo; [...]{replace=state_hashes_final_limit_exec} is the &ldquo;only&rdquo; possible outcome for the `--final-hash` at cycle []{replace=cycles_htif_putchar/stderr}, given the result of the `--initial-hash` operation was [...]{replace=state_hashes_initial}.
+
+:::info
+The scare quotes around &ldquo;only&rdquo; are pedantic.
+It is true that there are a multitude of machine states that produce the same state hash.
+After all, the Keccak-256 state hashes fit in 256 bits, whereas machine states can take gigabytes.
+There are therefore many more possible machine states than possible state hashes.
+By the pigeonhole principle, there must be multiple machines with the same hash (i.e., hash collisions).
+However, given only the state hash, finding a Cartesi Machine with that state hash should be virtually impossible.
+Given a Cartesi Machine and its state hash, finding a *second* (distinct) Cartesi Machine with the same state hash should also be virtually impossible.
+Even finding two different Cartesi Machines that have the same state hash (any hash) should be virtually impossible.
+Cryptographic hash functions, such as Keccak-256, were designed *specifically* to have these properties.
+:::
+
+Allowing the machine to run until it halts
+
+```{.bash key=state_hashes_no_limit_exec replace=source}
+cartesi-machine \
+    --initial-hash \
+    --final-hash
+```
+produces instead the output
+```{key=reorder_state_hashes_no_limit_exec vars=err->state_hashes_no_limit_exec/stderr/path,out->state_hashes_no_limit_exec/stdout/path replace=stdout}
+# stderr comes mixed with stdout in an unfortunate order, so we reorder them
+cat $err | head -n 1
+cat $out
+cat $err | tail -n +2
+```
+Naturally, the initial state hash is the same as before.
+
+```{.bash key=state_hashes_cycles_no_limit_exec vars=log->state_hashes_no_limit_exec/both/path replace=null}
+cat $log | $RECIPES_DIR/last-cycles.sh
+```
+
+```{.bash key=state_hashes_final_no_limit vars=cycles->state_hashes_cycles_no_limit_exec/stdout,hashes->state_hashes_no_limit_exec/stderr/path replace=null}
+cat $hashes \
+    | $RECIPES_DIR/find-hash.sh "$cycles" \
+    | $RECIPES_DIR/trunc8.sh
+```
+However, the final state hash [...]{replace=state_hashes_final_no_limit} now pertains to cycle []{replace=state_hashes_cycles_no_limit_exec}, where the machine is halted.
+This is the &ldquo;only&rdquo; possible state hash for a *halted* machine that started from state hash [...]{replace=state_hashes_initial}.
+
+### Persistent Cartesi Machines
+
+At any point in their execution, Cartesi Machines can be stored to disk.
+A stored machine can later be loaded to continue its execution from where it left off.
+To store a machine to a given `<directory>`, use the command-line option `--store=<directory>`.
+(In `<directory>`, the `%h` escape will be replaced by the state hash in hex.)
+The machine is stored as it was right before `cartesi-machine` returns to the command line.
+For example, to store the machine corresponding to state hash [...]{replace=state_hashes_final_limit_exec}
+```{.bash key=persistent_htif_putchar replace=source outputs=dirname vars=cycles->cycles_htif_putchar}
+\rm -rf machine-????????
+# docs:begin
+cartesi-machine \
+    --max-mcycle=$cycles \
+    --store="machine-%8h"
+# docs:end
+    ls -d machine-* > dirname
+```
+
+This command creates a directory []{replace=persistent_htif_putchar/dirname}, containing a variety of files that allow the Cartesi Machine emulator to recreate a machine state.
+Every image file is copied into the directory, so no external dependencies remain.
+
+:::note
+If the machine initialization involved large image files or a considerable amount of RAM, this operation may consume significant disk space.
+It will also take the time required by the copying of image files into the directory, and by the computation of the state hash.
+:::
+
+If the directory already exists, the operation will fail.
+(This prevents the overwriting of a Cartesi Machine by mistake.)
+Once created, the directory can be compressed and transferred to other hosts.
+To restore the corresponding Cartesi Machine, use the command-line option `--load=<directory>`.
+For example,
+```{.bash key=persistent_htif_putchar_reload replace=source vars=persistent_htif_putchar,dirname->persistent_htif_putchar/dirname}
+ln -sf "$persistent_htif_putchar/$dirname" .
+# docs:begin
+cartesi-machine \
+    --load="$dirname" \
+    --initial-hash \
+    --final-hash
+# docs:end
+```
+produces the output
+```{key=reorder_persistent_htif_putchar_reload vars=err->persistent_htif_putchar_reload/stderr/path,out->persistent_htif_putchar_reload/stdout/path replace=stdout}
+# here --load prints a line before the initial hash, so keep the first two
+cat $err | head -n 2
+cat $out
+cat $err | tail -n +3
+```
+Note that, other than `--load`, no initialization command-line options were used.
+These initializations were used to define the machine before it was stored: their values are implicitly encoded in the stored state.
+The machine continues from where it left off, and reaches the same final state hash [...]{replace=state_hashes_final_no_limit}, as if it had never been interrupted.
+
+Note also that the initial state hash [...]{replace=state_hashes_final_limit_exec} after `--load` matches the final state hash before `--store`.
+After all, they are state hashes concerning the state of the same machine at the same cycle.
+`--load` verifies the archive format version recorded in the stored machine, and the pre-store and post-load state hashes are equal because the same machine state is restored.
+
+The `cartesi-machine-stored-hash` command-line utility can be used to extract the state hash from a stored Cartesi Machine.
+The command
+```{.bash key=persistent_htif_putchar_stored_hash replace=source vars=persistent_htif_putchar,dirname->persistent_htif_putchar/dirname}
+ln -sf "$persistent_htif_putchar/$dirname" .
+# docs:begin
+cartesi-machine-stored-hash $dirname
+# docs:end
+```
+produces the output
+```{replace=persistent_htif_putchar_stored_hash}
+```
+
+### Running as root
+
+Starting at version 4.0 of `rootfs.ext2`, the Cartesi-provided `/usr/sbin/cartesi-init` script runs the entrypoint command as []{replace=run_as_dapp}.
+This can be seen by running:
+```{.bash key=run_as_dapp replace=source}
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    -- id
+```
+It shows the user and group are indeed `dapp`:
+```{replace=run_as_dapp}
+```
+To instead run your guest application as `root`, pass the `--user=root` command-line option:
+```{.bash key=run_as_root replace=source}
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    --user=root \
+    -- id
+```
+The output now shows the user and group are `root`:
+```{replace=run_as_root}
+```
+
+Running as root is not recommended.
+To perform setup tasks that require elevated permissions, use instead the `--append-init` command-line option:
+
+```{.bash key=append_init replace=source}
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    --append-init="echo Before init ends: && id" \
+    -- "echo After entrypoint starts: && id"
+```
+This runs the init part as `root`, but the entrypoint part as `dapp`:
+```{replace=append_init}
+```
+
+The `--append-init-file=<filename>` command-line option works like `--append-init`, but appends to init the entire contents of file `<filename>`.
+
+### Cartesi Machine templates
+
+*Templates* are one of the key uses for Cartesi Machines stored to disk.
+Cartesi Machine templates are machines in which the contents of one or more flash drives or NVRAMs are still unknown.
+To put it another way, Cartesi Machine templates behave like functions whose parameters are the yet-to-be-defined contents of these drives.
+
+As discussed in detail under [the blockchain perspective](#hash-view-of-state), starting from template hashes, the hashes of the drives, and a small amount of additional information, it is possible to obtain the state hash of the *instantiated template*&mdash;the state hash for a Cartesi Machine with drives replaced by their actual contents.
+This is how a smart contract can specify a computation to be performed off-chain over arbitrary input.
+Starting from the template hash, and in possession of the drive hashes, it instantiates the template, generating the initial state hash for the corresponding Cartesi Machine.
+
+As an example, consider a Cartesi Machine that operates as an arbitrary-precision arithmetic expression evaluator.
+The machine will take the expression in text format from an input NVRAM labeled `input`, and will copy the output in text format into an output NVRAM labeled `output` (`shared`, of course, so the output persists after the emulator is done).
+
+NVRAMs bind directly to a memory-backed UIO device exposed inside the guest as `/dev/uioN`.
+Unlike flash drives, they have no file-system layer and no page cache between the guest and the underlying memory range, so writes are immediately visible to the emulator and there is no need to flush a cache before snapshotting.
+This makes NVRAMs faster than flash drives for cases where the guest only needs raw access to a region of bytes.
+
+```{.bash key=calc_pipeline replace=null}
+$'readmmap input | lua5.4 -e \'print((string.unpack("z", io.read("a"))))\' | bc | writemmap output'
+```
+
+Because UIO devices do not support ordinary `read()` or `write()` against the device file, the machine guest utilities include the `readmmap` and `writemmap` tools to read and write NVRAMs.
+They resolve the label, `mmap()` the device, and copy bytes to/from standard input or standard output.
+Both also work on flash drives.
+
+The `bc` command-line utility is the perfect tool to evaluate the arithmetic expressions.
+The command passed to `cartesi-machine` below uses `readmmap` to read the contents of the input NVRAM, extracts a zero-terminated string from it using a tiny Lua script run by the `lua5.4` interpreter, pipes the result through `bc`, and uses `writemmap` to copy the result back into the output NVRAM.
+Here is the sample playground session
+
+```{.bash key=calc_run vars=pipeline->calc_pipeline/body.sh outputs=output.raw,config-calculator.lua replace=source}
+trap 'rm -f input.raw' EXIT
+# docs:begin
+truncate -s 4K output.raw
+echo "6*2^1024 + 3*2^512" > input.raw
+truncate -s 4K input.raw
+cartesi-machine \
+    --no-init-splash \
+    --nvram="label:input,length:1<<12,data_filename:input.raw" \
+    --nvram="label:output,length:1<<12,data_filename:output.raw,shared,user:dapp" \
+# docs:begin null
+    --store-config=config-calculator.lua \
+# docs:end null
+    -- $pipeline
+# docs:end
+```
+
+:::note
+The `$'...'` form here is bash's ANSI-C-quoted string, used throughout the manual for entrypoint commands.
+It passes the contents to `cartesi-machine` as a single argument, leaves host-side variable references like `$i` unexpanded (so they reach the guest shell verbatim), and accepts `\'` as an escape for a single quote inside the string.
+This last property matters when the entrypoint wraps a single-quoted sub-command, such as a `lua5.4 -e '...'` invocation.
+:::
+
+Using the `truncate` command-line utility, the session creates a 4KiB file `output.raw` containing only zeros to serve as the output drive image.
+Then, it creates the `input.raw` file for use as the input drive image containing the expression `6*2^1024 + 3*2^512\n` to be evaluated.
+This file is then padded with zeros to 4KiB in size by the `truncate` utility.
+The session then invokes the `cartesi-machine` command-line utility to evaluate the expression.
+The output of the `cartesi-machine` command is
+```{replace=calc_run}
+```
+Once the emulator returns, a tiny Lua script, run by the `lua5.4` Lua interpreter, prints the contents of the output drive
+```{.bash key=dump_calc_run_result vars=output->calc_run/output.raw/path replace=source}
+ln -sf "$output" .
+# docs:begin
+lua5.4 -e 'print((string.unpack("z", io.read("a"))))' < output.raw
+# docs:end
+```
+which reads
+```{replace=dump_calc_run_result}
+```
+This is indeed the result of 6&times;2<sup>1024</sup>+3&times;2<sup>512</sup>.
+
+To create the template, simply omit the input and output image filenames.
+This will cause the Cartesi Machine to assume both drives are filled with zeros.
+Then, limit the computation with `--max-mcycle=0`, to prevent the Cartesi Machine from running.
+Finally, use the `--store="calculator-template"` command-line option to store the Cartesi Machine template.
+The `--final-hash` command-line option prints the resulting template hash.
+```{.bash key=calc_template vars=pipeline->calc_pipeline/body.sh outputs=calculator-template replace=source}
+rm -rf calculator-template
+# docs:begin
+cartesi-machine \
+    --no-init-splash \
+    --nvram="label:input,length:1<<12" \
+    --nvram="label:output,length:1<<12,user:dapp" \
+    --max-mcycle=0 \
+    --final-hash \
+    --store="calculator-template" \
+    -- $pipeline
+# docs:end
+```
+The result is as follows
+```{replace=calc_template}
+```
+The directory `calculator-template/` now contains the Cartesi Machine template.
+And indeed, running
+
+```{.bash key=calc_template_hash vars=template->calc_template/calculator-template/path replace=source}
+ln -sf "$template" .
+# docs:begin
+cartesi-machine-stored-hash calculator-template/
+# docs:end
+```
+we can see from the output
+```{replace=calc_template_hash}
+```
+
+```{.bash key=calc_template_trunc_hash vars=hash->calc_template_hash/stdout/path replace=null}
+cat $hash | $RECIPES_DIR/trunc8.sh
+```
+that the stored template hash is [...]{replace=calc_template_trunc_hash}.
+
+Templates are typically used by programs that control the emulator with the C++, Lua, or JSON-RPC interfaces.
+
+The `--replace-memory-range=label:<label>,data_filename:<filename>` command-line option of the `cartesi-machine` utility can be used to replace an existing memory range right after a machine is loaded.
+The memory range can be identified by `label`, by `start` and `length`, or both.
+
+This functionality can be used to test templates.
+For example, the following command loads the calculator template, and replaces its pristine input NVRAM with one containing the contents of the `input.raw` file.
+Then, it replaces the pristine output NVRAM so the machine saves results in the file `output.raw`.
+
+```{.bash key=calc_template_instantiated vars=template->calc_template/calculator-template/path replace=source}
+ln -sf "$template" .
+# docs:begin
+rm -f output.raw
+truncate -s 4K output.raw
+echo "6*2^1024 + 3*2^512" > input.raw
+truncate -s 4K input.raw
+cartesi-machine \
+    --no-init-splash \
+    --load="calculator-template" \
+    --replace-memory-range="label:input,data_filename:input.raw" \
+    --replace-memory-range="label:output,data_filename:output.raw,shared"
+lua5.4 -e 'print((string.unpack("z", io.read("a"))))' < output.raw
+# docs:end
+```
+The result of running the command is, as expected,
+```{replace=calc_template_instantiated/stdout}
+```
+
+### State value proofs
+
+```{.lua key=hash_tree_constants replace=null outputs=log2_word_size,word_size,log2_root_size,log2_leaf_count,log2_max_output_count,hash_size}
+-- Dump the hash-tree and CMIO constants exposed by the cartesi module, one
+-- file per constant, so the surrounding text can quote them.
+local cartesi = require("cartesi")
+local log2_word_size = cartesi.HASH_TREE_LOG2_WORD_SIZE
+local log2_root_size = cartesi.HASH_TREE_LOG2_ROOT_SIZE
+local word_size = 1 << log2_word_size
+
+-- Writes tostring(value) to the file `path`; raises if it cannot be opened.
+local function writefile(path, value)
+    local out = assert(io.open(path, "w"))
+    out:write(tostring(value))
+    out:close()
+end
+
+writefile("log2_word_size", log2_word_size)
+writefile("word_size", word_size)
+writefile("log2_root_size", log2_root_size)
+-- Difference between the root and word log2 sizes.
+writefile("log2_leaf_count", log2_root_size - log2_word_size)
+writefile("log2_max_output_count", cartesi.CMIO_LOG2_MAX_OUTPUT_COUNT)
+writefile("hash_size", cartesi.HASH_SIZE)
+```
+*State value proofs* are proofs that a given node in the Merkle tree of the Cartesi Machine state has a given associated hash.
+Each Merkle tree node covers a contiguous range of the machine's 64-bit address space.
+The size of a range is always a power of 2 (i.e., 2 raised to the power `<log2_size>`).
+Since the leaves have size []{replace=hash_tree_constants/word_size} bytes, the valid values for `<log2_size>` are []{replace=hash_tree_constants/log2_word_size}&hellip;[]{replace=hash_tree_constants/log2_root_size}.
+The range corresponding to each node starts at an `<address>` that is a multiple of its size.
+
+The `cartesi-machine` command-line utility can generate proofs concerning the contents of the machine state.
+To generate a proof concerning the state as it is before the machine starts running, use the command-line option
+`--initial-proof=address:<number>,log2_size:<number>[,filename:<filename>]` or `--initial-proof=label:<label>[,filename:<filename>]`.
+The label form of the option searches for a flash drive or NVRAM with that label, from which it automatically obtains the corresponding `address` and `log2_size`.
+For proofs concerning the state after the emulator is done, use `--final-proof` instead.
+The proofs are output as Lua tables that can be loaded with the `require` function.
+To output JSON objects instead, add the `format:json` sub-key, as in `--initial-proof=label:<label>,filename:<filename>,format:json`.
+When `format:` is omitted, the format is inferred from the filename extension (`.json` or `.lua`), defaulting to Lua.
+In either case, the filename field is optional.
+When provided, the proof will be written to the corresponding file.
+Otherwise, the contents will be displayed on screen.
+
+For example, to generate a proof that the Cartesi Machine template above indeed contains a pristine input drive, use the command line
+```{.bash key=proofs_pristine_run vars=template->calc_template/calculator-template/path replace=source outputs=pristine-input-proof.lua,root_hash,target_hash,target_address,log2_target_size}
+ln -sf "$template" .
+# docs:begin
+cartesi-machine \
+    --no-init-splash \
+    --load="calculator-template" \
+    --max-mcycle=0 \
+    --initial-hash \
+    --initial-proof="label:input,filename:pristine-input-proof.lua"
+# docs:end
+# Post-processing after the docs:end marker: extract the proof fields quoted
+# by the surrounding text. The two hashes are piped through `hex --encode` and
+# trunc8.sh; the address is formatted as hexadecimal and the log2 size is
+# written as printed.
+lua5.4 -e 'input_proof = require"pristine-input-proof"; print(input_proof.root_hash)' \
+    | hex --encode \
+    | $RECIPES_DIR/trunc8.sh > root_hash
+lua5.4 -e 'input_proof = require"pristine-input-proof"; print(input_proof.target_hash)' \
+    | hex --encode \
+    | $RECIPES_DIR/trunc8.sh > target_hash
+lua5.4 -e 'input_proof = require"pristine-input-proof"; print(string.format("0x%x", input_proof.target_address))' > target_address
+lua5.4 -e 'input_proof = require"pristine-input-proof"; print(input_proof.log2_target_size)' > log2_target_size
+```
+
+The output of the command is
+```{replace=proofs_pristine_run}
+```
+
+In addition, the `pristine-input-proof.lua` file now contains a Lua table with the requested proof.
+The value of field `root_hash` is the expected initial state hash [...]{replace=proofs_pristine_run/root_hash} seen in the output of the `cartesi-machine` command.
+The `target_address` value []{replace=proofs_pristine_run/target_address} is the start of the input NVRAM.
+The `log2_target_size` value []{replace=proofs_pristine_run/log2_target_size} refers to the size of the 4KiB input NVRAM.
+The `target_hash` value [...]{replace=proofs_pristine_run/target_hash} in the proof gives the hash of the input NVRAM.
+
+The hash of the input NVRAM can also be computed externally with the `cartesi-hash-tree-hash` command-line utility.
+The utility can produce the hash of any file with a power-of-2 size.
+The `--log2-root-size=<log2_size>` option specifies the size.
+If an input file is smaller than the specified size, the utility assumes the missing data is composed entirely of bytes 0.
+The utility deals efficiently with zero paddings of any size because pristine hashes for all power-of-2 sizes can be precomputed.
+For example, to quickly generate the hash for a pristine input with 4KiB size, run
+```{.bash key=pristine_input_raw_hash replace=source}
+head -c 0 | cartesi-hash-tree-hash --log2-root-size=12
+```
+```{.bash key=pristine_input_raw_trunc_hash vars=hash->pristine_input_raw_hash/stdout/path replace=null}
+cat $hash | $RECIPES_DIR/trunc8.sh
+```
+to obtain
+```{replace=pristine_input_raw_hash}
+```
+As expected, the hash values match.
+
+The `sibling_hashes` array contains the hashes of the siblings to all nodes in the path from the root all the way down to the target node (excluding the root, which has no sibling).
+In a process explained in the [blockchain perspective](#hash-view-of-state), using the `target_address` field, the `target_hash` hash, and the `sibling_hashes` array, it is possible to go up the tree computing the hashes along the path, until the root hash is produced.
+If the root hash obtained by this process matches the expected root hash, the proof is valid.
+Otherwise, something is amiss.
+
+To compute the hash for the desired `input.raw` file with contents `6*2^1024 + 3*2^512\n`, padded with zeros, run
+```{.bash key=input_raw_hash replace=source}
+echo "6*2^1024 + 3*2^512" | cartesi-hash-tree-hash --log2-root-size=12
+```
+```{.bash key=input_raw_trunc_hash vars=hash->input_raw_hash/stdout/path replace=null}
+cat $hash | $RECIPES_DIR/trunc8.sh
+```
+to obtain
+```{replace=input_raw_hash}
+```
+
+The initial state hash for the instantiated template can be seen with the `cartesi-machine` command-line utility
+```{.bash key=input_raw_proof vars=template->calc_template/calculator-template/path outputs=input-proof.lua,root_hash,target_hash replace=source}
+ln -sf "$template" .
+rm -f input-proof.lua input.raw
+# docs:begin
+echo "6*2^1024 + 3*2^512" > input.raw
+truncate -s 4K input.raw
+cartesi-machine \
+    --no-init-splash \
+    --load="calculator-template" \
+    --replace-memory-range="label:input,data_filename:input.raw" \
+    --initial-hash \
+    --initial-proof="label:input,filename:input-proof.lua" \
+    --max-mcycle=0
+# docs:end
+# Post-processing after the docs:end marker: extract the root and target
+# hashes from the generated proof, piping each through `hex --encode` and
+# trunc8.sh.
+lua5.4 -e 'input_proof = require"input-proof"; print(input_proof.root_hash)' \
+    | hex --encode \
+    | $RECIPES_DIR/trunc8.sh > root_hash
+lua5.4 -e 'input_proof = require"input-proof"; print(input_proof.target_hash)' \
+    | hex --encode \
+    | $RECIPES_DIR/trunc8.sh > target_hash
+```
+This produces the output
+
+```{replace=input_raw_proof}
+```
+
+In addition, the `input-proof.lua` file now contains a Lua table with the requested proof, which is produced after the input NVRAM has been replaced.
+The `target_hash` value [...]{replace=input_raw_proof/target_hash} reflects the hash computed for the input.
+The `root_hash` value [...]{replace=input_raw_proof/root_hash} differs from [...]{replace=calc_template_trunc_hash} obtained for the template, as expected, and matches the initial hash printed by the utility.
+Moreover, the `sibling_hashes` entries in the template Cartesi Machine and in the instantiated Cartesi Machine remain the same, reflecting the fact that there were no other changes in the machine's initial state.
+
+Using a process similar to the proof verification described above, it is possible to go up the Merkle tree for the template using the `sibling_hashes` array in the proof, but starting from the hash [...]{replace=input_raw_trunc_hash} of the desired `input.raw` image rather than hash [...]{replace=pristine_input_raw_trunc_hash} of the template's pristine NVRAM.
+The result would be the same root hash as that of the instantiated template.
+
+Another useful proof is the one for the *output* drive, once the machine is halted.
+To obtain this proof, run
+
+```{.bash key=output_raw_proof outputs=output.raw,output-proof.lua,root_hash,target_hash vars=template->calc_template/calculator-template/path replace=source}
+# Start from a clean slate: remove any proof file and NVRAM images left over
+# from a previous run, then link the stored template into the working directory.
+rm -f output-proof.lua input.raw output.raw
+ln -sf "$template" .
+# docs:begin
+truncate -s 4K output.raw
+echo "6*2^1024 + 3*2^512" > input.raw
+truncate -s 4K input.raw
+cartesi-machine \
+    --no-init-splash \
+    --load="calculator-template" \
+    --replace-memory-range="label:input,data_filename:input.raw" \
+    --replace-memory-range="label:output,data_filename:output.raw,shared" \
+    --final-hash \
+    --final-proof="label:output,filename:output-proof.lua"
+# docs:end
+lua5.4 -e 'proof = require"output-proof"; print(proof.root_hash)' | hex --encode \
+    | $RECIPES_DIR/trunc8.sh > root_hash
+lua5.4 -e 'proof = require"output-proof"; print(proof.target_hash)' | hex --encode \
+    | $RECIPES_DIR/trunc8.sh > target_hash
+```
+
+This produces the output
+
+```{replace=output_raw_proof}
+```
+
+The `root_hash` field in the proof [...]{replace=output_raw_proof/root_hash} matches the final state hash output by the `cartesi-machine` command-line utility.
+The `target_hash` field [...]{replace=output_raw_proof/target_hash} is the hash of the `output.raw` NVRAM.
+To compute it independently, use the `cartesi-hash-tree-hash` command-line utility
+```{.bash key=proofs_output_raw_hash vars=output_raw->output_raw_proof/output.raw/path replace=source}
+ln -sf "$output_raw" .
+# docs:begin
+cartesi-hash-tree-hash --log2-root-size=12 < output.raw
+# docs:end
+```
+```{replace=proofs_output_raw_hash}
+```
+
+The `cartesi-machine` command-line utility accepts an arbitrary number of `--initial-proof` and `--final-proof` parameters.
+They are computed one-by-one, and either printed or stored in the specified files, as requested.
+
+To read more about proofs, refer to [the blockchain perspective](#hash-view-of-state).
+
+### Remote Cartesi Machines
+
+The `cartesi-machine` command-line utility, as used until now, has always instantiated its own local Cartesi Machine.
+However, it can also be used to control a remote Cartesi Machine.
+Remote Cartesi Machines are managed by the `cartesi-jsonrpc-machine` server.
+The server exposes a JSON-RPC interface through which the `cartesi-machine` command-line utility (or any other software) can control the machine remotely.
+
+To avoid confusion, it is best to run the server and client in separate shells in the playground container.
+Leaving the existing shell for the client, open a separate shell for the server (for example, by running `docker exec -it playground /bin/bash`), then run
+```{.bash key=cmdline_remote outputs=server,client replace=source/server}
+{
+# docs:begin server
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8080
+# docs:end server
+} > server 2>&1 &
+srv_pid=$!
+{
+# docs:begin client
+while ! cartesi-machine \
+    --remote-address=127.0.0.1:8080 \
+    --remote-health-check 2>/dev/null; do sleep 1; done
+cartesi-machine \
+    --remote-address=127.0.0.1:8080 \
+    --remote-shutdown
+# docs:end client
+} > client 2>&1
+client_status=$?
+# If the client failed, it never sent SHUTDOWN, so the server would hang forever
+[ "$client_status" -ne 0 ] && kill "$srv_pid" 2>/dev/null
+wait "$srv_pid"
+```
+The `--server-address=<address>` command-line option specifies the address and port the server will listen on.
+
+:::note
+In this case, since we selected `127.0.0.1:8080`, the client must run in the same container in order to communicate with the server.
+To be accessible from outside the container, the `--server-address` option would have to refer to an address and port that were _exposed_ by the container.
+:::
+
+To instruct the `cartesi-machine` command-line utility to connect with the server, add the command-line option `--remote-address=<address>` to specify the remote server to connect to.
+The option `--remote-shutdown` causes the server to be shut down by the client when the client exits.
+(Otherwise, the server will remain available for the next client.)
+The option `--remote-health-check` causes the client to connect to the server, confirm it is responsive, and exit without instantiating a machine.
+All other options work as before.
+Keep in mind that any image files referred to by an option passed to the command-line utility `cartesi-machine` must be accessible to the `cartesi-jsonrpc-machine` server (and not necessarily to the client).
+Additionally, terminal output for the Cartesi Machine instantiated by the server will appear in the remote shell where the server was run (not the client's shell).
+Terminal input, when enabled, must also happen via the remote shell.
+
+With this in mind, running the command in the client shell
+```{.bash replace=cmdline_remote/source/client}
+```
+produces the following output on the client shell
+```{replace=cmdline_remote/client}
+```
+and the following output on the server shell
+```{replace=cmdline_remote/server}
+```
+
+The client first connects to the remote address and prints the connection status.
+It then asks the server to instantiate a machine (by sending the configuration over) and run it.
+The machine that runs in the server prints out the splash screen, boots Linux, and cedes control to the
+Cartesi-provided `/usr/sbin/cartesi-init` script.
+The `/usr/sbin/cartesi-init` script figures out there is nothing to do and halts the machine.
+The client detects the machine is halted and shuts down the server, as requested, printing the final message.
+
+When it is desirable to leave the server running and preserve the instantiated machine, omit the `--remote-shutdown`
+command-line option and add the `--no-remote-destroy` option.
+For example, assuming the remote server has just been run:
+```{.bash key=cmdline_remote_end outputs=begin-end-server,end-client,begin-client replace=source/server}
+{
+# docs:begin server
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8081
+# docs:end server
+} > begin-end-server 2>&1 &
+srv_pid=$!
+{
+# docs:begin begin-client
+while ! cartesi-machine \
+    --remote-address=127.0.0.1:8081 \
+    --remote-health-check 2>/dev/null; do sleep 1; done
+cartesi-machine \
+    --remote-address=127.0.0.1:8081 \
+    --no-remote-destroy \
+    --max-mcycle=1Mi \
+    -- echo "Still here!"
+# docs:end begin-client
+} > begin-client 2>&1
+{
+# docs:begin end-client
+cartesi-machine \
+    --remote-address=127.0.0.1:8081 \
+    --remote-shutdown \
+    --no-remote-create
+# docs:end end-client
+} > end-client 2>&1
+client_status=$?
+# If the shutdown client failed, force the server down so wait returns
+[ "$client_status" -ne 0 ] && kill "$srv_pid" 2>/dev/null
+wait "$srv_pid"
+```
+use the `cartesi-machine` command-line utility to instantiate and run a Cartesi Machine for 2^20 cycles:
+```{.bash replace=cmdline_remote_end/source/begin-client}
+```
+
+The client shell shows:
+```{replace=cmdline_remote_end/begin-client}
+```
+To continue execution of the same Cartesi Machine until it halts, rather than instantiating a new one, use the `cartesi-machine` command-line utility with the option `--no-remote-create`:
+```{.bash replace=cmdline_remote_end/source/end-client}
+```
+The client shell now shows:
+```{replace=cmdline_remote_end/end-client}
+```
+The server shell shows the execution of both sessions:
+```{replace=cmdline_remote_end/begin-end-server}
+```
+
+Remote Cartesi Machines have one ability that local Cartesi Machines lack: they can be _forked_, producing a copy that runs forward independently in a child server while the original is preserved in the parent.
+Inspect-state requests and rejected advance-state requests require that changes to the state of the Rolling Cartesi Machine be reverted.
+One way to implement this is for the host to run the inspect or advance against a fork, then discard it.
+
+### Rolling Cartesi Machines
+
+Applications involving Rolling Cartesi Machines are not designed to interact with the `cartesi-machine` command-line utility.
+Instead, they rely on a variety of software components that allow a front-end to post to the blockchain requests to advance the state of the server.
+The Cartesi Node polls the blockchain for advance-state requests posted by others so a local copy of the server can be kept in sync.
+It also allows a front-end to inspect the state of the server.
+
+Nevertheless, in debugging or prototyping tasks, the `cartesi-machine` command-line utility can simulate the external environment that a guest application (running inside a Rolling Cartesi Machine) would encounter in production.
+To use this functionality, the developer creates a sequence of advance-state requests as numbered files, or a single inspect-state request as a file, and instructs the `cartesi-machine` command-line utility to feed them to the guest application.
+As each request is processed, the utility stores the responses as separate files.
+
+An advance-state request is a single ABI-encoded `EvmAdvance(uint256 chainId, address appContract, address msgSender, uint256 blockNumber, uint256 blockTimestamp, uint256 prevRandao, uint256 index, bytes payload)` calldata blob carrying the fields important for the operation of Cartesi Rollups.
+Recall that, as responses, the guest application can issue _vouchers_, _notices_, _reports_, and _exceptions_.
+In contrast, an inspect-state request carries only a _query_ and, as response, produces only reports and exceptions.
+The query in an inspect-state request consists of an application-specific payload.
+
+Guest applications running inside Rolling Cartesi Machines do not access the network or the file-system directly.
+They communicate with the host through a Cartesi-specific mechanism, detailed under [Communication between guest and host](#communication-between-guest-and-host) in the guest perspective.
+
+In a nutshell, the process is as follows.
+To obtain the next request, the guest application _yields_ control back to the host (in our case, the `cartesi-machine` command-line utility).
+The host writes the next request where the guest can read it and resumes the machine, so the guest application can process it.
+When the guest application emits an output (a voucher, notice, report, or exception), it again yields control to the host so it can collect the output (in our case, saving it to a file or printing it to the terminal) before resuming the machine.
+
+To help debug applications, developers can obtain from Cartesi Rollups, as files, the inputs associated with each advance-state request, so the sequence can be replayed locally in the command line.
+When prototyping, developers can create their own files simulating requests that test the behavior of their guest application under customized conditions.
+
+#### Encoding requests
+
+The `cartesi-rollup-data.lua` command-line utility, available in the `cartesi/machine-emulator-docs` Docker image, can encode advance-state requests and inspect-state queries to files, and decode vouchers, notices, reports, exceptions, and delegate-call vouchers from files.
+The calculator we will run treats the payload of each advance-state request as an arbitrary-precision arithmetic expression and emits the result as a notice.
+The following commands encode six such requests as `input-1.bin` through `input-6.bin`, sharing their common structure through a small `encode_input` shell function, and one inspect-state query as `query.bin`:
+
+```{.bash key=rolling_calc_encode outputs=ls_bin replace=source}
+# docs:begin
+encode_input() {
+  cartesi-rollup-data.lua encode advance <<EOF
+{
+  "chain_id": 0,
+  "app_contract": "0x0000000000000000000000000000000000000000",
+  "msg_sender": "$(printf '0x%040d' "$1")",
+  "block_number": 0,
+  "block_timestamp": 0,
+  "prev_randao": "0x0000000000000000000000000000000000000000000000000000000000000000",
+  "index": $1,
+  "payload": "$(printf '%s\n' "$2" | hex --encode)"
+}
+EOF
+}
+encode_input 1 '6*2^1024 + 3*2^512' > input-1.bin
+encode_input 2 'invalid input' > input-2.bin
+encode_input 3 '2^2048' > input-3.bin
+encode_input 4 '(2^256 - 1) * (2^256 - 1)' > input-4.bin
+encode_input 5 'scale=80; sqrt(2)' > input-5.bin
+encode_input 6 'scale=100; 355/113' > input-6.bin
+cartesi-rollup-data.lua encode inspect > query.bin <<EOF
+{
+  "payload": "$(printf 'scale=70; (1+sqrt(5))/2\n' | hex --encode)"
+}
+EOF
+# docs:end
+ls *.bin > ls_bin
+```
+Listing the files created with `ls *.bin`, we see
+```{.text replace=rolling_calc_encode/ls_bin}
+```
+The six numbered files are advance-state requests, and `query.bin` is an inspect-state query.
+
+#### A simple calculator guest application
+
+We will run an arbitrary-precision arithmetic expression evaluator that outputs, as notices, the result of the computation it receives as the payload of each advance-state request.
+We will rely on the `bc` command-line utility to perform the computations.
+To interact with the `/dev/cmio` Linux device (i.e., to obtain the advance-state request inputs and to generate the notices), we will use the `/usr/bin/rollup` command-line utility.
+
+The `rollup` command-line utility supports the commands `accept`, `reject`, `voucher`, `notice`, `report`, and `exception`.
+It uses JSON objects as inputs and outputs.
+The `accept` and `reject` commands accept or reject the previous request and output the next request.
+For advance-state requests, the output is in the format
+```js
+{
+  "request_type": "advance_state",
+  "data": {
+    "chain_id": <number>,
+    "app_contract": <address>,
+    "msg_sender": <address>,
+    "block_number": <number>,
+    "block_timestamp": <number>,
+    "prev_randao": <hex-uint256>,
+    "index": <number>,
+    "payload": <hex-data>
+  }
+}
+```
+Appropriately, the `notice` command generates a notice.
+The input format is as follows
+```js
+{
+  "payload": <hex-data>
+}
+```
+and the output gives the index of the just-output notice as follows
+```js
+{
+  "index": <number>
+}
+```
+
+The `report` command takes the same input format as `notice`.
+However, since reports are not verifiable, there is no associated index to print out.
+
+Shell scripts become surprisingly powerful with the help of the `rollup`, `hex`, and `jq` command-line utilities.
+A `bc`-based arbitrary precision application, for example, might look like this:
+```{.bash key=rolling_calc_sh include=calc.sh title="calc.sh"}
+```
+
+The loop in the `calc.sh` script calls `rollup accept` or `rollup reject` (shortcuts for `rollup finish`) to accept or reject the previous request and obtain the next one.
+It uses `jq` to read the `request_type` field, which selects the output verb: an advance-state request emits the result as a notice, and an inspect-state request emits it as a report.
+Both kinds of request carry the expression at `.data.payload`, which `jq` extracts.
+The hex-encoded payload is decoded back to bytes by `hex --decode` and passed to `bc`, which outputs the result split into lines terminated by `\`.
+Unfortunately, `bc` does not exit with an error when it detects one.
+Instead, it prints a message to the error stream and exits successfully.
+The `grep .` exits with an error in that case, because the output stream of `bc` will be empty.
+Otherwise, `grep .` simply passes the output through unchanged.
+In that case, the `tr` utility joins the lines back together.
+The joined result is hex-encoded by `hex --encode` and fed to `jq`, which assembles the proper JSON object with a `"payload"` field that is passed to `rollup notice` or `rollup report`, the verb chosen by the request type.
+
+To run `calc.sh`, first create a file-system with the program:
+```{.bash key=calc_ext2 outputs=calc.ext2 replace=source}
+trap 'rm -rf calc calc.tar' EXIT
+rm -rf calc
+ln -sf "$RECIPES_DIR/calc.sh" .
+# docs:begin
+mkdir calc
+cp calc.sh calc
+chmod +x calc/calc.sh
+tar \
+    --sort=name \
+    --mtime="2022-01-01" \
+    --owner=1000 \
+    --group=1000 \
+    --numeric-owner \
+    -cf calc.tar \
+    --directory=calc .
+xgenext2fs \
+    -fzB 4096 \
+    -i 4096 \
+    -a calc.tar \
+    calc.ext2
+# docs:end
+```
+
+Running a Rolling Cartesi Machine in the command line requires using the `cartesi-jsonrpc-machine` server in combination with the `cartesi-machine` client.
+The server provides the fork functionality the client uses to roll the machine state back when an advance-state request is rejected, or after an inspect-state request.
+With the encoded inputs and `calc.ext2` in the working directory, run the remote server with the command
+```{.bash key=rolling_calc_run vars=rolling_calc_encode,calc_ext2->calc_ext2/calc.ext2/path outputs=server,client1,client2,output-0-input-1.bin,output-1-input-3.bin,output-2-input-4.bin,output-3-input-5.bin,output-4-input-6.bin,rejected-output-1-input-2.bin,output-0-input-1-proof.lua,output-1-input-3-proof.lua,output-2-input-4-proof.lua,output-3-input-5-proof.lua,output-4-input-6-proof.lua,input-1-output-hashes-root-hash.bin,input-3-output-hashes-root-hash.bin,input-4-output-hashes-root-hash.bin,input-5-output-hashes-root-hash.bin,input-6-output-hashes-root-hash.bin,input-1-output-hashes-root-hash-proof.lua,input-3-output-hashes-root-hash-proof.lua,input-4-output-hashes-root-hash-proof.lua,input-5-output-hashes-root-hash-proof.lua,input-6-output-hashes-root-hash-proof.lua,epoch-1-state-hash.bin,query-report-0.bin replace=source/server}
+# Link the encoded requests and the calc.ext2 image into the working directory.
+# The directory variable is quoted so a path with whitespace is not word-split;
+# the glob stays outside the quotes so it still expands.
+ln -sf "$rolling_calc_encode"/*.bin .
+rm -f calc.ext2
+ln -sf "$calc_ext2" .
+{
+# docs:begin server
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8082
+# docs:end server
+} > server 2>&1 &
+srv_pid=$!
+{
+# docs:begin client1
+while ! cartesi-machine \
+    --remote-address=127.0.0.1:8082 \
+    --remote-health-check 2>/dev/null; do sleep 1; done
+cartesi-machine \
+    --no-init-splash \
+    --remote-address=127.0.0.1:8082 \
+    --no-remote-destroy \
+    --flash-drive=label:calc,data_filename:calc.ext2,user:dapp \
+    --cmio-advance-state=input_index_begin:1,input_index_end:4,hashes \
+    --final-hash=epoch-1-state-hash.bin \
+    -- /mnt/calc/calc.sh
+# docs:end client1
+} > client1 2>&1
+client1_status=$?
+{
+# docs:begin client2
+cartesi-machine \
+    --no-init-splash \
+    --remote-address=127.0.0.1:8082 \
+    --no-remote-create \
+    --remote-shutdown \
+    --cmio-advance-state=input_index_begin:4,input_index_end:7,last_output_proof:output-1-input-3-proof.lua,hashes \
+    --cmio-inspect-state=query:query.bin,hashes
+# docs:end client2
+} > client2 2>&1
+client2_status=$?
+{ [ "$client1_status" -eq 0 ] && [ "$client2_status" -eq 0 ]; } || kill "$srv_pid" 2>/dev/null
+wait "$srv_pid"
+```
+
+We will run the inputs in two separate epochs against this server, kept alive between runs.
+From a different shell into the same container, run the client to process the first epoch
+```{.bash replace=rolling_calc_run/source/client1}
+```
+This run instantiates the machine from the `calc.ext2` flash drive and advances inputs 1 to 3.
+Passing `--no-remote-destroy` and omitting `--remote-shutdown` leaves both the server and the machine it holds alive for the next epoch.
+
+The client shell shows
+```{replace=rolling_calc_run/client1}
+```
+```{.bash key=rolling_calc_output outputs=first_rx_accepted,hash_before_input1,hash_after_input1,input1_tx_output,input1_rx_accepted,input2_rx_rejected,hash_before_input3 vars=client1->rolling_calc_run/client1/path replace=null}
+$RECIPES_DIR/cycle-of.sh 'Manual yield rx-accepted'   < $client1 > first_rx_accepted
+$RECIPES_DIR/hash-of.sh 'Before input 1'              < $client1 | $RECIPES_DIR/trunc8.sh > hash_before_input1
+$RECIPES_DIR/hash-of.sh 'Before input 1' 2            < $client1 | $RECIPES_DIR/trunc8.sh > hash_after_input1
+$RECIPES_DIR/cycle-of.sh 'Automatic yield tx-output'  < $client1 > input1_tx_output
+$RECIPES_DIR/cycle-of.sh 'Manual yield rx-accepted' 2 < $client1 > input1_rx_accepted
+$RECIPES_DIR/cycle-of.sh 'Manual yield rx-rejected'   < $client1 > input2_rx_rejected
+$RECIPES_DIR/hash-of.sh 'Before input 3'              < $client1 | $RECIPES_DIR/trunc8.sh > hash_before_input3
+```
+
+The client starts by printing information about the remote server it connected to.
+It then runs the machine in a loop, occasionally transferring information in and out.
+The first `manual yield rx-accepted`, at cycle []{replace=rolling_calc_output/first_rx_accepted}, is the point at which the calculator attempted to obtain its first request.
+
+Upon receiving control back, the client prints input index 1 and the state hash [...]{replace=rolling_calc_output/hash_before_input1}.
+It loads `input-1.bin` as the next request, prints the modified state hash [...]{replace=rolling_calc_output/hash_after_input1}, and resumes the machine.
+The calculator evaluates `6*2^1024 + 3*2^512` and emits the result as a notice.
+That emission is an `automatic yield tx-output` at cycle []{replace=rolling_calc_output/input1_tx_output}, which returns control to the client.
+The client collects the emitted output and stores it as `output-0-input-1.bin`.
+The `manual yield rx-accepted` at cycle []{replace=rolling_calc_output/input1_rx_accepted} signals that input index 1 was accepted.
+At this point the client also stores the output hashes root hash the guest reported, as `input-1-output-hashes-root-hash.bin`, and double-checks it against its own local computation of the same hash.
+This hash commits to every output the machine has emitted so far.
+
+The client then loads input index 2 and resumes the machine.
+The payload `invalid input` is not an expression that `bc` understands, so the calculator rejects the request.
+An empty notice is still emitted just before the rejection.
+Shell pipelines run concurrently, so `rollup notice` has already run by the time `bc`'s failure is detected.
+Rejection discards all outputs, such as this notice.
+For debugging purposes, the client saves the notice contents as `rejected-output-1-input-2.bin`.
+The resulting `manual yield rx-rejected` at cycle []{replace=rolling_calc_output/input2_rx_rejected} rolls the machine state back to what it was before the input was processed.
+The state hash before input 3, [...]{replace=rolling_calc_output/hash_before_input3}, is identical to the hash after input 1 was accepted, which confirms the rejected input left no trace.
+
+Input index 3, with payload `2^2048`, is accepted like the first, so the client stores `output-1-input-3.bin` and `input-3-output-hashes-root-hash.bin`.
+On each accept the client also writes the proof that the output hashes root hash occupied the machine's CMIO tx buffer, as `input-1-output-hashes-root-hash-proof.lua` and `input-3-output-hashes-root-hash-proof.lua`.
+The two output proofs for this epoch, `output-0-input-1-proof.lua` and `output-1-input-3-proof.lua`, are written at the end, once all of the epoch's outputs are known.
+Each proves that one of the epoch's outputs belongs to the tree the final output hashes root hash commits to.
+The `--final-hash` option saves the machine state hash at the end of the epoch, as `epoch-1-state-hash.bin`, the state a dispute over this epoch would settle on.
+
+Now run the client to process the second epoch in the same server
+```{.bash replace=rolling_calc_run/source/client2}
+```
+The command-line option `--no-remote-create` reuses the machine where the first epoch left off.
+The output hashes tree inside the machine keeps growing across the epoch boundary on its own.
+The `last_output_proof:output-1-input-3-proof.lua` option is there for the `cartesi-machine` command-line utility alone, which uses the first epoch's last output proof to rebuild its own copy of the output hashes tree as it stood at the end of that epoch.
+With this copy, the output hashes root hash `cartesi-machine` computes for each accepted input matches the one produced inside the emulator, which is what the default `check_output_hashes_root_hash` verifies.
+The copy also lets `cartesi-machine` emit correct proofs, at the right global output indices, for the outputs it collects during this epoch.
+The three inputs evaluate `(2^256 - 1) * (2^256 - 1)`, `sqrt(2)` to 80 decimal places, and `355/113` to 100 decimal places.
+Arbitrary-precision results like these are awkward to compute on the blockchain, whose native arithmetic works on fixed-width 256-bit integers and has no fractions.
+Their outputs continue the global output index, becoming outputs 2, 3, and 4.
+The run passes `--remote-shutdown` to stop the server once the epoch is done.
+
+The client shell now shows
+```{replace=rolling_calc_run/client2}
+```
+
+After the second epoch's advances, the same run sends the inspect-state query from `query.bin`.
+The calculator evaluates `scale=70; (1+sqrt(5))/2`, the golden ratio, and returns it as a report rather than a notice.
+An inspect-state request cannot emit verifiable outputs such as notices or vouchers, because any change its processing makes to the machine state is reverted afterward.
+The client saves the report as `query-report-0.bin`.
+
+The hash operations behind the output proofs are explained later, under [The output hashes tree](#the-output-hashes-tree) in the Blockchain perspective.
+
+The server shell shows only the error messages output by `bc` and `rollup`.
+In production, these error messages should be captured and output as a report, rather than being allowed to leak into the console.
+```{replace=rolling_calc_run/server}
+```
+
+#### Decoding responses
+
+The `cartesi-rollup-data.lua` command-line utility can also decode the binary records produced by the guest application.
+
+For example, to see the value of `sqrt(2)` computed in the second epoch, decode its notice with the command
+```{.bash key=rolling_calc_decode vars=output_3_input_5_bin->rolling_calc_run/output-3-input-5.bin/path replace=source}
+# Link the notice produced by the rolling calculator run into the working directory.
+ln -sf "$output_3_input_5_bin" .
+# docs:begin
+cartesi-rollup-data.lua decode notice < output-3-input-5.bin | \
+    jq -j .payload | \
+    hex --decode | \
+    fold -w 68
+# docs:end
+```
+to produce
+```{replace=rolling_calc_decode}
+```
+This is `sqrt(2)` to 80 decimal places.
+
+The inspect-state report is decoded the same way, with `decode report`
+```{.bash key=rolling_calc_decode_report vars=query_report->rolling_calc_run/query-report-0.bin/path replace=source}
+# Link the inspect-state report produced by the rolling calculator run into the working directory.
+ln -sf "$query_report" .
+# docs:begin
+cartesi-rollup-data.lua decode report < query-report-0.bin | \
+    jq -j .payload | \
+    hex --decode | \
+    fold -w 68
+# docs:end
+```
+to produce
+```{replace=rolling_calc_decode_report}
+```
+This is the golden ratio to 70 decimal places.
+
+Vouchers, exceptions, and delegate-call vouchers are also supported by `cartesi-rollup-data.lua decode`.
+A voucher carries a _destination_, a _value_, and a _payload_.
+Payloads are 0x-prefixed hex.
+
+### Rolling Cartesi Machine templates
+
+A Rolling Cartesi Machine template is a machine that has been configured to support Cartesi Rollups, is running a guest application in a request-processing loop, is ready to process the next request, and has been stored.
+
+A template is the genesis of a Cartesi Rollups application.
+Its state hash is what a freshly deployed application looks like to the blockchain, and the stored template is the artifact distributed to anyone who wants to run the application in their own Cartesi Node.
+
+We store the calculator from the previous section as a template with the command
+```{.bash key=rolling_calc_template outputs=template,rolling-calculator-template vars=calc_ext2->calc_ext2/calc.ext2/path replace=source/template}
+rm -f calc.ext2
+ln -sf "$calc_ext2" .
+rm -rf rolling-calculator-template
+{
+# docs:begin template
+cartesi-machine \
+    --no-init-splash \
+    --assert-rolling-template \
+    --flash-drive=label:calc,data_filename:calc.ext2,user:dapp \
+    --store="rolling-calculator-template" \
+    --final-hash \
+    -- /mnt/calc/calc.sh
+# docs:end template
+} > template 2>&1
+```
+
+The `--assert-rolling-template` option makes `cartesi-machine` exit with a status-code reporting failure if the generated machine is not a Rolling Cartesi Machine template, which helps catch errors.
+The result is as follows
+```{replace=rolling_calc_template/template}
+```
+The machine execution stops when the first call to `rollup finish` yields, and the machine at that state is stored in directory `"rolling-calculator-template"`.
+The `--final-hash` option prints the state hash of the stored machine, the genesis state hash that identifies this application to the blockchain.
+
+:::note
+In production, if the guest application finds an irrecoverable error during initialization, it should abort with an exception.
+In that case, the `cartesi-machine` command-line utility will detect the exception, print it to the console, and exit with a status-code reporting failure.
+:::
+
+To run the application, load the template into a server and feed it the same inputs.
+With the encoded inputs and the stored template in the working directory, run the remote server with the command
+```{.bash key=rolling_calc_template_run vars=rolling_calc_encode,tmpl->rolling_calc_template/rolling-calculator-template/path outputs=server,client,output-0-input-1.bin,output-1-input-3.bin,output-2-input-4.bin,output-3-input-5.bin,output-4-input-6.bin replace=source/server}
+# Link the encoded advance-state requests into the working directory.
+ln -sf "$rolling_calc_encode"/input-?.bin .
+# -n replaces an existing rolling-calculator-template symlink instead of
+# following it and creating the new link inside the stored template directory.
+ln -sfn "$tmpl" rolling-calculator-template
+{
+# docs:begin server
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8083
+# docs:end server
+} > server 2>&1 &
+srv_pid=$!
+{
+# docs:begin client
+while ! cartesi-machine \
+    --remote-address=127.0.0.1:8083 \
+    --remote-health-check 2>/dev/null; do sleep 1; done
+cartesi-machine \
+    --no-init-splash \
+    --remote-address=127.0.0.1:8083 \
+    --remote-shutdown \
+    --cmio-advance-state=input_index_begin:1,input_index_end:7,output_proof:,hashes \
+    --load="rolling-calculator-template"
+# docs:end client
+} > client 2>&1
+client_status=$?
+[ "$client_status" -ne 0 ] && kill "$srv_pid" 2>/dev/null
+wait "$srv_pid"
+```
+From a different shell into the same container, run the client
+```{.bash replace=rolling_calc_template_run/source/client}
+```
+This loads the machine from the stored template and advances all six inputs.
+Abbreviated, the client shell shows
+```{.bash key=rolling_calc_template_run_elided vars=client->rolling_calc_template_run/client/path outputs=elided replace=null}
+{ head -n 16 "$client"; echo ...; tail -n 8 "$client"; } > elided
+```
+```{replace=rolling_calc_template_run_elided/elided}
+```
+The outputs and their hashes are identical to those produced in the previous section, because the template captured exactly the same genesis state.
+
+### Additional options
+
+:::warning
+This is an advanced section, not needed by regular users of the Cartesi platform.
+:::
+
+A guest application can inform the host of its progress by using the Cartesi-specific `/dev/cmio` Linux device.
+Within the guest, the device can be controlled from the shell with the `/usr/bin/yield` utility, pre-installed in the root file-system `rootfs.ext2`.
+The progress feedback is reported with the utility's `automatic progress <permil>` command.
+
+For example, during the execution of the loop,
+```{.bash key=progress replace=source outputs=config-progress.lua}
+cartesi-machine \
+    --no-init-splash \
+# docs:begin null
+    --store-config=config-progress.lua \
+# docs:end null
+    -- $'for i in $(seq 0 5 1000); do yield automatic progress $i; done'
+```
+the `cartesi-machine` utility receives control back from the emulator at every iteration, when the guest executes the `yield` utility.
+(The directory `/usr/bin/`, where `yield` resides, is in the default `PATH`.)
+
+By default, the emulator honors automatic yield requests from the guest.
+Passing `--no-htif-yield-automatic` makes `cartesi-machine` ignore them, but be careful since doing so would _also_ prevent Rolling Cartesi Machines from generating outputs.
+Each time `cartesi-machine` receives control due to a yield, it prints a progress message (shown at 44% below) and resumes the emulator so it can continue working.
+
+```{.text key=truncated_progress_output runner=bash replace=stdout vars=log->progress/both/path}
+# tr replaces carriage returns with line feeds.
+# The first sed command prints every line that is not a progress line.
+# The second sed command prints the 44.00 progress line and then quits,
+# truncating the output at that point.
+tr '\r' '\n' < "$log" | sed -n '/^Progress:/!p; /^Progress:  44\.00$/{p;q;}'
+```
+This feature is most useful when the emulator is controlled programmatically, via its Lua, C++, or JSON-RPC interfaces, where Cartesi Machines typically run disconnected from the console.
+In these situations, the progress device can be used to drive a dynamic user interface element that reassures users progress is being made during long, silent computations.
+Its handling by `cartesi-machine`, which does have access to the console, is simply to help with prototyping and debugging.
+
+The protocols followed by the `yield` utility to interact with the `/dev/cmio` driver and by the driver itself to communicate with the HTIF device are explained in detail under the [guest perspective](#system-architecture).
+In particular, the section explains the _manual_ yield commands needed for proper operation of Cartesi Rollups.
+
+The command-line option `--append-bootargs=<string>` can be used to append any `<string>` to the kernel command-line.
+A detailed description of all kernel command-line parameters is beyond the scope of this document.
+Please refer to the appropriate [section of the kernel documentation](https://www.kernel.org/doc/html/v6.5/admin-guide/kernel-parameters.html).
+
+For example, to prevent clutter in the console, the `cartesi-machine` utility automatically adds the `quiet` option to the kernel command-line, disabling most log messages.
+To override this setting and see more of the log messages output to console, use the `loglevel=<n>` parameter.
+```{.bash key=append_bootargs_loglevel replace=source}
+cartesi-machine \
+    --quiet \
+    --no-init-splash \
+    --append-bootargs="loglevel=8"
+```
+The output is
+```{replace=append_bootargs_loglevel}
+```
+
+To clear the kernel command-line, use the option `--no-bootargs`.
+Notice that, without any kernel command-line options, the machine will not operate properly.
+In particular, as explained under the [Lua interface](#lua-interface), flash-drives use kernel command-line arguments.
+For example, running the `cartesi-machine` command-line utility with no arguments produces a kernel command-line
+equivalent to running the command
+
+```{.bash key=default_bootargs replace=null}
+cartesi-machine \
+    --no-init-splash \
+    --max-mcycle=0 \
+    --store-config=format:json | \
+        jq -r '.dtb.bootargs'
+```
+```{.bash key=no_bootargs_equiv replace=source vars=bootargs->default_bootargs/stdout}
+cartesi-machine \
+    --no-init-splash \
+    --no-bootargs \
+    --append-bootargs="$bootargs"
+```
+
+The command-line option `--periodic-hashes=<period>[,start:<mcycle>]` causes the command-line utility to periodically obtain and print the state hash.
+The `<period>` argument gives the distance between hashes in cycles. The optional `start:<mcycle>` sub-key gives the starting cycle for the periodic hashes. (Both `--initial-hash` and `--final-hash` are implied by this option.)
+
+For example, to see the last 10 state hashes from the calculator machine computation, run the command
+
+```{.bash key=periodic_initial_cycle vars=log->output_raw_proof/both/path replace=null}
+cycles=$(cat $log | $RECIPES_DIR/last-cycles.sh)
+printf '%d\n' "$((cycles - 10))"
+```
+```{.bash key=rarely_periodic_hashes vars=initial_cycle->periodic_initial_cycle/stdout,template->calc_template/calculator-template/path replace=source}
+rm -f input.raw
+ln -sf "$template" .
+# docs:begin
+echo "6*2^1024 + 3*2^512" > input.raw
+truncate -s 4K input.raw
+cartesi-machine \
+    --no-init-splash \
+    --load="calculator-template" \
+    --replace-memory-range="label:input,data_filename:input.raw" \
+    --periodic-hashes=1,start:$initial_cycle
+# docs:end
+```
+The output is
+
+```{replace=rarely_periodic_hashes}
+```
+
+The command-line option `--dump-memory-ranges[=<dir>]` causes the emulator to dump the contents of all memory ranges in the address space to files under `<dir>`.
+If `<dir>` is omitted, files are written to the current working directory.
+Each memory range produces a file `<start>--<length>.bin`.
+Every other byte in the address space has value 0.
+This is useful to inspect the entire state of the machine from outside the emulator.
+
+The command-line options `--store-config` and `--load-config` store or load a Lua file with information that can be used to initialize the exact same Cartesi Machine that the `cartesi-machine` command-line utility will use.
+The format of these configuration files is explained in detail under the [Lua interface](#lua-interface) to Cartesi Machines.
+In particular, the `--store-config` option, without arguments, dumps to screen all the options used to define the Cartesi Machine.
+This information can be very useful when debugging problems.
+Both options accept a `format:<lua|json>` sub-key to select between Lua and JSON. When `format:` is omitted, the format is inferred from the filename extension (`.json` or `.lua`), defaulting to Lua.
+
+The remaining options in the command-line utility `cartesi-machine` are mostly useful for low-level tests and debugging.
+As such, they require some context.
+
+During verification, the blockchain mediates a *verification game* between the disputing parties.
+This process is explained in detail under the [blockchain perspective](#verification-game).
+In a nutshell, both parties started from a Cartesi Machine that has a known and agreed upon initial state hash.
+(E.g., an agreed upon template that was instantiated with an agreed upon input drive, or an agreed upon rolling template
+with an agreed upon advance-state input box.)
+At the end of the computation, these parties now disagree on the final state hash.
+(E.g., the state hash for the halted machine, or the state hash of the yielded machine after a number of advance-state inputs have been processed.)
+The state hash evolves as the machine executes steps in its fetch-execute loop.
+The first stage of the verification game therefore searches for the *step of disagreement*: the particular main processor cycle such that the parties agree on the state hash before the step, but disagree on the state hash after the step.
+When the uarch is in use, every main processor instruction can also be implemented by a sequence of micro-instructions in the uarch interpreter, and a single uarch step is one of those micro-instructions.
+So the search is refined to find the *uarch step of disagreement*: the particular uarch cycle such that the parties agree on the state hash before the uarch step, but disagree on the state hash after the uarch step.
+Once this uarch step of disagreement is identified, one of the parties sends to the blockchain a log of state accesses that happen along the uarch step, including Merkle-tree proofs for every value read from or written to the state.
+This log proves to the blockchain that the execution of the uarch step transitions the state in such a way that it reaches the state hash claimed by the submitting party.
+
+```{.bash key=cycles_uarch_putchar_ecall vars=config->nothing_to_do/config-nothing-to-do.lua/path,cycles->cycles_htif_putchar replace=null}
+ln -sf "$config" .
+lua5.4 $RECIPES_DIR/find-uarch-putchar-ecall.lua $cycles > /dev/null
+```
+
+Consider again the example in which the Cartesi Machine was stopped while it drew the splash screen.
+Let's assume that this is the step of disagreement.
+In an honest Cartesi Machine, the main processor instruction about to execute when `mcycle` is []{replace=cycles_htif_putchar/stderr} is the `sd` that issues a putchar command to the HTIF console device by writing it to the `htif.tohost` CSR.
+That single main processor instruction expands into many uarch instructions.
+The one that actually triggers the host to emit a character is an `ecall` with `a7 = UARCH_ECALL_FN_PUTCHAR` and `a0 = 0x0a`.
+This happens when `uarch_cycle` is []{replace=cycles_uarch_putchar_ecall/stderr}.
+
+In the following command, the `--max-mcycle` and `--max-uarch-cycle` options tell `cartesi-machine` to stop just before the putchar `ecall`.
+The `--log-step-uarch` command-line option instructs `cartesi-machine` to then dump to screen a user-friendly version of the access log produced by a single uarch step:
+```{.bash key=rarely_log_uarch_putchar replace=source vars=cycles->cycles_htif_putchar,ucycles->cycles_uarch_putchar_ecall/stderr}
+cartesi-machine \
+    --max-mcycle=$cycles \
+    --max-uarch-cycle=$ucycles \
+    --log-step-uarch
+```
+producing the log
+```{replace=rarely_log_uarch_putchar/stderr}
+```
+Understanding these logs in detail is unnecessary for all but the most low-level internal development at Cartesi.
+It requires deep knowledge of not only RISC-V architecture, but also how Cartesi's uarch interpreter implements the main processor fetch-execute loop.
+The material is therefore beyond the scope of this document.
+
+This particular example, however, was hand-picked for illustration purposes.
+The uarch instruction logged is the `ecall` that asks the host to emit one character.
+At this point, register `a7` (i.e., `uarch_x17`) holds the value `2` (`UARCH_ECALL_FN_PUTCHAR`) and register `a0` (i.e., `uarch_x10`) holds the character `0x0a` (a line-feed).
+When the host processes this `ecall`, it emits the line-feed to the console, completing the row `       \    / CARTESI` in the splash screen.
+
+```{.bash key=cmio_rx_buffer_range replace=null}
+lua5.4 -e 'local c = require "cartesi"; io.write(string.format("start:0x%x,length:2<<%d", c.AR_CMIO_RX_BUFFER_START, c.AR_CMIO_RX_BUFFER_LOG2_SIZE - 1))'
+```
+```{.bash key=cmio_tx_buffer_range replace=null}
+lua5.4 -e 'local c = require "cartesi"; io.write(string.format("start:0x%x,length:2<<%d", c.AR_CMIO_TX_BUFFER_START, c.AR_CMIO_TX_BUFFER_LOG2_SIZE - 1))'
+```
+The command-line options `--cmio-rx-buffer=<key>:<value>...` and `--cmio-tx-buffer=<key>:<value>...` configure backing-store options for the two memory ranges used by the `/dev/cmio` device.
+The RX buffer occupies []{replace=cmio_rx_buffer_range} and the TX buffer occupies []{replace=cmio_tx_buffer_range}.
+Although their addresses and lengths are fixed and cannot be overridden, their backing storage can be configured.
+See the [guest perspective](#system-architecture) for details on how these buffers are used by Cartesi Rollups, and the section on [Rolling Cartesi Machines](#rolling-cartesi-machines) for the request/response data flow.
+
+Automatic and manual yields are enabled by default.
+Disable them with `--no-htif-yield-automatic` or `--no-htif-yield-manual` (note that disabling automatic yield prevents Rolling Cartesi Machines from generating outputs).
+
+## Lua interface
+
+:::caution
+This entire chapter is for advanced users only, since typical users of the Cartesi platform will likely never need to programmatically control a Cartesi Machine.
+:::
+
+The Lua interface to Cartesi Machines is available from the `cartesi` Lua module.
+In a properly set up installation (such as what is available in the playground Docker image), the module can be loaded with the `require` function
+```lua
+-- Load the Cartesi module
+local cartesi = require"cartesi"
+```
+
+A Cartesi Machine instance is defined by its *organization* and the *contents* of its state.
+The organization specifies a variety of memory ranges (such as RAM, flash drives, NVRAMs, the DTB, and CMIO buffers).
+To support Cartesi Machine's transparency, all these memory ranges are mapped into the machine's 64-bit physical memory address space.
+The layout defines each entry's start and length in the address space.
+The DTB and the CMIO buffers have fixed layouts.
+RAM has a fixed start, but its length is user-configurable.
+For flash drives and NVRAMs, the user chooses the start and length of each entry.
+The contents of the state include the values stored in all these memory ranges, in addition to the values of all processor registers and device-specific state.
+
+### Instantiation by configuration
+
+Cartesi Machines can be instantiated directly from a configuration structure.
+
+<a name="machine_config"></a>
+
+```lua
+machine_config ::= {
+    processor ::= processor_config,
+
+    ram ::= {
+        backing_store ::= backing_store_config,
+        length ::= number
+    },
+
+    dtb ::= {
+        backing_store ::= backing_store_config,
+        bootargs ::= string,
+        init ::= string,
+        entrypoint ::= string
+    },
+
+    flash_drive ::= {
+        [1] ::= memory_range_config, -- flash drive 0
+        [2] ::= memory_range_config, -- flash drive 1
+        ...
+        [n] ::= memory_range_config
+    },
+
+    nvram ::= {
+        [1] ::= memory_range_config, -- nvram 0
+        [2] ::= memory_range_config, -- nvram 1
+        ...
+        [n] ::= memory_range_config
+    },
+
+    cmio ::= {
+        rx_buffer ::= {
+            backing_store ::= backing_store_config
+        },
+        tx_buffer ::= {
+            backing_store ::= backing_store_config
+        }
+    },
+
+    uarch ::= {
+        processor ::= uarch_processor_config,
+
+        ram ::= {
+            backing_store ::= backing_store_config
+        }
+    },
+
+    pmas ::= {
+        backing_store ::= backing_store_config,
+    },
+
+    hash_tree ::= hash_tree_config,
+
+    virtio ::= virtio_config
+}
+```
+
+<a name="backing_store_config"></a>
+
+```lua
+backing_store_config ::= {
+    data_filename ::= string,
+    shared ::= boolean,
+    create ::= boolean,
+    truncate ::= boolean,
+    dht_filename ::= string,
+    dpt_filename ::= string
+}
+```
+
+<a name="memory_range_config"></a>
+
+```lua
+memory_range_config ::= {
+    backing_store ::= backing_store_config,
+    start ::= number,
+    length ::= number,
+    label ::= string,
+    read_only ::= boolean
+}
+```
+
+<a name="processor_config"></a>
+
+```lua
+processor_config ::= {
+    backing_store ::= backing_store_config,
+
+    registers ::= {
+        x0 ::= number, -- always 0
+        x1 ::= number,
+        ...
+        x31 ::= number,
+        f0 ::= number,
+        ...
+        f31 ::= number,
+        fcsr ::= number,
+        pc ::= number,
+        mvendorid ::= number,
+        marchid ::= number,
+        mimpid ::= number,
+        mcycle ::= number,
+        misa ::= number,
+        mstatus ::= number,
+        mtvec ::= number,
+        mscratch ::= number,
+        mepc ::= number,
+        mcause ::= number,
+        mtval ::= number,
+        mie ::= number,
+        mip ::= number,
+        medeleg ::= number,
+        mideleg ::= number,
+        mcounteren ::= number,
+        menvcfg ::= number,
+        stvec ::= number,
+        sscratch ::= number,
+        sepc ::= number,
+        scause ::= number,
+        stval ::= number,
+        satp ::= number,
+        scounteren ::= number,
+        senvcfg ::= number,
+        icycleinstret ::= number,
+        iflags ::= {
+            H ::= number,
+            X ::= number,
+            Y ::= number
+        },
+        ilrsc ::= number,
+        iprv ::= number,
+        iunrep ::= number,
+        htif ::= {
+            tohost ::= number,
+            fromhost ::= number,
+            ihalt ::= number,
+            iconsole ::= number,
+            iyield ::= number
+        },
+        clint ::= {
+           mtimecmp ::= number
+        },
+        plic ::= {
+            girqpend ::= number,
+            girqsrvd ::= number
+        }
+    },
+}
+```
+
+<a name="uarch_processor_config"></a>
+
+```lua
+uarch_processor_config ::= {
+    backing_store ::= backing_store_config,
+    registers ::= {
+        halt_flag ::= number,
+        cycle ::= number,
+        pc ::= number,
+        x0 ::= number, -- always 0
+        x1 ::= number,
+        ...
+        x31 ::= number,
+    }
+}
+```
+
+<a name="hash_tree_config"></a>
+
+```lua
+hash_tree_config ::= {
+    shared ::= boolean,
+    create ::= boolean,
+    sht_filename ::= string,
+    phtc_filename ::= string,
+    phtc_size ::= number,
+    hash_function ::= string
+}
+```
+
+Every memory range in a Cartesi Machine has a corresponding <a href="#backing_store_config">`backing_store`</a> entry.
+This is the basis for the implementation of persistent Cartesi Machines.
+Field `backing_store.data_filename` gives the filename of an image on disk in the host with the initial contents for that memory range.
+Since the image is mapped, its size on disk must exactly match the length of the memory range.
+When `backing_store.shared` is set to `true` (default is `false`), changes made by the guest to the memory range pass through to modify the host image file.
+Otherwise, changes are kept private to the guest.
+When `backing_store.create` is set to `true` (default is `false`), the emulator creates the file at `data_filename` at instantiation, zero-initialized to the entry's `length`.
+In that case, `shared` must also be set to `true` (after all, the emulator is modifying the image file in the host).
+When `backing_store.truncate` is set to `true` (default is `false`), the emulator resizes an existing file at `data_filename` to match the memory range's length before mapping it, padding with zeros if the file is smaller than the corresponding memory range.
+Once again, in that case, `shared` must be set to `true`.
+Fields `backing_store.dht_filename` (for _dense hash-tree_) and `backing_store.dpt_filename` (for _dirty-page tree_) support the efficient computation of state hashes and proofs.
+When instantiating a machine from scratch, these are normally left empty.
+In fact, for many of the entries in the `machine_config`, the `backing_store` field is populated and consumed automatically by the emulator when storing and loading persistent machines.
+I.e., when using `cartesi-machine` command-line options `--load=<directory>` and `--store=<directory>`, or when using the Lua API methods `machine:store(<directory>)` and `machine:load(<directory>)` on which they are based.
+The multiple instances of field `backing_store` will not be described individually.
+
+The `ram` entry in `machine_config` describes the main processor RAM.
+Field `length` gives the amount of RAM in bytes (RAM always starts at offset []{replace=ar_ram_start}).
+This length should be a multiple of 4Ki, the length of a RISC-V memory page.
+The `backing_store.data_filename` holds the filename of an image that will be loaded at the start of RAM.
+This is where the RAM image `linux.bin` generated by the [`machine-linux-image`](https://github.com/cartesi/machine-linux-image) repository is typically loaded.
+
+The `flash_drive` entry in `machine_config` is a list of <a href="#memory_range_config">`memory_range_config`</a> structures.
+The same is true of the `nvram` entry.
+In each `memory_range_config`, fields `start` and `length` give the start and length of the memory range in the machine's address space.
+Once again, the length must be a multiple of 4Ki.
+The `start` of a drive must be aligned to its `length` rounded up to the next power of 2.
+No memory range in a Cartesi Machine can overlap with any other, considering their rounded-up lengths.
+If `length` is omitted, it defaults to the size of the backing image on disk.
+If `start` is omitted, the memory range is automatically placed to respect the alignment and overlap restrictions.
+The first flash drive is placed past RAM, then each remaining flash drive is placed past the previous.
+The first NVRAM is placed past the last flash drive, and then each remaining NVRAM is placed past the previous.
+Field `label` is a string used by the emulator to expose the entry to the guest via DTB aliases.
+Each flash drive is exposed to the guest as a `/dev/pmem*` device, and each NVRAM as a `/dev/uio*` device.
+Field `read_only` is a Boolean (defaults to `false`) that makes the corresponding memory range read-only from the point
+of view of the guest.
+The `backing_store.data_filename` holds the filename of an image that will be loaded into the corresponding memory range.
+
+The `dtb` entry in `machine_config` describes the memory range that holds the device tree for the emulator.
+Field `entrypoint` is the user-mode command that `cartesi-init` runs after setup, by default as user `dapp`.
+This is what the `cartesi-machine` command-line utility appends to when arguments are passed after `--`.
+Field `init` is a shell snippet appended to the initialization phase, executed as `root` before the entrypoint.
+This is where the `cartesi-machine` command-line utility appends instructions to change ownership and permissions of flash-drives and NVRAMs, to mount flash-drives at `/mnt/<label>`, and other important initializations of the guest Linux environment.
+Field `bootargs` is the kernel command-line string passed to Linux at boot.
+When `dtb.backing_store.data_filename` is empty, the emulator generates the DTB image at instantiation from the rest of the configuration.
+
+The `cmio` entry in `machine_config` configures the two CMIO buffers used to send data in and out of the machine.
+Fields `rx_buffer` and `tx_buffer` each contain only a `backing_store` configuration.
+For example, the input to an advance-state request and the query to an inspect-state request are written to the `rx_buffer` memory range.
+Conversely, vouchers, notices, reports, and exceptions are written to the `tx_buffer` memory range.
+For more details on how exactly these memory ranges are used, please read the [architecture section](#system-architecture) under the guest perspective.
+
+The <a href="#processor_config">`processor`</a> entry in `machine_config` describes the main processor state.
+Field `registers` is a flat table of all general-purpose, floating-point, and control-and-status registers, plus the nested sub-tables `iflags`, `htif`, `clint`, and `plic`.
+Each register field is a number that sets its value.
+Most users only need to set `mvendorid`, `mimpid`, and `marchid`, which the emulator checks at instantiation to ensure the configuration matches the running emulator version.
+During prototyping, these can be set to `-1` to make the emulator accept any value.
+In production code, they should be hard-coded.
+Most CSRs are defined in volumes [1 and 2](https://riscv.org/technical/specifications/) of the ISA specification.
+The Cartesi-specific registers (`iprv`, `iunrep`, `iflags`, the HTIF and CMIO interfaces) are described under the [architecture section](#system-architecture) from the guest perspective.
+The `processor.registers.htif` sub-table holds the initial values of HTIF state.
+Field `iconsole` is a bitmask declaring whether the emulator honors console-putchar and console-getchar commands.
+Defaults to putchar-only.
+The `cartesi-machine` command-line option `-i`/`--htif-console-getchar` enables getchar.
+Field `iyield` is a bitmask declaring whether the emulator honors automatic and manual yield commands.
+Defaults to both enabled.
+The `cartesi-machine` command-line options `--no-htif-yield-automatic` and `--no-htif-yield-manual` clear the corresponding bits.
+
+The `uarch` entry describes the microarchitecture state.
+The `uarch.processor` field controls the uarch processor.
+Like the main processor, it includes a `uarch.processor.registers` flat table with all registers.
+Register `uarch.processor.registers.halt_flag` is non-zero when the uarch is halted.
+The `uarch.ram` field controls the uarch RAM.
+Unlike the main processor RAM, the uarch RAM is fixed in length.
+Moreover, the `uarch.ram.backing_store.data_filename` is typically left blank (other than in unit tests), as the emulator automatically fills the uarch RAM with an implementation of the main processor fetch-execute loop compiled to function within the uarch.
+
+The `pmas` entry describes the memory range containing one PMA (for _physical memory attributes_) entry for each address range that is visible to the main processor.
+This is automatically filled by the emulator during initialization.
+PMAs are described in the [PMAs subsection](#pmas) of the system architecture chapter.
+
+The `hash_tree` entry configures the global hash-tree structure that supports efficient computation of state hashes and proofs.
+Field `hash_tree.hash_function` controls the hash function used in the hash tree.
+It defaults to `"keccak256"`, which is suitable for use with the uarch.
+Set it to `"sha256"` for use with the ZK prover instead.
+These options are mutually exclusive: a machine that was initialized for use with the uarch can never be used with the ZK prover (and vice-versa).
+Fields `hash_tree.phtc_size` and `hash_tree.phtc_filename` control the _page hash-tree cache_.
+This is a cache that contains the entire dense hash tree for the most recently used pages in the address space.
+Field `hash_tree.phtc_size` gives the number of entries, and `hash_tree.phtc_filename` gives the filename for the backing image in the host.
+Field `hash_tree.sht_filename` gives the filename for the backing image of the global _sparse hash tree_ that combines the dense hash trees of the different memory ranges.
+
+Finally, the `virtio` entry is a list of configurations for VirtIO devices that can be used when the machine is used in non-reproducible mode during development.
+
+### Default configuration
+
+The `cartesi.machine:get_default_config()` method can be used to obtain the default Cartesi Machine configuration:
+```{.lua key=dump_default_config_lua include=dump-default-config.lua title="dump-default-config.lua"}
+```
+
+This produces:
+```{.lua key=config_default runner=bash depends=dump_default_config_lua outputs=config-default.lua replace=both}
+lua5.4 $RECIPES_DIR/dump-default-config.lua | tee config-default.lua
+```
+
+As it is, the default configuration is not functional.
+At a minimum, it is missing the RAM length, the image to be loaded into RAM, and a flash drive with the root file-system.
+
+The `dtb.bootargs` field carries the default kernel command line.
+The individual parameters have the following meaning:
+
+- []{replace=dtb_bootargs_console_part} silences the printing of kernel initialization messages, enables the SBI-based early console, used before the main console is up, and sets the main console to the hypervisor console virtual device;
+- []{replace=dtb_bootargs_uio_part} instructs the UIO platform driver to bind to nodes with the `generic-uio` compatible string, used by NVRAM ranges;
+- []{replace=dtb_bootargs_root_part} sets the first flash drive (exposed by the kernel as a persistent-memory block device) as the root file-system and instructs the kernel to mount the root file-system read-write;
+- []{replace=dtb_bootargs_init_part} runs the Cartesi-provided init script, which ends up reading the property `/cartesi-machine/entrypoint` from the device tree (with the contents of `dtb.entrypoint`) and running it as user `dapp`.
+
+### Generating configurations
+
+The `cartesi-machine` command-line utility can be used to output complete Cartesi Machine configurations.
+Recall from an [earlier example](#initialization) that the `cartesi-machine` command
+```{.bash replace=ls_bin/source}
+```
+builds a Cartesi Machine that, when run, lists the contents of the `/bin/` directory before gracefully halting.
+The kernel `linux.bin` and root file-system `rootfs.ext2` come from the defaults under `/usr/share/cartesi-machine/images/`.
+
+The command-line option `--store-config[=<filename>]` makes the utility capture the initial machine configuration.
+Without an argument, the configuration is printed to standard output.
+With `=<filename>`, it is written to that file (and `--load-config=<filename>` reloads it later).
+
+Adding `--store-config` to the example above, we obtain the complete contents of the corresponding `machine_config`, including default values conveniently marked as such by the `cartesi-machine` utility.
+Editing them out and storing into a file, we would get:
+```{.lua runner=bash key=config_ls_bin replace=stdout vars=config->ls_bin/config-ls-bin.lua/path title="config-ls-bin.lua"}
+lua5.4 $RECIPES_DIR/minimal-config.lua $config
+```
+
+Flash drives are exposed by the kernel as `/dev/pmem<i>` devices.
+NVRAMs are exposed as `/dev/uio<i>` devices.
+The emulator publishes each drive's `label` field inside the device-tree node `/aliases`.
+
+When the user passes arguments after `--` on the `cartesi-machine` command line, the utility appends them to `dtb.entrypoint`.
+The emulator then publishes this in the device-tree property `entrypoint` of the `/cartesi-machine` node.
+
+The command-line utility can also run Cartesi Machines with additional flash drives.
+Adding `--store-config` to the [earlier example](#flash-drives) that loaded `foo.ext2` as a flash drive
+```{.bash replace=cat_foo_bar/source}
+```
+captures a configuration whose essential, edited-down form is
+```{.lua runner=bash key=config_cat_foo_bar vars=config->cat_foo_bar/config-cat-foo-bar.lua/path replace=stdout title="config-cat-foo-bar.lua"}
+lua5.4 $RECIPES_DIR/minimal-config.lua $config
+```
+
+The new flash drive with label `foo` is added by the `cartesi-machine` command-line utility right after `root`.
+The utility also adds a small snippet to `dtb.init` that mounts the drive at `/mnt/foo`.
+The emulator adds the contents of `dtb.init` to the device-tree as property `init` of node `/cartesi-machine`, and the Cartesi-provided init script sources it as user `root` before executing the entrypoint.
+As a result, the file-system carried by `foo.ext2` on the host is mounted at `/mnt/foo` in the guest.
+That is where the entrypoint `cat /mnt/foo/bar.txt` finds the file to dump to the console.
+
+### Additional sample configurations
+
+Here are the (simplified) configurations for the other examples from the documentation of the `cartesi-machine` command-line utility.
+
+A Cartesi Machine that has nothing to do.
+This is the [introductory example](#command-line-interface), and its configuration, edited down to its essentials, is
+```{.lua runner=bash key=config_nothing_to_do vars=config->nothing_to_do/config-nothing-to-do.lua/path replace=stdout title="config-nothing-to-do.lua"}
+lua5.4 $RECIPES_DIR/minimal-config.lua $config
+```
+The `dtb.init` field carries the ASCII-art splash that the `cartesi-machine` utility appends to its setup phase by default.
+This is what produces the Cartesi logo printed before each entrypoint runs.
+
+A Cartesi Machine that periodically reports its progress using the HTIF Yield device:
+```{.lua runner=bash key=config_progress replace=stdout vars=config->progress/config-progress.lua/path title="config-progress.lua"}
+lua5.4 $RECIPES_DIR/minimal-config.lua $config
+```
+
+A Cartesi Machine that computes the value of a generic mathematical expression:
+```{.lua runner=bash key=config_calculator vars=config->calc_run/config-calculator.lua/path replace=stdout title="config-calculator.lua"}
+lua5.4 $RECIPES_DIR/minimal-config.lua $config
+```
+
+Note the two NVRAMs, one for the input and one for the output, and how the `cartesi-machine` utility adds a snippet to `dtb.init` that changes permissions and ownership of the corresponding devices.
+
+### Loading and running machines
+
+To create a new handle for a machine, use the `cartesi.new()` function.
+The returned `machine` handle can hold a single machine instance, and starts empty.
+To instantiate a Cartesi Machine from a machine configuration (e.g., the configurations produced by the `cartesi-machine` utility above), use the `machine:create(<machine_config>)` method.
+Alternatively, the shortcut `cartesi.machine(<machine_config>)` combines the effects of `cartesi.new()` and `machine:create(<machine_config>)` into a single call.
+
+For example, the script
+```{.lua key=run_config include=run-config.lua title="run-config.lua"}
+```
+loads a machine configuration from the Lua module specified on the command line (using `require(arg[1])`).
+It then creates an instance by calling the `cartesi.machine(<machine_config>)` constructor, which it stores in the
+`machine` local variable.
+
+The `machine:run(<max_mcycle>)` method of the Cartesi Machine instance runs the corresponding machine until the register `mcycle` reaches at most `<max_mcycle>`.
+The value `math.maxinteger` of `<max_mcycle>` used in the script is a very large integer, providing the machine with enough cycles to run until it halts or yields manually.
+Note that the `machine:run()` method can return prematurely for a variety of reasons (see below), so it should always be called inside a loop.
+It returns a break reason explaining why control was returned to the caller, taken from the `cartesi.BREAK_REASON_*` set.
+The script's loop terminates when the break reason is `BREAK_REASON_HALTED` or `BREAK_REASON_YIELDED_MANUALLY`, the two reasons that signal the machine has reached a state past which it cannot continue on its own.
+
+At any point, the `machine:get_initial_config()` method can be used to obtain the configuration that was used to create a Cartesi Machine instance.
+
+<a name="run-cat-foo-bar"></a>
+
+For example, to run the configuration stored in `./config-cat-foo-bar.lua` (assuming `./foo.ext2` is available) simply run
+
+```{.bash key=run_config_cat_foo_bar replace=source vars=foo_ext2->foo_ext2/foo.ext2/path,config->cat_foo_bar/config-cat-foo-bar.lua/path depends=run_config}
+ln -sf "$foo_ext2" .
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/run-config.lua" .
+# docs:begin
+lua5.4 run-config.lua config-cat-foo-bar
+# docs:end
+```
+```{.text replace=run_config_cat_foo_bar}
+```
+
+(The function call `require(arg[1])` translates the argument `"config-cat-foo-bar"` to `"config-cat-foo-bar.lua"` and loads that file.)
+
+### Instantiation from persistent state
+
+At any point in their execution, Cartesi Machines can be stored to disk.
+A stored machine can later be loaded to continue its execution from where it left off.
+
+:::note
+If the machine initialization involved large image files or a considerable amount of RAM, this operation may consume significant disk space.
+It will also take as long as is needed to copy the image files into the directory.
+:::
+
+To store a machine at its current state, use the `machine:store(<directory>)` method of the Cartesi Machine instance.
+The function call fails when the directory already exists, so existing persistent Cartesi Machines are not inadvertently overwritten:
+```{.lua key=store_cat_foo_bar include=store-cat-foo-bar.lua title="store-cat-foo-bar.lua"}
+```
+
+```{.bash key=run_store_cat_foo_bar outputs=cat-foo-bar replace=null vars=foo_ext2->foo_ext2/foo.ext2/path,config->cat_foo_bar/config-cat-foo-bar.lua/path depends=store_cat_foo_bar}
+ln -sf "$foo_ext2" .
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/store-cat-foo-bar.lua" .
+rm -rf cat-foo-bar
+lua5.4 store-cat-foo-bar.lua
+```
+
+After the execution of the script above, the directory `./cat-foo-bar/` contains all the information needed to instantiate the same machine, including copies of all necessary image files.
+There are no external dependencies.
+
+To load a machine from disk, use the `machine:load(<directory>)` method on an empty `machine` handle.
+Alternatively, the shortcut `machine = cartesi.machine(<directory>)` combines the effects of `machine = cartesi.new()` and `machine:load(<directory>)` into a single call.
+In fact, running the following script
+```{.lua key=load_cat_foo_bar include=load-cat-foo-bar.lua title="load-cat-foo-bar.lua"}
+```
+has exactly the same effect as the example [above](#run-cat-foo-bar), where the machine was instantiated from the configuration and directly run until it halted:
+
+```{.text key=run_load_cat_foo_bar runner=bash replace=both vars=template->run_store_cat_foo_bar/cat-foo-bar/path depends=load_cat_foo_bar}
+ln -sf "$RECIPES_DIR/load-cat-foo-bar.lua" .
+ln -sf "$template" .
+lua5.4 load-cat-foo-bar.lua
+```
+
+As before, the configuration that was used to instantiate a Cartesi Machine can be obtained from the machine instance with the method `machine:get_initial_config()`.
+Note that this is *not* the configuration that was used to instantiate the machine for the first time, but rather the configuration used to instantiate a copy of the machine that was stored.
+More specifically, any `backing_store.data_filename` fields point to copies that reside inside the storage `<directory>`.
+Likewise, the values of all registers will reflect the values as they were when stored.
+As for the contents of the initial backing files, they may have been modified by the running instance before a copy was
+saved into `<directory>`.
+
+### Limiting execution
+
+The host cannot predict how many cycles the emulator will need until a call to `machine:run(math.maxinteger)` returns.
+One of the uses for the `<max_mcycle>` argument in production code is to ensure the call returns at a desired frequency, rather than potentially blocking the caller indefinitely.
+
+The following script illustrates the process
+```{.lua key=run_config_in_chunks include=run-config-in-chunks.lua title="run-config-in-chunks.lua"}
+```
+
+Each iteration runs the machine for at most an additional `CHUNK` cycles.
+Reading the `mcycle` register with `machine:read_reg("mcycle")` returns the current cycle count, which is used to set the new limit to `mcycle+CHUNK`.
+After the call to `machine:run()` returns, the application is free to perform other tasks.
+The loop exits when the returned break reason is `BREAK_REASON_HALTED` or `BREAK_REASON_YIELDED_MANUALLY`. Any other reason (such as `BREAK_REASON_REACHED_TARGET_MCYCLE`, signalling the chunk expired) just continues the loop.
+
+```{.bash key=run_config_cat_foo_bar_in_chunks replace=source vars=foo_ext2->foo_ext2/foo.ext2/path,config->cat_foo_bar/config-cat-foo-bar.lua/path depends=run_config_in_chunks}
+ln -sf "$foo_ext2" .
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/run-config-in-chunks.lua" .
+# docs:begin
+lua5.4 run-config-in-chunks.lua config-cat-foo-bar
+# docs:end
+```
+```{.text replace=run_config_cat_foo_bar_in_chunks}
+```
+
+### Progress feedback
+
+When the computation running inside a Cartesi Machine is intensive, it may be desirable to inform users of the progress, so they can plan accordingly.
+On its own, the current value of `mcycle` does not give any information concerning how much of the computation still remains.
+What is needed is the value of `mcycle` when the machine halts.
+This is, unfortunately, difficult to estimate from the outside.
+The guest application is in a much better position to estimate its own progress.
+However, it needs a mechanism to communicate its progress back to the program controlling the emulator.
+
+The command-line utility `/usr/bin/yield` can be used for this purpose.
+Internally, the tool uses an `ioctl` system-call on the Cartesi-specific `/dev/cmio` device.
+The protocols followed by the `/usr/bin/yield` utility to interact with the `/dev/cmio` driver, and by the driver itself to communicate with the HTIF Yield device, are explained in detail under the [guest perspective](#system-architecture).
+The focus here is on its effect on the host program controlling the emulator.
+
+By default, a Cartesi Machine is configured via `processor.registers.htif.iyield` to accept HTIF yield automatic commands.
+The field is a bitmask of enabled commands.
+Setting the `cartesi.HTIF_YIELD_CMD_AUTOMATIC_MASK` bit accepts yield automatic, and setting `cartesi.HTIF_YIELD_CMD_MANUAL_MASK` accepts yield manual.
+The default machine configuration sets both bits.
+When automatic yields are accepted, a yield automatic command causes the emulator to return prematurely from `machine:run(<max_mcycle>)` with break reason `BREAK_REASON_YIELDED_AUTOMATICALLY`.
+When the bit is clear, the command is silently ignored and execution continues until the machine halts or `mcycle` hits `<max_mcycle>`.
+
+The following example illustrates how Lua scripts can receive progress information throughout a computation performed inside a Cartesi Machine:
+```{.lua key=run_config_in_chunks_with_progress include=run-config-in-chunks-with-progress.lua title="run-config-in-chunks-with-progress.lua"}
+```
+The loop repeats until the break reason returned by `machine:run()` is `BREAK_REASON_HALTED` or `BREAK_REASON_YIELDED_MANUALLY`.
+As before, the computation is performed in chunks.
+At each iteration, the script tries to advance the computation until the end of the next chunk.
+A `BREAK_REASON_YIELDED_AUTOMATICALLY` return means the guest ran a yield automatic command.
+That command can be called for different reasons.
+The reason and the associated data are available in the `htif_tohost_reason` and `htif_tohost_data` registers, which expose pre-decoded fields of the HTIF `tohost` register.
+The constant `cartesi.HTIF_YIELD_AUTOMATIC_REASON_PROGRESS` corresponds to a progress report, in which case `htif_tohost_data` holds the progress in per-mille.
+A `BREAK_REASON_REACHED_TARGET_MCYCLE` return means the chunk expired without a yield or halt.
+In that case the script bumps `max_mcycle` by another `CHUNK` and could perform any desired &ldquo;per-chunk&rdquo; tasks before looping.
+
+For example, running the script with the command-line
+```{.bash key=lua_progress replace=source depends=run_config_in_chunks_with_progress vars=config->progress/config-progress.lua/path}
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/run-config-in-chunks-with-progress.lua" .
+# docs:begin
+lua5.4 run-config-in-chunks-with-progress.lua config-progress
+# docs:end
+```
+produces the output (shown at 44% completion) below
+```{.text key=truncated_lua_progress_output runner=bash replace=stdout vars=log->lua_progress/both/path}
+# tr replaces carriage returns with line feeds
+# first sed command passes through anything not a progress line.
+# second sed command finds 44.00 and immediately aborts
+tr '\r' '\n' < $log | sed -n '/^Progress:/!p; /^Progress:  44\.00$/{p;q;}'
+```
+
+This is similar to the `cartesi-machine` command-line
+```{.bash replace=progress/source}
+```
+which uses an equivalent mechanism for progress reports.
+
+### Cartesi Machine templates
+
+Recall that, to instantiate a [Cartesi Machine template](#cartesi-machine-templates), we first replace its NVRAM place-holders with their actual content.
+After that, we can run the resulting machine.
+We saved the simple calculator template into directory `"calculator-template"` by running the `cartesi-machine` utility with `--store="calculator-template"`, [as shown earlier](#cartesi-machine-templates).
+There, we also instantiated and ran the template with `cartesi-machine`'s `--replace-memory-range` command-line option.
+Internally, the utility uses the `machine:replace_memory_range(<memory_range_config>)` method of the Cartesi Machine instance to replace an existing memory range.
+The replacement target is identified by the `memory_range_config`'s `start` and `length` fields, which must match those of an existing memory range in the Cartesi Machine instance.
+If the memory range is a flash drive or an NVRAM, the `label` field can be used to identify it instead.
+The following code snippet shows how to instantiate a Cartesi Machine template using the Lua API:
+```{.lua key=run_calculator_with_new_drives include=run-calculator-with-new-drives.lua title="run-calculator-with-new-drives.lua"}
+```
+The code starts by loading the calculator template from directory `"calculator-template"`.
+It then calls `machine:replace_memory_range(<memory_range_config>)` to replace the input NVRAM, identifying it by `label` and pointing `backing_store.data_filename` at the filename passed as the first argument to the script.
+A second call replaces the output NVRAM analogously, also setting `backing_store.shared` to `true` so results can be read from the file after the machine is executed.
+Finally, the script runs the machine until it halts or yields manual.
+
+To see the example running,
+```{.bash key=lua_calculator_with_new_drives vars=template->calc_template/calculator-template/path depends=run_calculator_with_new_drives replace=source}
+ln -sf "$template" .
+ln -sf "$RECIPES_DIR/run-calculator-with-new-drives.lua" .
+echo "6*2^1024 + 3*2^512" > input.raw
+truncate -s 4K input.raw
+truncate -s 4K output.raw
+# docs:begin
+lua5.4 run-calculator-with-new-drives.lua input.raw output.raw
+lua5.4 -e 'print((string.unpack("z", io.read("a"))))' < output.raw
+# docs:end
+```
+The result is, as expected,
+```{replace=lua_calculator_with_new_drives}
+```
+
+### State hashes
+
+State hashes (defined earlier under [State hashes](#state-hashes)) are Merkle tree root hashes of the machine's entire address space.
+Here we obtain them from a Cartesi Machine instance with the following script:
+```{.lua key=run_config_with_hashes include=run-config-with-hashes.lua title="run-config-with-hashes.lua"}
+```
+
+State hashes can be obtained with the `machine:get_root_hash()` method, which returns the corresponding Keccak-256 hash as a 32-byte binary string.
+State hashes are produced from an internal Merkle tree data structure that is maintained in a lazy fashion.
+The performance penalty imposed on the emulator, were it required to keep the Merkle tree up-to-date, would be unacceptable (by several orders of magnitude).
+If no state hashes are needed, the Merkle tree is not updated and negligible cost is incurred.
+However, depending on the extent to which the state was modified since the Merkle tree was last updated, the cost of implicitly updating it prior to returning the state hash can be substantial.
+
+In past releases, the Merkle tree was kept in memory only.
+When a machine was stored to disk with `machine:store(<directory>)`, the root hash was updated and stored along with the machine state.
+Then, when it was loaded with `machine:load(<directory>)`, the root hash was computed from scratch and compared against what was stored.
+
+Now, every address range in the machine has an associated `backing_store` that includes the `backing_store.dht_filename`
+(for dense hash tree) and `backing_store.dpt_filename` (for dirty-page tree) fields, and the `machine_config` includes a
+new `hash_tree` entry with `phtc_filename` (for page hash-tree cache) and `sht_filename` (for sparse hash tree) fields.
+These were added to enable persistent Merkle trees.
+A call to `machine:store(<directory>)` stores the Merkle tree structures in their current state.
+Conversely, `machine:load(<directory>)` loads the tree structure back up.
+Moreover, when these files are marked as `shared` in the configuration, the tree is maintained up-to-date on disk as well.
+This means that it is now possible to operate a machine entirely from disk with minimal additional overhead.
+
+Before running the machine, the script obtains the initial state hash, converts it to hexadecimal, and prints the result.
+The script then runs the machine until it halts or yields manual.
+Once the machine is halted, the script obtains and prints the final state hash.
+
+Initial state hashes can be used to ensure the machine instantiated by the script indeed matches the machine created by the `cartesi-machine` utility, and final state hashes to verify that computations also agree.
+The output of running
+```{.bash key=state_hashes_lua depends=run_config_with_hashes vars=config->nothing_to_do/config-nothing-to-do.lua/path replace=source}
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/run-config-with-hashes.lua" .
+# docs:begin
+lua5.4 run-config-with-hashes.lua config-nothing-to-do
+# docs:end
+```
+is exactly the same as the output of running the same Cartesi Machine via the `cartesi-machine` utility.
+```{.bash key=state_hashes_utility replace=source}
+cartesi-machine \
+    --initial-hash \
+    --final-hash
+```
+
+```{.bash key=reorder_state_hashes_lua vars=err->state_hashes_lua/stderr/path,out->state_hashes_lua/stdout/path replace=null}
+cat $err | head -n 1
+cat $out
+cat $err | tail -n +2
+```
+```{.bash key=reorder_state_hashes_utility vars=err->state_hashes_utility/stderr/path,out->state_hashes_utility/stdout/path replace=null}
+cat $err | head -n 1
+cat $out
+cat $err | tail -n +2
+```
+```{.text key=compare_utility_and_lua runner=bash replace=stdout vars=lua->reorder_state_hashes_lua/stdout/path,utility->reorder_state_hashes_utility/stdout/path}
+diff $lua $utility && cat $utility
+```
+
+Note that the initial state hashes and the final state hashes match, as expected.
+
+### External state access
+
+The entire Cartesi Machine state is transparently exposed to the controlling program.
+A variety of methods can be used to query a machine instance for any value in its state.
+
+The method `machine:read_word(<address>)` returns the 64-bit word at `<address>`, which must be 8-byte aligned.
+(Due to the alignment requirements, this always falls entirely inside a single address range.)
+
+The value of any register can be obtained by name with the `machine:read_reg("<name>")` method.
+The valid names are derived from the leaves of `processor.registers` in the [`processor_config`](#processor_config) schema by joining nested sub-tables with an underscore.
+For example, `processor.registers.htif.tohost` becomes `htif_tohost`, `processor.registers.iflags.H` becomes `iflags_H`, and `processor.registers.clint.mtimecmp` becomes `clint_mtimecmp`.
+(The call `machine:read_reg("mcycle")` has already been encountered several times.)
+In addition, the pre-decoded `dev`, `cmd`, `reason`, and `data` fields of the `htif_tohost` and `htif_fromhost` registers are exposed by appending the field name (e.g. `htif_tohost_reason`).
+Most registers are part of the [RISC-V ISA](https://content.riscv.org/wp-content/uploads/2017/05/riscv-spec-v2.2.pdf), and its [privileged architecture](https://content.riscv.org/wp-content/uploads/2017/05/riscv-privileged-v1.10.pdf).
+Cartesi-specific registers are described under the guest perspective sections that cover the [processor](#the-main-processor) and [board](#the-board) of the Cartesi Machine architecture.
+
+The method `machine:read_memory(<start>, <length>)` returns a string with `<length>` bytes starting at the physical-memory address `<start>`, anywhere in the machine address space.
+This region can fall inside RAM, any of the flash drives or NVRAMs, the DTB, the CMIO buffers etc.
+It can straddle two adjacent memory ranges, or even touch unmapped memory (which is presumed filled with zeros for
+this purpose).
+
+Conversely, any value in the state of a Cartesi Machine instance can be modified by the controlling program.
+In contrast to reading the state, writing to the state requires extreme care.
+First, for obvious reasons, external modifications to the state break the reproducibility of Cartesi Machines.
+Second, careless state modifications can easily panic the Linux kernel or crash any programs running under it.
+Nevertheless, there are a few scenarios where these modifications are safe and useful.
+
+The method `machine:write_word(<address>, <value>)` writes a 64-bit value at the 8-byte aligned `<address>`, with the same address range as `read_word`.
+
+The value of any register can be changed with the `machine:write_reg("<name>", <value>)` method, where `<name>` is one of the names accepted by `read_reg` and `<value>` is a 64-bit integer.
+
+The `machine:write_memory(<start>, <data>)` method writes the string `<data>` into any memory range in the state, starting at the physical-memory address `<start>`.
+In contrast to `machine:read_memory()`, the bytes in the string `<data>` must fit entirely inside a single memory range (i.e., they cannot straddle an address range boundary and cannot fall in a range mapped to a device, or in an unmapped region).
+Memory ranges include the RAM, the DTB, any of the flash drives or NVRAMs, the CMIO buffers, etc.
+
+The typical use for `machine:write_memory()` is when a new input to a Rolling Cartesi Machine has become available from Cartesi Rollups.
+Another use is when an input flash drive or NVRAM was instantiated without an image file, and is thus filled with zeros in the initial machine state.
+Before running the machine for the first time, it is safe to replace the contents of the range with the desired input.
+(Note, however, that if a memory range does have an associated `shared` image file, the `machine:write_memory()` method *will* modify the associated image file on disk as well as its mapping in the Cartesi Machine state.)
+Another use case is in low-level debugging sessions.
+(The `gdb` remote serial protocol requires the ability to externally modify the state.)
+
+As an example, consider the following script:
+```{.lua key=run_calculator include=run-calculator.lua title="run-calculator.lua"}
+```
+
+The script loads `calculator_config` from its Lua module `./config-calculator.lua` and instantiates a Cartesi Machine from it.
+This is the configuration for using the `bc` program to evaluate an arithmetic expression.
+The script locates the pristine input and output NVRAMs with the `cartesi.util.find_drive(<config>, <kind>, <label>)` helper, which returns the `<kind>` drive (here an `nvram`) carrying the given `<label>`, with its `log2_size` filled in.
+The script concatenates its command-line arguments, line-terminates them, and writes them at the start of the input NVRAM.
+It then runs the machine until it halts or yields manual.
+Finally, it reads the output NVRAM contents, extracts the first null-terminated string from it, and prints the result.
+
+Running the script with the command-line
+```{.bash key=lua_calculator vars=config->calc_run/config-calculator.lua/path depends=run_calculator replace=source}
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/run-calculator.lua" .
+truncate -s 4K input.raw output.raw
+# docs:begin
+lua5.4 run-calculator.lua 6*2^1024 + 3*2^512
+# docs:end
+```
+produces the output
+```{replace=lua_calculator/stdout}
+```
+The number is indeed the value of the expression 6&times;2<sup>1024</sup>+3&times;2<sup>512</sup>.
+
+External state modifications are widely used in the setup of artificial, unexpected conditions for regression tests.
+
+### State value proofs
+
+Value proofs concerning the state of the Cartesi Machine can be obtained from any instance using the method `machine:get_proof(<address>, <log2_target_size>[, <log2_root_size>])`.
+
+*State value proofs* are proofs that a given node in the Merkle tree of the Cartesi Machine state has a given hash.
+Each Merkle tree node covers a contiguous range of the machine's 64-bit address space.
+The size of a range is always a power of 2 (given by the `<log2_target_size>` parameter).
+Since the leaves have size []{replace=hash_tree_constants/word_size} bytes, the valid values for `<log2_target_size>` are []{replace=hash_tree_constants/log2_word_size}&hellip;[]{replace=hash_tree_constants/log2_root_size}.
+The range corresponding to each node starts at an `<address>` that is a multiple of its size.
+
+Recall that the state Merkle tree is maintained in a lazy fashion.
+Therefore, just like with the `machine:get_root_hash()` method, the Merkle tree will be implicitly updated to account for state changes.
+This means the time it takes to obtain a proof depends on the extent to which the state has been modified since the
+Merkle tree was last updated.
+
+The `machine:get_proof()` method returns a table with the following structure:
+```lua
+proof ::= {
+  root_hash ::= string,
+  target_hash ::= string,
+  sibling_hashes ::= {
+    [1] ::= string,
+    [2] ::= string,
+    ...
+    [log2_root_size-log2_target_size] ::= string
+  }
+}
+```
+
+Field `root_hash` is the root hash of the 2^`<log2_root_size>`-byte subtree containing `<address>`. The value of `<log2_root_size>` defaults to `cartesi.HASH_TREE_LOG2_ROOT_SIZE`, in which case `root_hash` equals the value returned by `machine:get_root_hash()`.
+The `target_hash` field contains the hash of the node corresponding to the `<address>` and `<log2_target_size>` arguments.
+
+To understand the contents of the `sibling_hashes` array, consider a path from the target node (included), up the Merkle tree, all the way to the root node (excluded).
+When this path is traversed, a number of nodes are visited.
+The `sibling_hashes` array contains the hashes of the *siblings* of all nodes visited.
+
+Using the data in a proof, it is possible to verify the claim that a Merkle tree with a given root hash contains a target node with a given hash and size at the position given by its address.
+The following script verifies the state value proof for the output NVRAM in the calculator example discussed above.
+It uses two helper functions from the `hash-tree.lua` sample module to check the proof returned by `machine:get_proof()`.
+These helpers are shown and explained under [Slicing and splicing](#slicing-and-splicing) in the Blockchain perspective.
+
+The `cartesi.keccak256(<string>)` function of the `cartesi` Lua module returns the hash of the byte string `<string>`.
+The `cartesi.keccak256(<hash1>, <hash2>)` overload returns the hash of the concatenation of `<hash1>` and `<hash2>`.
+The `cartesi.sha256(<string>)` and `cartesi.sha256(<hash1>, <hash2>)` functions behave analogously.
+
+The calculator script below requires the `hash-tree.lua` module and uses `verify_slice` to verify the output NVRAM proof.
+```{.lua key=run_calculator_with_proof include=run-calculator-with-proof.lua title="run-calculator-with-proof.lua"}
+```
+
+```{.lua key=proof_module include=../../usr/share/lua/5.4/cartesi/hash-tree.lua replace=null}
+```
+
+Running the script with the command-line
+```{.bash key=lua_calculator_with_proof vars=config->calc_run/config-calculator.lua/path depends=run_calculator_with_proof,proof_module replace=source}
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/run-calculator-with-proof.lua" .
+truncate -s 4K input.raw output.raw
+# docs:begin
+lua5.4 run-calculator-with-proof.lua 6*2^1024 + 3*2^512
+# docs:end
+```
+produces the output
+```{replace=lua_calculator_with_proof}
+```
+
+### Remote Cartesi Machines
+
+The Lua API can also be used to control a Remote Cartesi Machine.
+The functionality is available as the `cartesi.jsonrpc` module.
+Denote by `cartesi_jsonrpc` the module returned by `require"cartesi.jsonrpc"`.
+
+The `cartesi_jsonrpc.connect_server(<remote-address>[, <timeout-ms>])` function opens a connection to an existing Remote Cartesi Machine server and returns a handle to the connection.
+Denote the handle by `cartesi_jsonrpc_machine`.
+It is the remote counterpart to the local `cartesi.machine`, and behaves in the same way, other than being connected to the remote server and exposing additional server-control methods.
+
+The `cartesi_jsonrpc_machine:fork_server()` call creates a new server, in the same remote computer as the server `cartesi_jsonrpc_machine` points to, with an exact, independent copy of the current machine instance (if any), and returns a handle connected to this new server.
+
+Just as `cartesi.machine(<machine_config>)` instantiates a local machine, `cartesi_jsonrpc_machine(<machine_config>)` instantiates a remote machine in the server.
+Each server can hold a single machine, and therefore the machine handle returned is the server handle itself.
+It supports all methods that a local machine supports, and these behave in exactly the same way.
+Below, we describe only the remote-specific behavior.
+
+If a machine already exists in the server, trying to instantiate a new one will cause an error.
+Use the `cartesi_jsonrpc_machine:is_empty()` method to check if the server holds a machine instance (`cartesi_jsonrpc_machine:destroy()` destroys an existing instance).
+
+The `cartesi_jsonrpc_machine:get_server_version()` method returns a `semantic_version` object that contains the server version:
+```lua
+semantic_version ::= {
+  major ::= number,
+  minor ::= number,
+  patch ::= number,
+  pre_release ::= string,
+  build ::= string
+}
+```
+
+The `cartesi_jsonrpc_machine:set_cleanup_call(<call>)` method controls what happens when the handle is closed or garbage-collected.
+The three constants `cartesi_jsonrpc.NOTHING`, `cartesi_jsonrpc.DESTROY`, and `cartesi_jsonrpc.SHUTDOWN` select the cleanup action.
+In a handle created by `cartesi_jsonrpc.connect_server()`, this defaults to `NOTHING`.
+After all, the server was created by some other process that should control its cleanup.
+In a handle created by `cartesi_jsonrpc.spawn_server()`, this defaults to `SHUTDOWN`.
+The new server starts as owned by the current script, and when the handle is destroyed, so is the server process.
+
+The following script illustrates the use of the `cartesi.jsonrpc` module:
+```{.lua key=run_remote_config include=run-remote-config.lua title="run-remote-config.lua"}
+```
+The script loads the `cartesi.jsonrpc` module and connects to the server address given as the first command-line argument.
+It calls `cartesi_jsonrpc_machine:get_server_version()` to test the connection and prints the version number.
+It then instantiates a remote machine by calling `cartesi_jsonrpc_machine` with the configuration obtained from the second command-line argument, and runs it until it halts or yields.
+The `<close>` annotation combined with `set_cleanup_call(cartesi.jsonrpc.SHUTDOWN)` retires the server automatically when the script exits.
+
+Recall that, to run a server inside the playground, we opened a separate shell into the same playground container (for example, by running `docker exec -it playground /bin/bash`), and then ran the `cartesi-jsonrpc-machine` server in it
+```{.bash key=lua_remote outputs=server,client vars=config->nothing_to_do/config-nothing-to-do.lua/path depends=run_remote_config replace=source/server}
+{
+# docs:begin server
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8084
+# docs:end server
+} > server 2>&1 &
+srv_pid=$!
+while ! cartesi-machine --remote-address=127.0.0.1:8084 --remote-health-check > /dev/null 2>&1; do sleep 1; done
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/run-remote-config.lua" .
+{
+# docs:begin client
+lua5.4 run-remote-config.lua \
+    127.0.0.1:8084 \
+    config-nothing-to-do
+# docs:end client
+} > client 2>&1
+client_status=$?
+# If the client failed, it never sent SHUTDOWN, so the server would hang forever
+[ "$client_status" -ne 0 ] && kill "$srv_pid" 2>/dev/null
+wait "$srv_pid"
+```
+Now, instead of using the `cartesi-machine` command-line utility to control it, run the `run-remote-config.lua` client script in the other shell
+```{.bash replace=lua_remote/source/client}
+```
+The client shell produces
+```{replace=lua_remote/client}
+```
+The server shell produces
+```{replace=lua_remote/server}
+```
+
+### Rolling Cartesi Machines
+
+Guest applications running inside Rolling Cartesi Machines communicate with the outside world by using Cartesi Rollups.
+In production, the Cartesi Node is responsible for passing advance-state and inspect-state requests to the machine and collecting the responses (vouchers, notices, reports, and exceptions) that were generated while processing each request.
+When prototyping, the `cartesi-machine` command-line utility can be used to play the same part, loading sequentially-numbered requests from files and storing sequentially-numbered responses to files.
+Naturally, the Lua interface can also be used to feed requests to a Rolling Cartesi Machine and obtain the responses it produces.
+
+The guest application uses the `/dev/cmio` device (typically using the libcmt library) to notify the host it is done with the current request and ready for the next.
+While processing each request, it again uses the `/dev/cmio` device to notify the host of each new output or report it generates.
+In both cases, the host retrieves the yield _command_, _reason_, and request _data_ via `machine:receive_cmio_request()`.
+When transitioning between requests, the reason can take the values `cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED` (previous request was accepted), `cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED` (previous request was rejected), or `cartesi.HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION` (an unrecoverable error was encountered).
+When generating a new response to a request, the reason can take the self-explanatory values `cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT` (a voucher or notice) and `cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT`.
+
+The data associated with new requests is sent to the machine in the CMIO memory range defined by the `memory_range_config` entry stored in the `machine_config` as `cmio.rx_buffer`.
+Conversely, the data associated with responses (or exceptions) is obtained from the machine in the `cmio.tx_buffer` memory range.
+The host does not need to access these ranges directly.
+The call `machine:send_cmio_response(<revert_root_hash>, <reason>, <data>)` records `<revert_root_hash>` in the machine state, writes `<data>` into `cmio.rx_buffer`, records the reason and length in `htif_fromhost`, and clears `iflags_Y` so the machine can resume.
+Conversely, the _data_ value returned by `machine:receive_cmio_request()` is the contents of `cmio.tx_buffer` at the yield.
+
+Advance-state inputs are passed as ABI-encoded `EvmAdvance(uint256 chainId, address appContract, address msgSender, uint256 blockNumber, uint256 blockTimestamp, uint256 prevRandao, uint256 index, bytes payload)` calldata blobs.
+The _block timestamp_ field is in seconds since the _Unix epoch_, and the _prev randao_ field is a 32-byte big-endian unsigned integer.
+(See the table in the guest perspective [architecture](#rollup).)
+
+Outputs come back as ABI-encoded `Voucher(address,uint256,bytes)` or `Notice(bytes)` calldata blobs.
+Reports, exceptions, and inspect-state queries are raw payload bytes with no ABI wrapping.
+The `cartesi.evmu` Lua submodule provides `encode_calldata` and `decode_calldata` helpers for these signatures.
+
+The following script illustrates how the Lua API can be used to send advance-state requests to a Rolling Cartesi Machine, and how it can be used to collect the notices produced as responses (we will use the server calculator [example](#rolling-cartesi-machines)):
+
+```{.lua key=run_rolling_calculator include=run-rolling-calculator.lua}
+```
+Rolling Cartesi Machines must be rolled back to the state they were in before they received an advance-state request they later rejected.
+This requires snapshot and rollback support, which are easy to implement using the fork functionality of Remote Cartesi Machines.
+The script therefore uses the `cartesi.jsonrpc` module to instantiate a remote machine based on the `"rolling-calculator-template"`.
+The `machine:fork_server()` call creates a backup server with a copy of the current state.
+On rejection, the script shuts down the server that rejected the input, swaps the backup handle into `machine`, and rebinds it to the original server address.
+On acceptance, it shuts down the now-stale backup.
+
+It then enters its main loop, which is executed until the machine halts.
+For each iteration, the script invokes `machine:run(math.maxinteger)` to run the machine until it yields or halts.
+When the call returns, it checks if the machine yielded manual.
+If so, it checks the reason for the yield.
+
+If the reason was `cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED`, the application accepted the previous request and is ready for the next.
+The script then attempts to obtain a mathematical expression from the console.
+If the user provides one, it creates a new snapshot, ABI-encodes the expression as `EvmAdvance` calldata with `cartesi.evmu`, and feeds the encoded input through `machine:send_cmio_response(machine:get_root_hash(), cartesi.HTIF_YIELD_REASON_ADVANCE_STATE, ...)`.
+If, however, the reason was anything else, the script rolls back the machine and continues with the next loop iteration.
+
+:::note
+The `machine:get_root_hash()` passed to `machine:send_cmio_response()` is recorded into the machine state as the state hash to revert to in case the guest application rejects the input.
+This is required for dispute resolution to operate properly.
+:::
+
+If the machine yielded automatic, the script once again checks for the yield reason.
+If the reason was `cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT`, the script decodes the data as a `Notice` calldata blob, extracts its `payload` field as raw bytes, and prints the formatted result to the console.
+
+Here is what a session looks like.
+First, open a separate shell into the same docker container (for example, by running `docker exec -it playground /bin/bash`) and run the `cartesi-jsonrpc-machine` server in it
+```{.bash key=lua_rolling_calculator outputs=client,server depends=run_rolling_calculator vars=template->rolling_calc_template/rolling-calculator-template/path replace=source/server}
+rm -f rolling-calculator-template run-rolling-calculator.lua
+ln -sf "$template" .
+ln -sf "$RECIPES_DIR/run-rolling-calculator.lua" .
+{
+# docs:begin server
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8085
+# docs:end server
+} > server 2>&1 &
+srv_pid=$!
+while ! cartesi-machine --remote-address=127.0.0.1:8085 --remote-health-check 2>/dev/null; do sleep 1; done
+{
+# docs:begin client
+lua5.4 run-rolling-calculator.lua 127.0.0.1:8085
+# docs:end client
+} > client 2>&1 <<EOF
+6*2^1024 + 3*2^512
+1+(
+EOF
+client_status=$?
+# If the client failed, it never sent SHUTDOWN, so the server would hang forever
+[ "$client_status" -ne 0 ] && kill "$srv_pid" 2>/dev/null
+wait "$srv_pid"
+```
+Then, run the `run-rolling-calculator.lua` client script in the other shell
+```{.bash replace=lua_rolling_calculator/source/client}
+```
+The client prints the connection status to the console and then prompts us to type an expression.
+Entering `6*2^1024 + 3*2^512` causes the expected result to be printed, after which the client asks for a new expression.
+Entering an invalid expression `1+(` causes the `calc.sh` script running inside the Rolling Cartesi Machine to reject the input.
+Finally, entering `^D` causes the client script to exit and shut down the server.
+The full transcript is
+```{replace=lua_rolling_calculator/client}
+```
+The remote console shows only the error generated when the invalid expression `1+(` was entered:
+```{replace=lua_rolling_calculator/server}
+```
+
+### Output proofs
+
+Recall that the advance-state requests serviced by a Rolling Cartesi Machine are grouped into epochs.
+The outputs that these requests produce, across every epoch, are accumulated in order from genesis as the
+leaves of a single fixed-height Merkle tree.
+The root of this tree over the outputs accepted so far is the *output hashes root hash*.
+The guest writes it to the CMIO tx buffer on every accept, so it is part of the machine state.
+
+Disputes are settled over the machine state hash at the end of an epoch.
+The latest output hashes root hash sits in the tx-buffer in that state.
+A [state value proof](#state-value-proofs-1) of the tx-buffer word it occupies ties it to the state hash.
+Therefore, once the [verification game](#verification-game) settles the state hash, the output hashes root hash is settled with it.
+The blockchain then verifies any output with its *output proof* alone, checking that the leaf
+`keccak256(<output>)` rolls up to the settled output hashes root hash from its global output index.
+
+The `hash-tree.lua` sample module accumulates the output hashes tree with an incremental keccak Merkle accumulator
+whose leaves are `keccak256(<output>)`.
+A *frontier* captures the outputs accepted so far.
+At genesis, the frontier is `hash_tree.frontier(<log2_max_leaves>)`.
+The frontier for a later epoch can be obtained from the previous epoch's last output using `hash_tree.frontier(<last_output_proof>)`.
+As each output is accepted, `hash_tree.frontier_push_back(<frontier>, <leaf>)` folds its leaf in, and
+`hash_tree.frontier_get_root_hash(<frontier>)` yields the output hashes root hash to check against the one
+the guest wrote.
+Once the epoch closes, `hash_tree.frontier_next_proofs(<frontier>, <leaves>)` returns one proof per new
+output, all against the single final root.
+These helpers are shown and explained under [The output hashes tree](#the-output-hashes-tree) in the
+Blockchain perspective.
+
+The following script extends the Rolling Cartesi Machine calculator [example](#rolling-cartesi-machines-1) to collect output proofs and
+the state-value proof for the output hashes root hash.
+It buffers the outputs of each input until the input's verdict is known.
+On accept, it folds the buffered outputs into the running frontier, checks the resulting root against the
+output hashes root hash the guest wrote to the tx buffer, and saves the state value proof of that tx-buffer
+word, obtained with `machine:get_proof(cartesi.AR_CMIO_TX_BUFFER_START, cartesi.HASH_TREE_LOG2_WORD_SIZE)`,
+whose `target_hash` equals `cartesi.keccak256(<root hash>)`.
+On reject, it simply discards the buffered outputs, leaving the tree untouched.
+Once the epoch closes, it generates the per-output proofs against the final root and verifies each with the
+same `verify_slice` used above.
+```{.lua key=run_rolling_calculator_output_proofs include=run-rolling-calculator-output-proofs.lua title="run-rolling-calculator-output-proofs.lua"}
+```
+
+Here is what a session looks like.
+As before, open a separate shell into the same docker container and run the `cartesi-jsonrpc-machine` server
+in it
+```{.bash key=lua_rolling_calculator_output_proofs outputs=client,server depends=run_rolling_calculator_output_proofs vars=template->rolling_calc_template/rolling-calculator-template/path replace=source/server}
+rm -f rolling-calculator-template run-rolling-calculator-output-proofs.lua
+ln -sf "$template" .
+ln -sf "$RECIPES_DIR/run-rolling-calculator-output-proofs.lua" .
+{
+# docs:begin server
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8089
+# docs:end server
+} > server 2>&1 &
+srv_pid=$!
+while ! cartesi-machine --remote-address=127.0.0.1:8089 --remote-health-check 2>/dev/null; do sleep 1; done
+{
+# docs:begin client
+lua5.4 run-rolling-calculator-output-proofs.lua 127.0.0.1:8089
+# docs:end client
+} > client 2>&1 <<EOF
+6*2^1024 + 3*2^512
+EOF
+client_status=$?
+# If the client failed, it never sent SHUTDOWN, so the server would hang forever
+[ "$client_status" -ne 0 ] && kill "$srv_pid" 2>/dev/null
+wait "$srv_pid"
+```
+Then, run the `run-rolling-calculator-output-proofs.lua` client script in the other shell
+```{.bash replace=lua_rolling_calculator_output_proofs/source/client}
+```
+Entering `6*2^1024 + 3*2^512` produces the expected result, after which the client saves the tx-buffer-word
+proof tying the output hashes root hash into the accepting state, and then, once `^D` closes the epoch, the
+per-output proof against that root.
+The full transcript is
+```{replace=lua_rolling_calculator_output_proofs/client}
+```
+
+The same proofs are what the `cartesi-machine` command-line utility writes for each accepted input and output
+when given `--cmio-advance-state=output_hashes_root_hash_proof:<pattern>,output_proof:<pattern>`.
+Verifying these proofs against a machine state hash, from the blockchain's perspective, is shown under
+[Output verification](#output-verification).
+
+### State-transition proofs
+
+During verification, the blockchain mediates a [*verification game*](#verification-game) between the disputing parties.
+In brief, the parties agree on an initial state hash but claim different final state hashes.
+The game first narrows down the disagreement to the first main-processor instruction that deviates, and within it the first uarch instruction that deviates.
+After that, the honest party submits an access log, with Merkle-tree proofs for every value read from or written to the state, which the blockchain uses to identify the honest party.
+
+To obtain the access log for a specific uarch instruction in the execution of a Cartesi Machine instance, first advance to the last agreed `<mcycle>` using `machine:run(<mcycle>)`.
+Then advance the uarch to the last agreed `<uarch_cycle>` using `machine:run_uarch(<uarch_cycle>)`.
+Like `machine:run()`, `machine:run_uarch()` can return prematurely for a variety of reasons.
+It returns a break reason explaining why control was returned to the caller, taken from the `cartesi.UARCH_BREAK_REASON_*` set.
+For example, it returns `cartesi.UARCH_BREAK_REASON_UARCH_HALTED` if the uarch halted before reaching the target cycle.
+
+Once the target uarch cycle has been reached, use the `machine:log_step_uarch(<log_type>)` function to produce a log that advances to the next uarch cycle.
+Alternatively, if the uarch is halted at that point, use `machine:log_reset_uarch()` to produce the log that reverts the state of the uarch to its pristine form.
+Note that both functions actually perform the action, and therefore modify the uarch state, in addition to collecting the access log.
+The `<log_type>` argument is an integer bitfield formed by OR-ing `cartesi.ACCESS_LOG_TYPE_ANNOTATIONS` (to include the notes and brackets metadata consumed by the pretty-printer `util.print_log`) and `cartesi.ACCESS_LOG_TYPE_LARGE_DATA` (to include the full raw payload of large accesses, not just their hashes).
+Merkle-tree proofs are always included in the log.
+
+The format of the access log returned is as follows:
+
+```lua
+access_log ::= {
+  log_type ::= {
+    annotations ::= boolean,
+    large_data  ::= boolean
+  },
+  accesses ::= {
+    [1] ::= access,
+    [2] ::= access,
+    ...
+    [n] ::= access
+  },
+  notes ::= {
+    [1] ::= string,
+    ...
+    [n] ::= string
+  },
+  brackets ::= {
+    [1] ::= bracket,
+    ...
+    [m] ::= bracket
+  }
+}
+
+access ::= {
+  type         ::= "read" | "write",
+  address      ::= number,
+  log2_size    ::= number,
+  read_hash    ::= string,
+  read         ::= string,
+  written_hash ::= string,
+  written      ::= string,
+  proof        ::= proof
+}
+
+proof ::= {
+  target_address   ::= number,
+  log2_target_size ::= number,
+  log2_root_size   ::= number,
+  target_hash      ::= string,
+  root_hash        ::= string,
+  sibling_hashes   ::= {
+    [1] ::= string,
+    ...
+    [k] ::= string
+  }
+}
+
+bracket ::= {
+  type  ::= "begin" | "end",
+  where ::= number,
+  text  ::= string
+}
+```
+
+The `accesses` array records, in order, all accesses to the machine state performed during the execution of the uarch step.
+Accesses can be of `type` either `"read"` or `"write"`.
+The `address` field gives the physical address of the accessed region and `log2_size` gives its size as a power of two.
+The `read_hash` field contains the hash of the data as read before the access.
+For `"write"` accesses, `written_hash` contains the hash of the written data.
+The `read` and `written` fields carry the data itself.
+For accesses at or above the 32-byte hash-tree leaf granularity (`log2_size >= 5`), each field is exactly `2^log2_size` bytes long.
+For sub-leaf accesses (`log2_size < 5`, typically `log2_size = 3` for an 8-byte word), the field contains the entire enclosing aligned 32-byte tree leaf.
+The `proof` field is used when [verifying state transitions](#verifying-state-transitions).
+
+#### Inspecting access logs
+
+When `log_type` includes `cartesi.ACCESS_LOG_TYPE_ANNOTATIONS`, the access log includes annotations that help put each access into a larger context.
+
+The `notes` array contains a string corresponding to each entry in the `accesses` array, describing the word access.
+The `brackets` contain information that groups ranges of word accesses into *scopes*.
+Each bracket entry `type` field tells if the entry marks the `"begin"` or `"end"` of a scope.
+The `where` field gives the position in the `accesses` array where the bracket should be &ldquo;inserted&rdquo;.
+
+The `print_log(<log>, <out>)` function in the `cartesi.util` module uses these annotations to dump a detailed description of the access `<log>` into an open file object `<out>` (e.g., `io.stdout` or the value returned by `io.open()`).
+It indents each access according to the number of enclosing scopes and uses the notes to identify what each address refers to (a register, a CSR, memory).
+Addresses and values are printed in hexadecimal and decimal.
+
+Running the `dump-uarch-step.lua` program:
+
+```{.lua key=dump_uarch_step_source include=dump-uarch-step.lua title="dump-uarch-step.lua"}
+```
+with command:
+```{.bash key=dump_uarch_step vars=config->nothing_to_do/config-nothing-to-do.lua/path,cycles->cycles_htif_putchar,ucycles->cycles_uarch_putchar_ecall/stderr depends=dump_uarch_step_source replace=source/cmd}
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/dump-uarch-step.lua" .
+{
+# docs:begin cmd
+lua5.4 dump-uarch-step.lua config-nothing-to-do "$cycles" "$ucycles"
+# docs:end cmd
+}
+```
+produces the output:
+```{key=reorder_dump_uarch_step vars=out->dump_uarch_step/stdout/path,err->dump_uarch_step/stderr/path replace=stdout}
+cat $out
+cat $err
+```
+Understanding these logs in detail is unnecessary for all but the most low-level internal development at Cartesi.
+It requires deep knowledge not only of the RISC-V architecture, but also of how Cartesi's emulator implements it.
+The material is beyond the scope of this document.
+This particular example, however, was hand-picked for illustration purposes.
+The uarch step being executed is the ECALL micro-instruction that asks the emulator to print a line-feed (`0x0a`) to the console, completing the row `       \    / CARTESI` in the splash screen.
+
+#### Verifying state transitions
+
+Each access carries a `proof` field.
+Using the known state hash before the access, it is possible to verify that the `read` value was indeed the value stored at `address` in the machine state.
+For a `"write"` access, the `sibling_hashes` in the proof can be used to compute the new state hash.
+Doing this for each access in sequence yields the state hash at the end of the step.
+
+The method `machine:verify_step_uarch(<state_hash_before>, <access_log>, <state_hash_after>)` performs this verification, additionally checking that the accesses correspond to the operation of the Cartesi Machine uarch starting from `<state_hash_before>`.
+Note there is no need for a Cartesi Machine instance to verify a transition: all required state information is in the access log.
+
+The following script illustrates the verification of a state transition.
+
+```{.lua key=verify_uarch_step_source include=verify-uarch-step.lua title="verify-uarch-step.lua"}
+```
+
+Running the script without the optional tampering argument accepts the valid state transition:
+```{.bash key=verify_uarch_step_run vars=config->nothing_to_do/config-nothing-to-do.lua/path,cycles->cycles_htif_putchar,ucycles->cycles_uarch_putchar_ecall/stderr depends=verify_uarch_step_source replace=source/cmd}
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/verify-uarch-step.lua" .
+{
+# docs:begin cmd
+lua5.4 verify-uarch-step.lua config-nothing-to-do "$cycles" "$ucycles"
+# docs:end cmd
+} || true
+```
+```{replace=verify_uarch_step_run/stderr}
+```
+
+The script is much more interesting when the argument is used to &ldquo;mess&rdquo; with the access log before verification.
+For example, changing the address of access #7 (the write to `uarch.pc`) causes the program to reject the state transition proof:
+```{.bash key=verify_uarch_step_mess_address vars=config->nothing_to_do/config-nothing-to-do.lua/path,cycles->cycles_htif_putchar,ucycles->cycles_uarch_putchar_ecall/stderr depends=verify_uarch_step_source replace=source/cmd}
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/verify-uarch-step.lua" .
+{
+# docs:begin cmd
+lua5.4 verify-uarch-step.lua config-nothing-to-do "$cycles" "$ucycles" 'log.accesses[7].address = 0x100'
+# docs:end cmd
+} || true
+```
+```{replace=verify_uarch_step_mess_address/stderr}
+```
+
+Starting from `<state_hash_before>`, a true Cartesi Machine uarch would have written to `uarch.pc` at `0x400010` for the 7th access, not at `0x100` as our corrupt log claims.
+
+Changing the `written` data of the same access fails the access's internal consistency check, because `written` no longer hashes to `written_hash`:
+```{.bash key=verify_uarch_step_mess_written vars=config->nothing_to_do/config-nothing-to-do.lua/path,cycles->cycles_htif_putchar,ucycles->cycles_uarch_putchar_ecall/stderr depends=verify_uarch_step_source replace=source/cmd}
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/verify-uarch-step.lua" .
+{
+# docs:begin cmd
+lua5.4 verify-uarch-step.lua config-nothing-to-do "$cycles" "$ucycles" 'log.accesses[7].written = string.pack("<I8", 0x1234)..string.rep("\0", 24)'
+# docs:end cmd
+} || true
+```
+```{replace=verify_uarch_step_mess_written/stderr}
+```
+
+Changing the `read` data of access #5 (the read of `uarch.x17`) fails the same consistency check on the read side, because `read` no longer hashes to `read_hash`:
+```{.bash key=verify_uarch_step_mess_read vars=config->nothing_to_do/config-nothing-to-do.lua/path,cycles->cycles_htif_putchar,ucycles->cycles_uarch_putchar_ecall/stderr depends=verify_uarch_step_source replace=source/cmd}
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/verify-uarch-step.lua" .
+{
+# docs:begin cmd
+lua5.4 verify-uarch-step.lua config-nothing-to-do "$cycles" "$ucycles" 'log.accesses[5].read = string.pack("<I8", 0x1234)..string.rep("\0", 24)'
+# docs:end cmd
+} || true
+```
+```{replace=verify_uarch_step_mess_read/stderr}
+```
+
+Updating `read_hash` to match the tampered `read` passes the internal consistency check, but the verifier still combines `read_hash` with the proof's `sibling_hashes` to reconstruct the state hash before the access. That reconstruction no longer matches the expected root:
+```{.bash key=verify_uarch_step_mess_target_hash vars=config->nothing_to_do/config-nothing-to-do.lua/path,cycles->cycles_htif_putchar,ucycles->cycles_uarch_putchar_ecall/stderr depends=verify_uarch_step_source replace=source/cmd}
+ln -sf "$config" .
+ln -sf "$RECIPES_DIR/verify-uarch-step.lua" .
+{
+# docs:begin cmd
+lua5.4 verify-uarch-step.lua config-nothing-to-do "$cycles" "$ucycles" 'local a = log.accesses[5]; a.read = string.pack("<I8", 0x1234)..string.rep("\0", 24); a.read_hash = cartesi.keccak256(a.read)'
+# docs:end cmd
+} || true
+```
+```{replace=verify_uarch_step_mess_target_hash/stderr}
+```
+
+In a nutshell, only valid state transitions are accepted by the `machine:verify_step_uarch()` method.
+
+# The guest perspective
+
+The goal of the guest perspective is to serve both guest application-developers and guest system-developers.
+The documentation therefore starts from the familiar Linux environment that runs inside Cartesi Machines.
+This is the abstraction level at which guest application-developers interact with Cartesi Machines.
+The documentation then moves towards the system architecture implemented by Cartesi Machines, including Cartesi-specific extensions to the RISC-V architecture.
+This is what surrounds the Linux environment, and is the abstraction level at which guest system-developers work.
+
+This is, of course, not the most natural order for presenting the material.
+After all, running the Linux environment experienced by application-developers is only possible after successful initialization of the Linux kernel, which in turn depends on knowledge of the system architecture.
+However, presenting the material in that bottom-up order would quickly alienate application developers.
+Since there are many more application developers than system developers, we cater to the former.
+
+## Linux environment
+
+:::note
+[The host perspective](#the-host-perspective) section describes in detail the `cartesi-machine` command-line utility and the general structure of Cartesi Machines.
+In order to avoid repetition, this section assumes familiarity with the material presented there.
+:::
+
+The most direct way for guest developers to familiarize themselves with the Linux environment is to run the Cartesi Machine emulator in interactive mode.
+The `cartesi/machine-emulator-docs` Docker image comes pre-installed with the emulator, the default kernel and root file-system, and the host-side tooling used by the examples in this documentation (`xgenext2fs`, `pandoc`, the `e2tools` family, and assorted shell utilities).
+Inside that image, the following command instructs the emulator to load the default machine configuration and run a shell in interactive mode
+
+```{.bash replace=cmdline_interactive_ls_shown/source}
+```
+
+Once executed, the Cartesi Machine boots Linux and drops into an interactive shell (the `sh` argument in the command-line).
+
+```{replace=cmdline_interactive_ls/both}
+# Hidden setup. The user-facing command is shown in the bash block above.
+# To capture this interactive session non-interactively, we feed `ls /bin`
+# followed by the VEOF character (^D, byte 0x04) on stdin. The guest TTY's
+# line discipline turns ^D into a 0-byte read, so the shell exits cleanly
+# without an `exit` command -- and ^D itself is not echoed, so the
+# captured output is just the prompt, the command echo, the listing, and
+# the final prompt.
+# --no-init-splash is added so the captured output omits the init banner.
+printf 'ls /bin\n\x04' | cartesi-machine \
+    --no-init-splash \
+    -i \
+    --quiet \
+    --console-io=input_fd:0 \
+    -- sh 2>&1
+```
+
+The session shows a user listing the contents of `/bin/`, then leaving the emulator by pressing Ctrl+D at the prompt.
+The point of the exercise is that, from the inside, the environment will be familiar to any regular Unix user.
+
+One of the key differences is that, unlike stand-alone systems, many embedded systems are not self-hosting.
+None of the utilities visible inside the `/usr/bin/` and `/bin/` directories were built with a compiler that ran inside a Cartesi Machine.
+They were built in a separate host system, on which a cross-compiling toolchain for the target architecture has been installed.
+In the case of Linux, the key elements in the toolchain are the GNU Compiler Collection and the GNU C Library.
+Support for RISC-V is upstream in the official [GNU Compiler Collection](https://gcc.gnu.org/).
+The Rust language toolchain likewise supports RISC-V natively through [`rustup`](https://rustup.rs/).
+The examples below pull both toolchains in on demand via a multi-stage Docker build, so the only host-side prerequisite is `docker buildx`.
+
+### Building a custom root file-system
+
+To run a custom guest application inside the emulator, the most natural approach is to build a custom root file-system that replaces the default `rootfs.ext2`.
+The custom image contains the guest application alongside the Cartesi guest tools and any runtime dependencies.
+
+Once a custom image is in hand, there are two ways to put it in front of the emulator.
+A given `cartesi-machine` invocation can use `--flash-drive=label:root,data_filename:<path>.ext2` to override the default root flash drive with the file at `<path>`.
+The `root` label matches the label that `cartesi-machine` assigns to the default root flash drive, so this flag wins over the kernel-supplied default for the lifetime of that invocation.
+Alternatively, the file can be installed at `/usr/share/cartesi-machine/images/rootfs.ext2` (or symlinked there) so that every invocation picks it up by default.
+
+The example we work through here is the `rootfs-docs.ext2` image used by the `cartesi/machine-emulator-docs` Docker image as its `rootfs.ext2`.
+It contains a few small &ldquo;Hello world!&rdquo; programs in different languages, plus the `puppet` libcmt-rollup guest application used in the [rolling-machines walk-through](#rolling-cartesi-machines).
+The docs image installs it via the second mechanism above (`rootfs.ext2` symlinked to `rootfs-docs.ext2`), so the rest of this section can invoke `cartesi-machine` with no flash-drive override.
+
+Building the rootfs requires two host-side steps.
+The first assembles the rootfs with `docker buildx build --platform=linux/riscv64 --output type=tar`, which uses binfmt and QEMU to emulate riscv64 and emits the result as a flat tarball.
+The second converts the tarball into an ext2 image with [`xgenext2fs`](https://github.com/cartesi/genext2fs), which must be installed on the host (release `v1.5.6` or newer).
+
+:::note
+The fourth stage of the multi-stage Dockerfile runs natively on `riscv64` through `binfmt_misc` and QEMU emulation. Depending on your host platform's hardware (e.g., building on x86_64 vs. Apple Silicon), emulating RISC-V instructions during package installation and setup can introduce considerable execution overhead, leading to noticeably slower build times.
+:::
+
+The Dockerfile below illustrates the approach with a four-stage build.
+The first stage cross-compiles a C17 and a C++23 &ldquo;Hello world!&rdquo; program using `g++-14-riscv64-linux-gnu` from the Ubuntu archives, and the `puppet` libcmt-rollup guest application against the headers and shared library shipped by `machine-guest-tools` (downloaded as a tarball release artifact and extracted into a sysroot inside the build stage).
+The second stage cross-compiles an equivalent Rust program, using `rustup` and the same RISC-V GCC as the linker.
+The third stage cross-compiles an equivalent Go program using the upstream `golang` Docker image with `GOARCH=riscv64`.
+The fourth stage runs natively on riscv64 (through binfmt and QEMU), installs the Cartesi `machine-guest-tools` Debian package alongside `libstdc++6` and a handful of scripting language interpreters, and copies the compiled binaries and example scripts into `/home/dapp/`.
+The C, C++, Rust, and `puppet` binaries are dynamically linked against the rootfs's `libc`.
+The `puppet` binary also dynamically links to `libcmt.so`, which the `machine-guest-tools` Debian package installs at `/usr/lib/libcmt.so` inside the rootfs.
+The Go binary is fully static.
+The scripts depend on their interpreters being present.
+
+```{.dockerfile key=rootfs_docs_dockerfile include=Dockerfile.rootfs-docs}
+```
+
+The C source compiled in the first stage is the ubiquitous &ldquo;Hello world!&rdquo; program, printing 5 lines:
+
+```{.c key=hello_c_src include=hello/hello.c}
+```
+
+The C++ counterpart:
+
+```{.cpp key=hello_cpp_src include=hello/hello.cpp}
+```
+
+The same stage also cross-compiles `puppet`, the libcmt-rollup guest application used in the rolling-machines walk-through.
+Its source is shown under [The libcmt library](#the-libcmt-library).
+
+The second step converts the tarball into an ext2 image:
+
+```{.bash key=build_rootfs_docs include=build-rootfs-docs.sh}
+```
+
+The two additional flags here, relative to the base set introduced above, are `-r +50000` (reserve 50000 extra free blocks so the running system has room to write into the rootfs) and `-L docs` (ext2 volume label).
+
+### Guest &ldquo;Hello world!&rdquo;
+
+The C++ program can now be run inside the emulator.
+(The `machine-guest-tools` package post-install script creates the `dapp` Unix user, so the compiled binaries and example scripts will reside in `/home/dapp/`.)
+
+```{.bash key=hello_cpp depends=rootfs_docs_dockerfile,build_rootfs_docs,hello_cpp_src replace=source}
+cartesi-machine \
+    --no-init-splash \
+    -- /home/dapp/hello-cpp
+```
+The output is
+```{replace=hello_cpp}
+```
+
+The Dockerfile's second stage cross-compiles the following Rust program:
+
+```{.rust key=hello_rs_src include=hello/hello.rs}
+```
+
+The `rust-builder` stage runs `rustup target add riscv64gc-unknown-linux-gnu` and `cargo build --release --target riscv64gc-unknown-linux-gnu`, with `riscv64-linux-gnu-gcc` (from the `gcc-riscv64-linux-gnu` package) as the linker.
+The resulting binary is placed in `/home/dapp/hello-rust`.
+
+The Dockerfile's third stage cross-compiles the following Go program:
+
+```{.go key=hello_go_src include=hello/hello.go}
+```
+
+The `go-builder` stage builds with `GOARCH=riscv64 GOOS=linux CGO_ENABLED=0`, which uses Go's built-in cross-compilation toolchain to produce a fully-static binary.
+The resulting binary is placed in `/home/dapp/hello-go`.
+
+The rootfs also includes a selection of scripting language interpreters from the Ubuntu archives, so the same &ldquo;Hello world!&rdquo; can be realized in any of them:
+
+```{.forth key=hello_4th_src include=hello/hello.4th}
+```
+
+```{.awk key=hello_awk_src include=hello/hello.awk}
+```
+
+```{.js key=hello_js_src include=hello/hello.js}
+```
+
+```{.lua key=hello_lua_src include=hello/hello.lua}
+```
+
+```{.perl key=hello_pl_src include=hello/hello.pl}
+```
+
+```{.php key=hello_php_src include=hello/hello.php}
+```
+
+```{.python key=hello_py_src include=hello/hello.py}
+```
+
+```{.ruby key=hello_rb_src include=hello/hello.rb}
+```
+
+```{.bash key=hello_sh_src include=hello/hello.sh}
+```
+
+```{.tcl key=hello_tcl_src include=hello/hello.tcl}
+```
+
+The following shell script runs the examples one after another.
+In order not to bloat our example image, the heaviest interpreters were left out (Node.js, Ruby, and PHP).
+To add them back, uncomment the corresponding lines in the Dockerfile and in the `all.sh` script.
+
+```{.bash key=hello_all_src include=hello/all.sh}
+```
+
+Running it inside the custom rootfs:
+
+```{.bash key=hello_all depends=rootfs_docs_dockerfile,build_rootfs_docs,hello_c_src,hello_cpp_src,hello_rs_src,hello_go_src,hello_4th_src,hello_awk_src,hello_js_src,hello_lua_src,hello_pl_src,hello_php_src,hello_py_src,hello_rb_src,hello_sh_src,hello_tcl_src,hello_all_src replace=source}
+cartesi-machine \
+    --no-init-splash \
+    -- /home/dapp/all.sh
+```
+The output is
+```{replace=hello_all}
+```
+
+The take-away message is that developers can use the tools they are most familiar with to accomplish the task at hand.
+
+### Flash drives and NVRAMs
+
+Flash drives and NVRAMs are simply regions of physical memory accessible to the guest through different Linux drivers.
+
+Flash drives use the persistent-memory block-device driver `pmem-region`, which makes them accessible as block devices `/dev/pmem0` to `/dev/pmem7`.
+The initialization script added by `cartesi-machine` to the `machine_config` field `dtb.init` mounts any labeled flash
+drive containing a valid file-system at `/mnt/<label>`.
+In this fashion, file-systems present in all flash drives become available for use.
+
+The default kernel command-line parameter contains the substring `root=/dev/pmem0 rw`, which declares that the root file-system resides in device `/dev/pmem0`, i.e., flash drive 0, and that it should be mounted read-write.
+
+NVRAMs are raw byte buffers for guest code that needs unstructured memory without a file-system layer.
+They are backed by UIO devices, through driver `generic-uio`, and are accessible inside the guest as `/dev/uio0` to
+`/dev/uio7`.
+Unlike with flash drives, there is no page cache between the guest and the underlying memory range.
+
+Custom labels for flash drives and NVRAMs are published in the DTB `/aliases` node.
+The node also carries the auto-assigned aliases `flashdrive0` to `flashdrive7` and `nvram0` to `nvram7`.
+The `root` label is added by the `cartesi-machine` command-line utility as the custom label for `/dev/pmem0`.
+The command-line utilities `flashdrive`, `nvram`, and `memoryrange`, installed by `machine-guest-tools`, can translate
+these labels to the corresponding devices and their extents in physical memory.
+
+A flash drive or NVRAM holds whatever data is made available by the emulator in the corresponding guest physical memory region.
+The data can come from an image file specified during machine instantiation, from an image file specified after instantiation via the `machine:replace_memory_range(<memory_range_config>)` method, or through the external state access method `machine:write_memory()`.
+Additionally, the `readmmap` and `writemmap` utilities can read and write NVRAM or flash-drive ranges by label.
+
+Some scripting languages, like the Lua programming language, have packing and unpacking libraries that can be very helpful for structured data.
+
+For example, the previously discussed [arbitrary-precision calculator Cartesi Machine](#cartesi-machine-templates) is given the entrypoint
+
+```{.bash replace=calc_pipeline/source}
+```
+
+The input is a null-terminated string containing the expression to be evaluated.
+This string is stored inside an NVRAM with label `input`.
+The output is once again a null-terminated string with the result, this time stored inside an NVRAM with label `output`.
+
+The `readmmap input` command therefore reads the entire 4KiB of the input NVRAM and sends it to the standard output.
+The second command, `lua5.4 -e 'print((string.unpack("z", io.read("a"))))'`, extracts the first null-terminated string and prints it to standard output.
+This is the meaning of the `"z"` format argument to the `string.unpack()` function.
+There are a variety of other formats available, including reading integers of different sizes, big- or little-endian etc.
+Please see the [documentation for the `string.unpack()` function](https://www.lua.org/manual/5.4/manual.html#6.4.2) for more details.
+The string is received by the `bc` command-line utility.
+In the example, that string is `6*2^1024 + 3*2^512\n`.
+The `bc` command-line utility computes the value of the expression and sends it to standard out.
+This is finally received by `writemmap output`, which writes it to the output NVRAM.
+(No need to null-terminate, since the NVRAM is already completely filled with zeros.)
+
+### Initialization
+
+```{.lua key=ar_ram_start replace=null}
+local c = require "cartesi"
+io.write(string.format("0x%x", c.AR_RAM_START))
+```
+
+```{.lua key=ar_dtb_start replace=null}
+local c = require "cartesi"
+io.write(string.format("0x%x", c.AR_DTB_START))
+```
+
+Earlier versions of the emulator booted from a `rom.bin` image whose main purpose was to build, inside the guest
+itself, a [device tree](https://www.devicetree.org/) describing the hardware.
+Starting with version 0.16, the emulator builds the device tree in the host, at instantiation, derived from the machine configuration, and stores it in the DTB memory range immediately below RAM.
+The hart starts execution directly at the beginning of RAM (address []{replace=ar_ram_start}), where the RAM image is loaded.
+The start address of the DTB memory range ([]{replace=ar_dtb_start}) is pre-loaded in register `a1`, per the conventional RISC-V boot ABI.
+
+The Cartesi-provided `linux.bin` image is an OpenSBI `fw_payload` bundle, a small machine-mode firmware that exposes the Supervisor Binary Interface to Linux, linked together with the kernel.
+The firmware occupies the first 512KiB of RAM, declared as a no-map region in the device tree so the kernel does not touch it.
+OpenSBI initializes itself, then hands control to the kernel, passing along the address it received in `a1`.
+The kernel reads the device tree, loads drivers, and finishes its own initialization.
+
+When kernel initialization is complete, the kernel mounts the device named by the `root=` parameter, by default `/dev/pmem0`.
+It then executes the program named by `init=`, by default `/usr/sbin/cartesi-init`.
+
+The Cartesi-provided `cartesi-init` program sets up a basic Linux environment on which applications can run.
+It mounts `/proc`, `/dev/pts`, `/dev/shm`, `/sys`, `/tmp`, and `/run`, and sources any drop-in scripts under `/etc/cartesi-init.d/`.
+Next, it sources (as `root`) the script it reads from the device-tree node `/cartesi-machine/init`, which the emulator
+has filled from the contents of the `machine_config` at `dtb.init`.
+(The `cartesi-machine` utility adds there a script to mount each labeled flash drive carrying a recognized file-system
+at `/mnt/<label>`.)
+Finally, `cartesi-init` reads the entrypoint string from the device tree at `/cartesi-machine/entrypoint`, which the emulator fills from `machine_config` at `dtb.entrypoint`, and executes it in a shell, by default as user `dapp`.
+(This is where `cartesi-machine` puts the commands it finds after the `--` separator in the command-line.)
+
+Given a proper rootfs and an appropriate entrypoint, applications can run any general computation, consuming input from flash drives or NVRAMs and writing outputs to flash drives or NVRAMs, or run a Rolling Cartesi Machine loop that uses the `/dev/cmio` device to read inputs and write outputs (see below).
+When the application exits, control returns to `cartesi-init`, which unmounts file-systems and gracefully halts the machine.
+
+### Communication between guest and host
+
+Guest applications inside a Cartesi Machine drive the rollups model by issuing requests to the yield sub-device of HTIF, the Cartesi Machine's host-guest communication device.
+HTIF itself and its yield sub-device are described later, under the System architecture chapter.
+The Cartesi-extended Linux kernel produced by [`machine-linux-image`](https://github.com/cartesi/machine-linux-image) exposes the rollups communication protocol to user-space through a single character device file, `/dev/cmio`.
+
+Guest applications interact with `/dev/cmio` through one of four layers, in decreasing order of convenience.
+When available, the preferred path is a language binding of the `libcmt` library included in [`machine-guest-tools`](https://github.com/cartesi/machine-guest-tools).
+C and C++ can use libcmt directly.
+In the future, other language ecosystems (Rust, Go, JavaScript, Python, Lua, and so on) will wrap libcmt and expose the rollups interface idiomatically.
+In the meantime, applications written in languages without a libcmt binding talk to the device through the `/usr/bin/rollup-http-server` daemon, which translates HTTP requests into libcmt operations.
+For shell-driven workflows, `machine-guest-tools` also includes the `/usr/bin/rollup` command-line utility, a libcmt consumer that exposes single libcmt operations on standard input and standard output.
+And for the adventurous, or for tooling that needs to talk to the device directly for testing or debugging, the raw `/dev/cmio` `ioctl` interface itself is documented at the bottom of this section, alongside the lower-level `/usr/bin/yield` command-line utility.
+
+When the application yields, the emulator returns control to the host.
+The host either provides a new input to the guest application, or processes an output generated by it.
+Manual yields require the host to reset the `iflags_Y` register before the machine can resume.
+Automatic yields briefly set the `iflags_X` register, which the emulator clears on the next instruction.
+
+#### The libcmt library
+
+The libcmt library comes with the `machine-guest-tools` package, installed in the rootfs as `/usr/lib/libcmt.{so,a}` with public headers under `/usr/include/libcmt/`.
+The high-level rollups loop lives in `rollup.h`.
+The supporting headers (`abi.h`, `buf.h`, `io.h`, `keccak.h`, `merkle.h`, `util.h`) exist mostly to back it.
+
+The `rollup.h` API mirrors the lifecycle of a guest application.
+`cmt_rollup_init()` opens `/dev/cmio` and maps the receive and transmit buffers.
+`cmt_rollup_finish()` accepts or rejects the previous request and blocks until the next one arrives.
+A field in the returned `cmt_rollup_finish_t` indicates whether the new request is an `HTIF_YIELD_REASON_ADVANCE_STATE` or an `HTIF_YIELD_REASON_INSPECT_STATE`.
+For an advance, `cmt_rollup_read_advance_state()` decodes the ABI-encoded `EvmAdvance(uint256 chainId, address appContract, address msgSender, uint256 blockNumber, uint256 blockTimestamp, uint256 prevRandao, uint256 index, bytes payload)` calldata blob from the CMIO RX buffer into a `cmt_rollup_advance_t` struct with one field per parameter.
+For an inspect, `cmt_rollup_read_inspect_state()` returns just the payload.
+
+While processing a request, the application emits zero or more outputs.
+`cmt_rollup_emit_voucher()`, `cmt_rollup_emit_delegate_call_voucher()`, `cmt_rollup_emit_notice()`, `cmt_rollup_emit_report()`, and `cmt_rollup_emit_exception()` emit the named output.
+`cmt_rollup_progress()` reports a per-mille progress value as an automatic yield.
+The rules of the request/response protocol and the meaning of each output type are spelled out under Rolling Cartesi Machines, in the host-side chapter.
+Finally, `cmt_rollup_fini()` tears down the mappings and closes the device.
+
+The `puppet` guest application is a small libcmt rollup loop whose advance-state payloads are commands.
+It exercises every emit call of the `rollup.h` API in roughly fifty lines.
+
+```{.c key=puppet include=puppet.c title="puppet.c"}
+```
+
+After `cmt_rollup_init` opens the device, the program makes the first call to `cmt_rollup_finish` with `accept_previous_request = true`, which signals that the guest is ready and blocks for the first request.
+The accept here is not optional: the alternative would have `cmt_rollup_finish` ask the host to revert the machine state, which has no meaning before any request has been processed.
+Each subsequent advance-state payload is a verb (`notice`, `report`, `voucher`, `exception`, or `exit`) optionally followed by `:` and arbitrary data.
+The verb selects a libcmt call to make with that data.
+`notice:<data>`, `report:<data>`, and `voucher:<data>` emit the named output and accept the request.
+`exception:<data>` emits an exception, halting the machine.
+`exit` breaks out of the loop and returns from `main`, and the machine halts when `cartesi-init` reaps the process.
+Any payload that does not match a known verb causes the advance-state request to be rejected, so the host rolls the state back.
+For inspect-state requests, the program emits a single report echoing the query and accepts.
+The loop exits when an error escapes from any libcmt call, which is also what happens when the host signals end of input by halting the machine.
+
+We can drive `puppet` through the same command-line harness used earlier for the calculator under [Rolling Cartesi Machines](#rolling-cartesi-machines).
+First, encode two advance-state requests and one inspect-state query:
+```{.bash key=rolling_puppet_encode outputs=ls_bin replace=source}
+# docs:begin
+cartesi-rollup-data.lua encode advance > input-1.bin <<EOF
+{
+  "chain_id": 0,
+  "app_contract": "0x0000000000000000000000000000000000000000",
+  "msg_sender": "$(printf '0x%040d' 1)",
+  "block_number": 0,
+  "block_timestamp": 0,
+  "prev_randao": "0x0000000000000000000000000000000000000000000000000000000000000000",
+  "index": 1,
+  "payload": "$(printf 'notice:hello from input 1' | hex --encode)"
+}
+EOF
+cartesi-rollup-data.lua encode advance > input-2.bin <<EOF
+{
+  "chain_id": 0,
+  "app_contract": "0x0000000000000000000000000000000000000000",
+  "msg_sender": "$(printf '0x%040d' 2)",
+  "block_number": 0,
+  "block_timestamp": 0,
+  "prev_randao": "0x0000000000000000000000000000000000000000000000000000000000000000",
+  "index": 2,
+  "payload": "$(printf 'something the puppet does not understand' | hex --encode)"
+}
+EOF
+cartesi-rollup-data.lua encode inspect > query.bin <<EOF
+{
+  "payload": "$(printf 'hello from query!' | hex --encode)"
+}
+EOF
+# docs:end
+ls *.bin > ls_bin
+```
+
+Then run the server and client, instantiating the machine directly from `/home/dapp/puppet`:
+```{.bash key=rolling_puppet vars=rolling_puppet_encode outputs=server,client,output-0-input-1.bin,input-1-output-hashes-root-hash.bin,output-0-input-1-proof.lua,query-report-0.bin replace=source/server}
+ln -sf $rolling_puppet_encode/*.bin .
+{
+# docs:begin server
+cartesi-jsonrpc-machine \
+    --server-address=127.0.0.1:8086
+# docs:end server
+} > server 2>&1 &
+srv_pid=$!
+{
+# docs:begin client
+while ! cartesi-machine \
+    --remote-address=127.0.0.1:8086 \
+    --remote-health-check 2>/dev/null; do sleep 1; done
+cartesi-machine \
+    --no-init-splash \
+    --remote-address=127.0.0.1:8086 \
+    --remote-shutdown \
+    --cmio-advance-state=input_index_begin:1,input_index_end:3,hashes \
+    --cmio-inspect-state=hashes \
+    --final-hash \
+    -- /home/dapp/puppet
+# docs:end client
+} > client 2>&1
+client_status=$?
+[ "$client_status" -ne 0 ] && kill "$srv_pid" 2>/dev/null
+wait "$srv_pid"
+```
+```{.bash replace=rolling_puppet/source/server}
+```
+
+From a different shell in the same container, run the client
+```{.bash replace=rolling_puppet/source/client}
+```
+The payload of `input-1.bin` is `notice:hello from input 1`, so the `puppet` emits a single notice and accepts.
+The payload of `input-2.bin` does not match any known verb, so the `puppet` rejects the advance-state request and the client rolls the machine state back, discarding any side-effects from its processing.
+The contents of `query.bin` are echoed back as a report, and once again the state of the machine reverts after the inspect-state request is processed.
+
+The client shell shows
+```{replace=rolling_puppet/client}
+```
+
+As expected, the yields and state hashes shown here follow the same pattern detailed for the calculator under [Rolling Cartesi Machines](#rolling-cartesi-machines).
+
+The `cartesi-rollup-data.lua` utility decodes the records the run produced.
+The advance-state request carries the command `puppet` acted on
+```{.bash key=rolling_puppet_decode_advance vars=rolling_puppet replace=source}
+ln -sf $rolling_puppet/*.bin .
+# docs:begin
+cartesi-rollup-data.lua decode advance < input-1.bin
+# docs:end
+```
+```{.js replace=rolling_puppet_decode_advance}
+```
+The payload field carries the hex encoding of the bytes `notice:hello from input 1`, which the `puppet` parsed as a command to emit a notice with payload `hello from input 1`.
+
+Notices and reports carry only a payload, which we recover with
+```{.bash key=rolling_puppet_decode_notice vars=notice->rolling_puppet/output-0-input-1.bin/path replace=source}
+ln -sf $notice .
+# docs:begin
+cartesi-rollup-data.lua decode notice < output-0-input-1.bin | jq -j .payload | hex --decode
+# docs:end
+```
+```{.text replace=rolling_puppet_decode_notice}
+```
+```{.bash key=rolling_puppet_decode_report vars=report->rolling_puppet/query-report-0.bin/path replace=source}
+ln -sf $report .
+# docs:begin
+cartesi-rollup-data.lua decode report < query-report-0.bin | jq -j .payload | hex --decode
+# docs:end
+```
+```{.text replace=rolling_puppet_decode_report}
+```
+
+#### The rollup HTTP server
+
+For guest applications written in languages that have no libcmt binding, the `/usr/bin/rollup-http-server` daemon is the practical bridge to `/dev/cmio`.
+The daemon listens on a local HTTP port and translates each request it receives into a libcmt operation.
+The guest application's request/response loop runs in the application's own language and issues HTTP calls to the daemon to advance state, emit outputs, and finish requests.
+
+#### The rollup command-line utility
+
+The `/usr/bin/rollup` utility is a thin libcmt wrapper that exposes single libcmt operations on the command line, reading and writing JSON on standard input and standard output.
+It is intended for shell-driven demos and tests.
+Production applications should use either a libcmt language binding or `/usr/bin/rollup-http-server` instead.
+The [calculator that evaluates `bc` expressions](#rolling-cartesi-machines) earlier in this document drives a `rollup`-based loop from a shell script.
+
+For reference, the help text of the `rollup` utility is
+
+```{.bash key=cli_rollup_help replace=source}
+cartesi-machine \
+    --no-init-splash \
+    --quiet \
+    -- rollup --help
+```
+
+```{replace=cli_rollup_help}
+```
+
+#### The /dev/cmio device
+
+The raw `/dev/cmio` character device file is the kernel-level interface to the HTIF yield sub-device.
+Most users should not interact with it directly.
+Language bindings should be built on top of libcmt rather than `/dev/cmio` directly, because libcmt does more than carry traffic through the device.
+It also maintains the output hashes tree that Cartesi Rollups relies on to validate the application's outputs.
+The information that follows is useful for the curious and for tooling that needs to talk to the device directly for testing or debugging.
+
+The kernel UAPI header is `<linux/cartesi/cmio.h>`, whose struct definitions are the source of truth.
+The device exposes two `ioctl` requests.
+`IOCTL_CMIO_SETUP` takes a `struct cmio_setup` argument and fills it with descriptors for the receive and transmit buffers.
+The caller `mmap`s those buffers once, at startup, and accesses them directly thereafter.
+`IOCTL_CMIO_YIELD` takes a `struct cmio_yield` argument and yields control to the host, encoding the yield kind in the struct's fields.
+The two arguments are roughly
+
+```C
+struct cmio_setup {
+    struct { uint64_t data; uint64_t length; } tx, rx;
+};
+
+struct cmio_yield {
+    uint8_t  dev;     /* HTIF_DEVICE_YIELD */
+    uint8_t  cmd;     /* HTIF_YIELD_CMD_AUTOMATIC or HTIF_YIELD_CMD_MANUAL */
+    uint16_t reason;
+    uint32_t data;
+};
+```
+
+The `dev` field identifies the HTIF sub-device targeted by the request.
+HTIF distinguishes three sub-devices internally: halt, console, and yield.
+`/dev/cmio` carries only yield-class traffic, so the `dev` field must be `HTIF_DEVICE_YIELD`.
+The `cmd` field selects between an automatic yield, where the host resumes the machine without further action, and a manual yield, where the host must reset `iflags_Y` before the machine can resume.
+The `reason` field carries one of the constants below, and the `data` field carries an auxiliary 32-bit value whose meaning is reason-specific.
+
+The reasons paired with `HTIF_YIELD_CMD_AUTOMATIC` are
+`HTIF_YIELD_AUTOMATIC_REASON_PROGRESS` (the `data` field carries a per-mille progress value),
+`HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT` (a voucher, delegate-call voucher, or notice has been written to the transmit buffer), and
+`HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT` (a report has been written to the transmit buffer).
+
+The reasons paired with `HTIF_YIELD_CMD_MANUAL` are
+`HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED` (the application has accepted the previous request and is ready for the next, and the host sets the `data` field on resume to `HTIF_YIELD_REASON_ADVANCE_STATE` or `HTIF_YIELD_REASON_INSPECT_STATE` to indicate the type of the freshly loaded input in the receive buffer),
+`HTIF_YIELD_MANUAL_REASON_RX_REJECTED` (the application has rejected the previous request, and the host reverts the machine state and replies with the next request as above), and
+`HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION` (the application has emitted an exception payload to the transmit buffer and the machine cannot continue).
+
+For convenience, `machine-guest-tools` also includes a `/usr/bin/yield` utility that sends a single yield request from the shell, useful for tests and one-off demos.
+It is a direct wrapper for `IOCTL_CMIO_YIELD` and only supports yield-class requests, so it does not send halt or console requests to HTIF.
+Its usage is
+
+```{.bash key=cli_yield_help replace=source}
+{
+{
+# docs:begin
+cartesi-machine \
+    --no-init-splash \
+    --quiet \
+    -- yield
+# docs:end
+} || true
+} | grep -v -e 'Too few arguments' -e '^$'
+```
+
+```{replace=cli_yield_help}
+```
+
+## System architecture
+
+The RISC-V ISA consists of a minimal integer instruction set to which several extensions can be added.
+The standard defines a privileged architecture with features commonly used by modern operating systems, such as multiple privilege levels, page-based virtual memory, timers, interrupts, exceptions and traps, etc.
+Implementations are free to select the combination of extensions that best suits their needs.
+
+The Cartesi Machine architecture can be separated into a main processor, a board, and a microarchitecture (uarch).
+The processor performs the computations, executing the traditional fetch-execute loop while maintaining a variety of registers.
+The board defines the surrounding environment with an assortment of memories (RAM, flash drives, NVRAMs, CMIO buffers, etc.) and a number of devices.
+The uarch includes its own smaller processor and memory, invisible to the main processor, with full access into its inner workings.
+It can drive the main processor at a finer granularity that is suitable for dispute resolution in the context of blockchains.
+
+The Cartesi Machine maps its entire state to the physical address space in a well-defined way.
+This includes the internal states of the main processor, of the uarch processor, of all attached devices, and the contents of all memories.
+This state completely defines the Cartesi Machine.
+
+A full description of the RISC-V ISA is outside the scope of this documentation. (See volumes [1 and 2](https://riscv.org/technical/specifications/) of the ISA specification for details.)
+This section describes the RISC-V architecture of the main processor and uarch, the modifications made to support verification, the devices supported by the emulator, and the process the machine follows to boot the Linux kernel.
+
+### The main processor
+
+Following RISC-V terminology, the Cartesi Machine's main processor implements the `RV64IMAFDCZicsr_Zifencei` ISA.
+The letters after RV specify the extension set.
+This selection corresponds to a 64-bit machine, integer arithmetic with multiplication and division, atomic operations, single- and double-precision floating-point arithmetic, and compressed instructions, as well as the optional supervisor and user privilege levels.
+In addition, Cartesi Machines support the Sv39 mode of address translation and memory protection.
+Sv39 provides a 39-bit protected virtual address space, divided into 4KiB pages, organized by a three-level page table.
+This set of features creates a balanced compromise between the simplicity demanded by a blockchain implementation and the flexibility expected from off-chain computations.
+
+Even so, the instruction set remains compact.
+Most instructions are very simple and can be emulated in a few lines of high-level code.
+In contrast, the x86 ISA defines at least 2000 (potentially complex) instructions.
+In fact, the only complex operation in RISC-V is the virtual-to-physical address translation.
+Instruction decoding is particularly simple due to the reduced number of formats taking 32 or 16 bits.
+
+The entire processor state fits within 848 bytes, divided into 106 registers, each holding 64 bits.
+It consists of 32 general-purpose integer registers (`x0`&hellip;`x31`), 32 floating-point registers (`f0`&hellip;`f31`), and 42 standard or Cartesi-specific control registers.
+The last 8 of those control registers persist the externally-visible state of the board's CLINT, PLIC, and HTIF subsystems, which is otherwise also reachable through the device-mapped addresses described in the next section.
+The processor makes its entire state available, externally and read-only, by mapping every register to the start of the physical address space (in the <i>processor shadow</i>, a 4KiB range).
+The mapping is given in the following table:
+
+```{.lua key=reg_addr replace=null outputs=x0,x1,x31,mcycle,pc,fcsr,f0,f1,f31,iprv,mstatus,mtvec,mscratch,mepc,mcause,mtval,misa,mie,mip,medeleg,mideleg,mcounteren,menvcfg,mvendorid,marchid,mimpid,stvec,sscratch,sepc,scause,stval,satp,scounteren,senvcfg,ilrsc,icycleinstret,iunrep,iflags_X,iflags_Y,iflags_H,clint_mtimecmp,plic_girqpend,plic_girqsrvd,htif_tohost,htif_fromhost,htif_ihalt,htif_iconsole,htif_iyield}
+local cartesi = require "cartesi"
+local names = {"x0", "x1", "x31", "mcycle", "pc", "fcsr", "f0", "f1", "f31", "iprv",
+    "mstatus", "mtvec", "mscratch", "mepc", "mcause", "mtval", "misa", "mie", "mip",
+    "medeleg", "mideleg", "mcounteren", "menvcfg", "mvendorid", "marchid", "mimpid",
+    "stvec", "sscratch", "sepc", "scause", "stval", "satp", "scounteren", "senvcfg",
+    "ilrsc", "icycleinstret", "iunrep",
+    "iflags_X", "iflags_Y", "iflags_H",
+    "clint_mtimecmp", "plic_girqpend", "plic_girqsrvd",
+    "htif_tohost", "htif_fromhost", "htif_ihalt", "htif_iconsole", "htif_iyield"}
+for _, name in ipairs(names) do
+    local f = assert(io.open(name, "w"))
+    f:write(string.format("0x%03x", cartesi.machine:get_reg_address(name)))
+    f:close()
+end
+```
+
+| Offset | Register | Offset | Register | Offset | Register | Offset | Register |
+|--------|----------|--------|----------|--------|----------|--------|----------|
+| []{replace=reg_addr/x0} | `x0` | []{replace=reg_addr/mtvec} | `mtvec` | []{replace=reg_addr/marchid} | `marchid` | []{replace=reg_addr/iflags_X} | `iflags_X` |
+| []{replace=reg_addr/x1} | `x1` | []{replace=reg_addr/mscratch} | `mscratch` | []{replace=reg_addr/mimpid} | `mimpid` | []{replace=reg_addr/iflags_Y} | `iflags_Y` |
+| `...` | `...` | []{replace=reg_addr/mepc} | `mepc` | []{replace=reg_addr/stvec} | `stvec` | []{replace=reg_addr/iflags_H} | `iflags_H` |
+| []{replace=reg_addr/x31} | `x31` | []{replace=reg_addr/mcause} | `mcause` | []{replace=reg_addr/sscratch} | `sscratch` | []{replace=reg_addr/clint_mtimecmp} | `clint_mtimecmp` |
+| []{replace=reg_addr/mcycle} | `mcycle` | []{replace=reg_addr/mtval} | `mtval` | []{replace=reg_addr/sepc} | `sepc` | []{replace=reg_addr/plic_girqpend} | `plic_girqpend` |
+| []{replace=reg_addr/pc} | `pc` | []{replace=reg_addr/misa} | `misa` | []{replace=reg_addr/scause} | `scause` | []{replace=reg_addr/plic_girqsrvd} | `plic_girqsrvd` |
+| []{replace=reg_addr/fcsr} | `fcsr` | []{replace=reg_addr/mie} | `mie` | []{replace=reg_addr/stval} | `stval` | []{replace=reg_addr/htif_tohost} | `htif_tohost` |
+| []{replace=reg_addr/f0} | `f0` | []{replace=reg_addr/mip} | `mip` | []{replace=reg_addr/satp} | `satp` | []{replace=reg_addr/htif_fromhost} | `htif_fromhost` |
+| []{replace=reg_addr/f1} | `f1` | []{replace=reg_addr/medeleg} | `medeleg` | []{replace=reg_addr/scounteren} | `scounteren` | []{replace=reg_addr/htif_ihalt} | `htif_ihalt` |
+| `...` | `...` | []{replace=reg_addr/mideleg} | `mideleg` | []{replace=reg_addr/senvcfg} | `senvcfg` | []{replace=reg_addr/htif_iconsole} | `htif_iconsole` |
+| []{replace=reg_addr/f31} | `f31` | []{replace=reg_addr/mcounteren} | `mcounteren` | []{replace=reg_addr/ilrsc} | `ilrsc` | []{replace=reg_addr/htif_iyield} | `htif_iyield` |
+| []{replace=reg_addr/iprv} | `iprv` | []{replace=reg_addr/menvcfg} | `menvcfg` | []{replace=reg_addr/icycleinstret} | `icycleinstret` | | |
+| []{replace=reg_addr/mstatus} | `mstatus` | []{replace=reg_addr/mvendorid} | `mvendorid` | []{replace=reg_addr/iunrep} | `iunrep` | | |
+
+The only generally relevant standard register is&nbsp;`mcycle`.
+Since its value is advanced at every CPU cycle, it can be used to identify a particular step in the computation being performed by a Cartesi Machine.
+This is a key component of the verification process, and can also be used to bound the amount of computation.
+
+The registers whose names start with &ldquo;`i`&rdquo; are Cartesi additions, and have the following semantics:
+
+* Register&nbsp;`iprv` holds the current privilege level (0 for User, 1 for Supervisor, and 3 for Machine).
+* Register&nbsp;`iflags_X` is set to 1 when the processor has performed an automatic yield.
+The emulator clears it again as soon as the machine resumes.
+* Register&nbsp;`iflags_Y` is set to 1 when the processor has performed a manual yield.
+It remains set until the host clears it (either directly, or as a side effect of `send_cmio_response`).
+* Register&nbsp;`iflags_H` is set to 1 to signal the processor has been permanently halted.
+* Register&nbsp;`ilrsc` holds the reservation address for the&nbsp;LR/SC atomic memory operations.
+* Register&nbsp;`icycleinstret` holds the difference between `mcycle` and the architectural instruction count.
+* Register&nbsp;`iunrep` is non-zero in machines configured as unreproducible, a creation-time mode that enables host VirtIO devices in exchange for giving up state-hash verifiability.
+
+### The microarchitecture
+
+In normal execution (i.e., via `machine:run(<max_mcycle>)`), the Cartesi Machine emulator runs programs in an _interpreter_ that has been compiled to run natively on the host computer.
+The execution of this program modifies the registers and memories and interacts with the devices accessible to the main processor.
+The Cartesi Machine uarch can be seen as a lower-level emulator.
+The uarch is not visible to the main processor, but code running in the uarch has access to the entire state of the Cartesi Machine, including the main processor and the entire board.
+The same interpreter source-code for the Cartesi Machine that runs on the host can also be compiled to an `uarch.bin` binary that runs exactly one fetch-execute iteration of the main processor and then halts the uarch.
+In its pristine state, the uarch memory is loaded with this `uarch.bin`.
+Therefore, executing the uarch until it halts, and then resetting the uarch to its pristine state, is equivalent to executing one instruction of the main processor.
+This finer granularity enables state-transition proofs in architectures, such as blockchains, that lack sufficient computation power to reliably verify complex main-processor instructions (e.g., floating-point division and square-root, virtual-memory page-walks, TLB invalidations, etc.).
+It also greatly reduces the number and complexity of the instructions the blockchain must be taught to simulate.
+See [State-transition proofs](#state-transition-proofs) for details.
+
+In contrast to the main processor, the uarch processor implements the much more restricted RV64I set.
+This includes only 52 instructions, the implementation of which can be directly translated to run in any programmable blockchain.
+It has 32 general-purpose integer registers (`uarch_x0`&hellip;`uarch_x31`), a program counter&nbsp;(`uarch_pc`), a cycle counter&nbsp;(`uarch_cycle`), and a halt flag&nbsp;(`uarch_halt_flag`).
+Like the main processor, the uarch makes its entire state available, externally and read-only, by mapping every register to its own 4KiB <i>uarch shadow</i> range.
+The mapping is given in the following table:
+
+```{.lua key=uarch_reg_addr replace=null outputs=uarch_halt_flag,uarch_cycle,uarch_pc,uarch_x0,uarch_x1,uarch_x31}
+local cartesi = require "cartesi"
+local names = {"uarch_halt_flag", "uarch_cycle", "uarch_pc",
+    "uarch_x0", "uarch_x1", "uarch_x31"}
+for _, name in ipairs(names) do
+    local f = assert(io.open(name, "w"))
+    f:write(string.format("0x%06x", cartesi.machine:get_reg_address(name)))
+    f:close()
+end
+```
+
+| Offset | Register | Offset | Register |
+|--------|----------|--------|----------|
+| []{replace=uarch_reg_addr/uarch_halt_flag} | `uarch_halt_flag` | []{replace=uarch_reg_addr/uarch_x0} | `uarch_x0` |
+| []{replace=uarch_reg_addr/uarch_cycle} | `uarch_cycle` | []{replace=uarch_reg_addr/uarch_x1} | `uarch_x1` |
+| | | `...` | `...` |
+| []{replace=uarch_reg_addr/uarch_pc} | `uarch_pc` | []{replace=uarch_reg_addr/uarch_x31} | `uarch_x31` |
+
+In addition to being able to access all memory ranges and devices visible to the main processor, the uarch includes a private 2MiB of RAM.
+
+### The board
+
+The interaction between board and processor happens through interrupts and the memory bus. Devices are mapped to the processor's physical address space.
+The mapping can be seen in the following table:
+
+```{.lua key=ar_table replace=null outputs=shadow,tlb,pmas,pmas_start,clint,htif,virtio,plic,cmio_rx,cmio_tx,dtb,ram_start,uarch_shadow,uarch_ram}
+local c = require "cartesi"
+local function write(name, content)
+    local f = assert(io.open(name, "w"))
+    f:write(content)
+    f:close()
+end
+local function range_se(start, e) return string.format("0x%08x-0x%08x", start, e) end
+local function range_sl(start, len) return range_se(start, start + len - 1) end
+write("shadow",       range_se(c.AR_SHADOW_STATE_START,      c.AR_SHADOW_TLB_START - 1))
+write("tlb",          range_sl(c.AR_SHADOW_TLB_START,        c.AR_SHADOW_TLB_LENGTH))
+write("pmas",         range_sl(c.AR_PMAS_START,              c.AR_PMAS_LENGTH))
+write("pmas_start",   string.format("0x%x",                  c.AR_PMAS_START))
+write("clint",        range_sl(c.AR_CLINT_START,             c.AR_CLINT_LENGTH))
+write("htif",         range_sl(c.AR_HTIF_START,              c.AR_HTIF_LENGTH))
+write("virtio",       range_se(c.AR_FIRST_VIRTIO_START,      c.AR_LAST_VIRTIO_END - 1))
+write("plic",         range_sl(c.AR_PLIC_START,              c.AR_PLIC_LENGTH))
+write("cmio_rx",      range_sl(c.AR_CMIO_RX_BUFFER_START,    1 << c.AR_CMIO_RX_BUFFER_LOG2_SIZE))
+write("cmio_tx",      range_sl(c.AR_CMIO_TX_BUFFER_START,    1 << c.AR_CMIO_TX_BUFFER_LOG2_SIZE))
+write("dtb",          range_sl(c.AR_DTB_START,               c.AR_DTB_LENGTH))
+write("ram_start",    string.format("0x%x",                  c.AR_RAM_START))
+write("uarch_shadow", range_sl(c.UARCH_SHADOW_START_ADDRESS, c.UARCH_SHADOW_LENGTH))
+write("uarch_ram",    range_sl(c.UARCH_RAM_START_ADDRESS,    c.UARCH_RAM_LENGTH))
+```
+
+| Physical address | Mapping |
+|------------------|---------|
+| []{replace=ar_table/shadow} | Processor and board shadow |
+| []{replace=ar_table/tlb} | Shadow TLB |
+| []{replace=ar_table/pmas} | PMA Array |
+| []{replace=ar_table/uarch_shadow} | Uarch shadow |
+| []{replace=ar_table/uarch_ram} | Uarch RAM |
+| []{replace=ar_table/clint} | Core Local Interruptor (CLINT) |
+| []{replace=ar_table/htif} | Host-Target Interface (HTIF) |
+| []{replace=ar_table/virtio} (*unreproducible mode only*) | VirtIO devices |
+| []{replace=ar_table/plic} | Platform-Level Interrupt Controller (PLIC) |
+| []{replace=ar_table/cmio_rx} | CMIO RX buffer |
+| []{replace=ar_table/cmio_tx} | CMIO TX buffer |
+| []{replace=ar_table/dtb} | Device tree (DTB) |
+| []{replace=ar_table/ram_start}-[]{replace=ar_table/ram_start}+`ram.length`-1 | RAM |
+| *configurable with constraints* | Flash drive or NVRAM 0 |
+| ... | ... |
+| *configurable with constraints* | Flash drive or NVRAM 7 |
+
+Execution starts at the beginning of RAM, where the bootloader (an OpenSBI&nbsp;`fw_payload` bundle that wraps the Linux kernel) is loaded from `linux.bin`.
+The amount of RAM is user-configurable, but always starts at address []{replace=ar_table/ram_start}.
+The DTB occupies a fixed region immediately below RAM and carries the kernel command line, the description of every other range, and the init/entrypoint scripts.
+
+Flash drives must start after []{replace=ar_table/ram_start}+`ram.length`-1, end before []{replace=ar_table/ram_start}+64TiB, and be aligned to 2MiB.
+
+NVRAMs have much lighter requirements.
+Their start and length must be aligned to 4KiB page boundaries, but can otherwise start and end anywhere below the 2<sup>56</sup> limit as long as their length is less than 128TiB.
+
+:::note
+For the relentlessly curious, here are the reasons for these constraints:
+
+Flash drives are exposed via the persistent-memory block-device driver `pmem-region`.
+The kernel adds this memory to its physical memory map and reaches it through the direct linear mapping, a dedicated region of the kernel's virtual address space where physical memory is mapped contiguously using fixed offsets rather than page-table traversals.
+Both buffered I/O through the page cache and direct access (DAX) rely on this mapping, so the constraints below hold regardless of how a drive is accessed.
+
+The linear mapping begins where RAM begins, at []{replace=ar_table/ram_start}.
+A Cartesi Machine fixes RAM at this address because it is the standard RISC-V layout, the 2GiB DRAM base used by QEMU's `virt` board and expected by firmware such as OpenSBI, with the lower 2GiB reserved for boot and memory-mapped devices.
+Since those lower addresses are not general-purpose memory, a flash drive must start at []{replace=ar_table/ram_start} or higher.
+The kernel caps the mapping at 64TiB, reserving the rest of the Sv48 address space for other kernel subsystems, so a drive must end no later than []{replace=ar_table/ram_start}+64TiB-1.
+Finally, a flash drive's start and length must be multiples of 2MiB, because the kernel brings persistent-memory regions online only in 2MiB subsections and cannot map a region whose start or end falls off that boundary. This is a generic Linux requirement, not something specific to RISC-V or to the Cartesi Machine.
+
+NVRAMs are exposed as UIO devices via the `generic-uio` driver, which allows user-space applications to directly interact with hardware, bypassing the page cache and the direct linear mapping.
+The kernel dynamically creates isolated virtual memory mappings for device registers and memory.
+
+UIO devices map directly to hardware addresses, so they must start and end below the 2<sup>56</sup> limit, the maximum
+physical address space supported by Sv48.
+Their dynamic mappings must align with 4KiB page boundaries, which establishes valid page table entries without altering access permissions for adjacent physical memory.
+(The Cartesi Machine itself imposes the same alignment constraint.)
+The maximum contiguous virtual memory available for user-space processes is 128TiB, half of the total 256TiB Sv48 virtual address space.
+(The limit for kernel-space mappings managed by the `vmalloc` and `ioremap` subsystems is even smaller, 32TiB, reserving the remaining kernel virtual address space for the direct linear mapping and fixed structures.)
+:::
+
+The board also maps non-memory devices to the physical address space: CLINT, HTIF, PLIC, and (in unreproducible machines only) one or more VirtIO devices.
+
+#### CLINT
+
+```{.lua key=clint_rtc_freq_div replace=null}
+local cartesi = require "cartesi"
+io.write(cartesi.RTC_FREQ_DIV)
+```
+The Core Local Interruptor (or CLINT) controls the timer interrupt.
+The active addresses are&nbsp;`0x0200bff8`&nbsp;(`mtime`) and&nbsp;`0x02004000`&nbsp;(`mtimecmp`).
+The CLINT issues a hardware interrupt whenever&nbsp;`mtime` equals&nbsp;`mtimecmp`.
+Since Cartesi Machines must ensure reproducibility, the processor's clock and the timer are locked by a constant frequency divisor of&nbsp;[]{replace=clint_rtc_freq_div}.
+In other words, `mtime` is incremented once for every []{replace=clint_rtc_freq_div} increments of&nbsp;`mcycle`.
+There is no notion of wall-clock time.
+
+#### HTIF
+
+The Host-Target Interface (HTIF) mediates communication with the external world.
+It is mapped to physical memory starting at `0x40008000`, where registers can be accessed at the following offsets:
+
+| Offset | Register |
+|--------|----------|
+| `0x000` | `tohost` |
+| `0x008` | `fromhost` |
+| `0x010` | `ihalt` |
+| `0x018` | `iconsole` |
+| `0x020` | `iyield` |
+| `0x028` | *Reserved* |
+| `...` | `...` |
+| `0x218` | *Reserved* |
+
+The format of registers `tohost` and `fromhost` is as follows: <p></p>
+
+| Bits | `63-56` | `55-48` | `47-32` | `31-0` |
+|-------|---------|---------|---------|--------|
+| Field | `DEV` | `CMD` | `REASON` | `DATA` |
+
+Interactions with Cartesi's HTIF device use the following protocol:
+
+1. start by writing 0 to `fromhost`;
+1. write the <i>request</i> to `tohost`;
+1. read the <i>response</i> from `fromhost`.
+
+Cartesi's HTIF supports 3 subdevices: Halt, Console, and Yield.
+These are identified by the following values for the field `DEV`.
+
+```{.lua key=htif_const replace=null outputs=HTIF_DEV_HALT,HTIF_DEV_CONSOLE,HTIF_DEV_YIELD,HTIF_HALT_CMD_HALT,HTIF_CONSOLE_CMD_GETCHAR,HTIF_CONSOLE_CMD_PUTCHAR,HTIF_YIELD_CMD_AUTOMATIC,HTIF_YIELD_CMD_MANUAL,HTIF_YIELD_AUTOMATIC_REASON_PROGRESS,HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT,HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT,HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED,HTIF_YIELD_MANUAL_REASON_RX_REJECTED,HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION,HTIF_YIELD_REASON_ADVANCE_STATE,HTIF_YIELD_REASON_INSPECT_STATE}
+local cartesi = require "cartesi"
+for _, n in ipairs({"HTIF_DEV_HALT", "HTIF_DEV_CONSOLE", "HTIF_DEV_YIELD",
+        "HTIF_HALT_CMD_HALT", "HTIF_CONSOLE_CMD_GETCHAR", "HTIF_CONSOLE_CMD_PUTCHAR",
+        "HTIF_YIELD_CMD_AUTOMATIC", "HTIF_YIELD_CMD_MANUAL",
+        "HTIF_YIELD_AUTOMATIC_REASON_PROGRESS", "HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT",
+        "HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT", "HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED",
+        "HTIF_YIELD_MANUAL_REASON_RX_REJECTED", "HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION",
+        "HTIF_YIELD_REASON_ADVANCE_STATE", "HTIF_YIELD_REASON_INSPECT_STATE"}) do
+    local f = assert(io.open(n, "w"))
+    f:write(tostring(cartesi[n]))
+    f:close()
+end
+```
+
+| Name | `DEV` |
+|------|-------|
+| `HTIF_DEV_HALT` | []{replace=htif_const/HTIF_DEV_HALT} |
+| `HTIF_DEV_CONSOLE` | []{replace=htif_const/HTIF_DEV_CONSOLE} |
+| `HTIF_DEV_YIELD` | []{replace=htif_const/HTIF_DEV_YIELD} |
+
+Registers `ihalt`, `iconsole`, and `iyield` are bit masks specifying the commands that are available for the respective devices.
+Unavailable commands are silently ignored by the machine.
+
+##### Halt
+
+| Name | `CMD` |
+|------|-------|
+| `HTIF_HALT_CMD_HALT` | []{replace=htif_const/HTIF_HALT_CMD_HALT} |
+
+The Halt device (`DEV=HTIF_DEV_HALT`) is used to halt the machine.
+This will permanently set register `iflags_H` to 1 and return control back to the host.
+
+Send request `CMD=HTIF_HALT_CMD_HALT` with bit 0 of the 32-bit `DATA` field (bits 31&ndash;0) set to&nbsp;1.
+The remaining bits 31&ndash;1 of `DATA` carry an arbitrary exit code, read as `DATA >> 1`, following the convention used by the RISC-V test framework.
+The `cartesi-machine` utility reports this value as the machine's exit code.
+
+##### Console
+
+| Name | `CMD` |
+|------|-------|
+| `HTIF_CONSOLE_CMD_GETCHAR` | []{replace=htif_const/HTIF_CONSOLE_CMD_GETCHAR} |
+| `HTIF_CONSOLE_CMD_PUTCHAR` | []{replace=htif_const/HTIF_CONSOLE_CMD_PUTCHAR} |
+
+The Console device (`DEV=HTIF_DEV_CONSOLE`) can be used to input/output characters.
+
+To input a character from console (in interactive sessions), request `CMD=HTIF_CONSOLE_CMD_GETCHAR`, `DATA=0`, then read response `CMD=HTIF_CONSOLE_CMD_GETCHAR`, `DATA=<ch>+1` (`DATA=0` means no character was available).
+
+To output a character `<ch>` to console, request `CMD=HTIF_CONSOLE_CMD_PUTCHAR`, with `DATA=<ch>`.
+
+##### Yield
+
+The Yield device can be used to return control to the host.
+There are two types of yield: _automatic_ and _manual_.
+
+| Name | `CMD` |
+|------|-------|
+| `HTIF_YIELD_CMD_AUTOMATIC` | []{replace=htif_const/HTIF_YIELD_CMD_AUTOMATIC} |
+| `HTIF_YIELD_CMD_MANUAL` | []{replace=htif_const/HTIF_YIELD_CMD_MANUAL} |
+
+To issue an automatic yield, request `CMD=HTIF_YIELD_CMD_AUTOMATIC`.
+An automatic yield sets register `iflags_X` to 1 and returns control back to the host.
+There are currently 3 supported reasons for automatic yields:
+
+| Name | `REASON` |
+|------|----------|
+| `HTIF_YIELD_AUTOMATIC_REASON_PROGRESS` | []{replace=htif_const/HTIF_YIELD_AUTOMATIC_REASON_PROGRESS} |
+| `HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT` | []{replace=htif_const/HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT} |
+| `HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT` | []{replace=htif_const/HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT} |
+
+To report `progress`, set `REASON=HTIF_YIELD_AUTOMATIC_REASON_PROGRESS`, and `DATA=<permil>`, where `<permil>` gives the progress in per-mille.
+The other reasons for automatic yield signal the production of Cartesi Rollups responses.
+`REASON=HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT` denotes the production of an output (a voucher, delegate-call voucher, or notice) and `REASON=HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT` denotes the production of a report.
+In both cases, the guest writes the payload to the CMIO TX buffer and `DATA` carries the payload length in bytes.
+
+To issue a manual yield, request `CMD=HTIF_YIELD_CMD_MANUAL`.
+A manual yield sets register `iflags_Y` to 1 and returns control back to the host.
+There are currently 3 supported reasons for manual yields, all used with Cartesi Rollups:
+
+| Name | `REASON` |
+|------|----------|
+| `HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED` | []{replace=htif_const/HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED} |
+| `HTIF_YIELD_MANUAL_REASON_RX_REJECTED` | []{replace=htif_const/HTIF_YIELD_MANUAL_REASON_RX_REJECTED} |
+| `HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION` | []{replace=htif_const/HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION} |
+
+To accept or reject the previous request, set `REASON=HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED` or
+`REASON=HTIF_YIELD_MANUAL_REASON_RX_REJECTED`, respectively.
+On accept, the guest writes the root hash of the output hashes tree to the CMIO TX buffer, and `DATA` in `tohost` carries the length of that hash in bytes.
+On reject, `DATA` is ignored.
+Upon return, the host has loaded the next request into the CMIO RX buffer.
+The `REASON` field in `fromhost` carries the request type, and the `DATA` field carries the request length in bytes.
+
+| Name | `REASON` in response |
+|------|----------------------|
+| `HTIF_YIELD_REASON_ADVANCE_STATE` | []{replace=htif_const/HTIF_YIELD_REASON_ADVANCE_STATE} |
+| `HTIF_YIELD_REASON_INSPECT_STATE` | []{replace=htif_const/HTIF_YIELD_REASON_INSPECT_STATE} |
+
+To signal the throwing of a rollup exception, set `REASON=HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION`.
+The guest writes the exception payload to the CMIO TX buffer and `DATA` in `tohost` carries the payload length in bytes.
+
+Before resuming the emulator after a manual yield, the host must manually reset register `iflags_Y` to 0.
+Otherwise, the emulator will immediately return with no changes to its state.
+
+#### Rollup
+
+In order to interact with Cartesi Rollups, the host application controlling the emulator and the guest application running inside the emulator must follow an agreed-upon protocol, mediated by the HTIF Yield device.
+
+The low-level view of what happens inside the machine is as follows:
+```
+Initialize
+`reason` = HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED
+`length` = 0
+Repeat
+    Yield manual with `reason` as `REASON` and `length` as `DATA` in `tohost`
+    If `REASON` in `fromhost` is HTIF_YIELD_REASON_ADVANCE_STATE
+        Read ABI-encoded EvmAdvance(...) from CMIO RX buffer
+        Process advance-state request
+        For each output to emit (voucher, delegate-call voucher, or notice)
+            Write ABI-encoded output to CMIO TX buffer and its length to `length`
+            Add output hash to output hashes tree
+            Yield automatic with HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT as `REASON` and `length` as `DATA` in `tohost`
+        End
+        For each report to emit
+            Write raw report data to CMIO TX buffer and its length to `length`
+            Yield automatic with HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT as `REASON` and `length` as `DATA` in `tohost`
+        End
+        If exception to emit
+            Write raw exception data to CMIO TX buffer and its length to `length`
+            `reason` = HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION
+        ElseIf input rejected
+            `length` = 0
+            `reason` = HTIF_YIELD_MANUAL_REASON_RX_REJECTED
+        Else
+            Write output hashes root hash to CMIO TX buffer
+            `length` = hash size
+            `reason` = HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED
+        End
+    ElseIf `REASON` in `fromhost` is HTIF_YIELD_REASON_INSPECT_STATE
+        Read raw query from CMIO RX buffer
+        Process inspect-state request
+        For each report to emit
+            Write raw report data to CMIO TX buffer and its length to `length`
+            Yield automatic with HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT as `REASON` and `length` as `DATA` in `tohost`
+        End
+        If exception to emit
+            Write raw exception data to CMIO TX buffer and its length to `length`
+            `reason` = HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION
+        Else
+            `length` = 0
+            `reason` = HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED
+        End
+    Else
+        `length` = 0
+        `reason` = HTIF_YIELD_MANUAL_REASON_RX_REJECTED
+    End
+End
+```
+At a higher level, the guest application running inside the emulator is supported by the libcmt library or by even higher-level interfaces based on it, such as the `/usr/bin/rollup` command-line utility, the HTTP API exposed by the `/usr/bin/rollup-http-server` command-line utility, or a language-specific framework.
+The libcmt library handles ABI encoding and decoding, maintains the output hashes tree in userspace, and uses the `/dev/cmio` device driver to move data to and from the CMIO buffers and perform the required yields.
+See [The libcmt library](#the-libcmt-library), [The /dev/cmio device](#the-devcmio-device), [The rollup command-line utility](#the-rollup-command-line-utility), and [The rollup HTTP server](#the-rollup-http-server) for the corresponding interfaces.
+
+There are two types of request: advance-state requests and inspect-state requests.
+The loop processes one request per iteration.
+To transition between requests, the application accepts the previous request, rejects it, or throws an exception.
+The return from the accept yield defines the type of the next request.
+
+When the application identifies an advance-state request, it reads the ABI-encoded input from the CMIO RX buffer.
+While processing advance-state requests, the application can emit outputs (vouchers, delegate-call vouchers, or notices) and reports, in any order.
+Outputs and reports are written to the CMIO TX buffer.
+Outputs contribute to the output hashes tree maintained by libcmt.
+When the application is ready to accept the next input, libcmt writes the current output hashes root hash to the CMIO TX buffer as part of the accept yield.
+
+When an application identifies an inspect-state request, it reads the raw query from the CMIO RX buffer.
+While processing inspect-state requests, the application can emit reports.
+Reports are written to the CMIO TX buffer and do not affect the output hashes tree.
+
+Instead of accepting or rejecting a request, the application can emit an exception to signal some unrecoverable error.
+The exception is also written to the CMIO TX buffer.
+
+Advance-state inputs and outputs exchanged through the CMIO buffers follow the Solidity ABI specification.
+Advance-state inputs arrive in the CMIO RX buffer as `EvmAdvance(uint256 chainId, address appContract, address msgSender, uint256 blockNumber, uint256 blockTimestamp, uint256 prevRandao, uint256 index, bytes payload)`.
+Vouchers are encoded as `Voucher(address destination, uint256 value, bytes payload)`.
+Delegate-call vouchers are encoded as `DelegateCallVoucher(address destination, bytes payload)`.
+Notices are encoded as `Notice(bytes payload)`.
+Reports, inspect queries, and exceptions travel as raw bytes.
+
+In the host, the loop is as follows:
+```
+Save fresh fork of machine as a snapshot
+Repeat
+    Obtain the next request from an external source
+    If advance-state request
+        Write the current state hash to the state at AR_SHADOW_REVERT_ROOT_HASH_START
+        Write ABI-encoded EvmAdvance(...) to CMIO RX buffer and its length to `length`
+        Write HTIF_YIELD_REASON_ADVANCE_STATE to `REASON` and `length` as `DATA` in `fromhost`
+        Reset register `iflags_Y` to 0
+        While register `iflags_H` is 0 and register `iflags_Y` is 0 (neither halted nor manual yield)
+            Resume machine
+            If register `iflags_X` is set (automatic yield)
+                If `REASON` in `tohost` is HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT
+                    `length` = `DATA` from `tohost`
+                    Read ABI-encoded output from CMIO TX buffer using `length`
+                End
+                If `REASON` in `tohost` is HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT
+                    `length` = `DATA` from `tohost`
+                    Read raw report data from CMIO TX buffer using `length`
+                End
+            End
+        End
+        If register `iflags_Y` is not 0 (machine yielded manual)
+            If `REASON` in `tohost` is HTIF_YIELD_MANUAL_REASON_RX_REJECTED
+                Replace machine with fresh fork of snapshot
+            End
+            If `REASON` in `tohost` is HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED
+                `length` = `DATA` from `tohost` (length of hash)
+                Read output hashes root hash from CMIO TX buffer using `length`
+                Replace snapshot with fresh fork of machine
+            End
+            If `REASON` in `tohost` is HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION
+                `length` = `DATA` from `tohost`
+                Read raw exception data from CMIO TX buffer using `length`
+                Abort
+            End
+        End
+        If register `iflags_H` is not 0 (machine is halted)
+            Abort
+        End
+    End
+    If inspect-state request
+        Write raw query to CMIO RX buffer and its length to `length`
+        Write HTIF_YIELD_REASON_INSPECT_STATE to `REASON` and `length` as `DATA` in `fromhost`
+        Reset register `iflags_Y` to 0
+        While register `iflags_H` is 0 and register `iflags_Y` is 0 (neither halted nor manual yield)
+            Resume machine
+            If register `iflags_X` is set (automatic yield)
+                If `REASON` in `tohost` is HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT
+                    `length` = `DATA` from `tohost`
+                    Read raw report data from CMIO TX buffer using `length`
+                End
+            End
+        End
+        Replace machine with fresh fork of snapshot
+    End
+End
+```
+The host controls the emulator via the C, Lua, or JSON-RPC APIs.
+It loops obtaining requests from an external source.
+Processing requests modifies the state of the machine.
+However, at the end of a request, the host may have to revert these changes.
+Therefore, the host keeps a snapshot of the state of the machine before any request is processed.
+
+For an advance-state request, the host sends the request with `machine:send_cmio_response()`, passing the current state hash for the machine to record.
+(This, of course, changes the state so its hash is not what has just been written, but this is expected.)
+The call also writes the request to the CMIO RX buffer and its type and length to the HTIF register `fromhost`, and unblocks the machine by clearing its `iflags_Y` register.
+The machine is now ready to be resumed.
+The host loops resuming the machine and collecting its outputs or reports every time it yields automatic.
+The guest application is eventually done with the input.
+If it rejects the input, the host drops the current machine and replaces it with a copy of the snapshot.
+If it accepts the input, the host replaces the snapshot with a copy of the current machine, and collects the new output hashes root hash.
+If it threw an exception or halted, the host aborts.
+
+For an inspect-state request, the loop is very similar.
+The differences are that only reports are collected (outputs are ignored), and that the machine is always reverted back to a copy of its snapshot.
+
+#### Address ranges
+
+A Cartesi Machine contains many address ranges.
+The address ranges visible to the main processor are mapped at fixed positions in its 64-bit physical address space.
+These are the ranges listed in the [board mapping table](#the-board) at the start of this chapter, exposed to Lua via the `cartesi.AR_*` constants, and discoverable at runtime via the [PMA array](#pmas) described in the next subsection.
+
+The uarch has its own private address ranges, which are not accessible to the main processor:
+
+| Physical address | Mapping |
+|------------------|---------|
+| []{replace=ar_table/uarch_shadow} | Microarchitecture shadow |
+| []{replace=ar_table/uarch_ram} | Microarchitecture RAM |
+
+The uarch shadow holds the uarch processor state.
+The uarch RAM holds the uarch program that decodes and executes one main processor instruction per uarch run before halting.
+
+#### PMAs
+
+Each address range visible to the main processor is described by an entry in the array of Physical Memory Attribute records (PMAs).
+The PMA array occupies []{replace=ar_table/pmas} and starts at address []{replace=ar_table/pmas_start} (exposed as `cartesi.AR_PMAS_START`).
+This is how the RISC-V interpreter discovers the available ranges at runtime, regardless of whether it is compiled to run directly on the host or inside a ZK prover.
+The microarchitecture's private ranges are not visible to the main processor and have no PMA entries, though a driver id is reserved for the uarch shadow state for consistency.
+
+Each PMA consists of 2 64-bit words.
+The first word gives the start of a range and the second word its length.
+These words are readable both internally and externally.
+Since the ranges must be aligned to 4KiB page boundaries, the lowest 12 bits of each word are available for attributes.
+The meaning of each attribute field is as follows:
+First word:
+
+| Bits | `63-12` | `11-8` | `7` | `6` | `5` | `4` | `3` | `2` | `1` | `0` |
+|------|---------|--------|-----|-----|-----|-----|-----|-----|-----|-----|
+| Field | `start` | `DID` | `IW` | `IR` | `X` | `W` | `R` | `E` | `IO` | `M` |
+
+The `M`, `IO`, and `E` bits are mutually exclusive, and respectively mark the range as memory, I/O mapped, or excluded.
+Bits `R`, `W`, and&nbsp;`X` mark read, write, and execute permissions, respectively.
+The `IR` and&nbsp;`IW` bits mark the range as idempotent for reads and writes, respectively.
+Finally, the `DID` gives the driver id, which can have the following values:
+
+```{.lua key=pma_did replace=null outputs=PMA_EMPTY_DID,PMA_MEMORY_DID,PMA_SHADOW_STATE_DID,PMA_FLASH_DRIVE_DID,PMA_CLINT_DID,PMA_HTIF_DID,PMA_PLIC_DID,PMA_CMIO_RX_BUFFER_DID,PMA_CMIO_TX_BUFFER_DID,PMA_SHADOW_UARCH_STATE_DID,PMA_VIRTIO_DID,PMA_NVRAM_DID}
+local cartesi = require "cartesi"
+for _, n in ipairs({"PMA_EMPTY_DID", "PMA_MEMORY_DID", "PMA_SHADOW_STATE_DID",
+        "PMA_FLASH_DRIVE_DID", "PMA_CLINT_DID", "PMA_HTIF_DID", "PMA_PLIC_DID",
+        "PMA_CMIO_RX_BUFFER_DID", "PMA_CMIO_TX_BUFFER_DID",
+        "PMA_SHADOW_UARCH_STATE_DID", "PMA_VIRTIO_DID", "PMA_NVRAM_DID"}) do
+    local f = assert(io.open(n, "w"))
+    f:write(tostring(cartesi[n]))
+    f:close()
+end
+```
+
+| Name | Value |
+|------|-------|
+| `PMA_EMPTY_DID` | []{replace=pma_did/PMA_EMPTY_DID} |
+| `PMA_MEMORY_DID` | []{replace=pma_did/PMA_MEMORY_DID} |
+| `PMA_SHADOW_STATE_DID` | []{replace=pma_did/PMA_SHADOW_STATE_DID} |
+| `PMA_FLASH_DRIVE_DID` | []{replace=pma_did/PMA_FLASH_DRIVE_DID} |
+| `PMA_CLINT_DID` | []{replace=pma_did/PMA_CLINT_DID} |
+| `PMA_HTIF_DID` | []{replace=pma_did/PMA_HTIF_DID} |
+| `PMA_PLIC_DID` | []{replace=pma_did/PMA_PLIC_DID} |
+| `PMA_CMIO_RX_BUFFER_DID` | []{replace=pma_did/PMA_CMIO_RX_BUFFER_DID} |
+| `PMA_CMIO_TX_BUFFER_DID` | []{replace=pma_did/PMA_CMIO_TX_BUFFER_DID} |
+| `PMA_SHADOW_UARCH_STATE_DID` | []{replace=pma_did/PMA_SHADOW_UARCH_STATE_DID} |
+| `PMA_VIRTIO_DID` | []{replace=pma_did/PMA_VIRTIO_DID} |
+| `PMA_NVRAM_DID` | []{replace=pma_did/PMA_NVRAM_DID} |
+
+Second word:
+
+| Bits | `63-12` | `11-0` |
+|------|---------|--------|
+| Field | `length` | *Reserved (=0)* |
+
+The list of PMA records ends with an invalid PMA entry for which `length=0`.
+
+### Linux setup
+
+By default, `pc` starts at the beginning of RAM (address []{replace=ar_ram_start}), where the RAM image is loaded.
+The emulator builds a [<i>devicetree</i>](https://www.devicetree.org/) describing the hardware at instantiation time, derived from the machine configuration, and writes it into the DTB memory range immediately below RAM.
+The start address of the DTB ([]{replace=ar_dtb_start}) is pre-loaded in register&nbsp;`a1`, per the conventional RISC-V boot ABI.
+
+The `dtc` command-line utility can be used to inspect the devicetree:
+
+```{.bash key=dtc replace=source outputs=pmem,pmem_start}
+# docs:begin
+cartesi-machine \
+    --no-init-splash \
+    --quiet \
+    --user=root \
+# docs:begin null
+	--store-config=config.json \
+# docs:end null
+    -- "dtc -I dtb -O dts /sys/firmware/fdt"
+# docs:end
+printf "%x" $(jq '.flash_drive[0].start' < config.json) > pmem_start
+printf "pmem@%s" $(cat pmem_start) > pmem
+```
+
+The result is
+```{.text replace=dtc}
+```
+
+The `memory@80000000` section describes 64MiB of RAM starting at address `0x80000000`.
+The []{replace=dtc/pmem} section describes flash drive 0: a memory region starting at address []{replace=dtc/pmem_start}, with compatible string `pmem-region`.
+This will eventually become available as `/dev/pmem0`.
+The `cmio` section specifies the starts and lengths of the CMIO memory ranges.
+The `yield` section specifies that the machine will process automatic and manual yields.
+Finally, section `chosen` includes the `bootargs` string that will be used as the kernel command-line parameters.
+Notice the specification of the root file-system as `root=/dev/pmem0` in the bootargs, and the `root` alias in `aliases` pointing to the `pmem` node.
+Also notice the command `dtc -I dtb -O dts /sys/firmware/fdt` coming directly from the `cartesi-machine` command line.
+
+Linux support for RISC-V is upstream in the [Linux kernel archives](https://www.kernel.org/).
+The kernel runs in supervisor mode, on top of a Supervisor Binary Interface (SBI) provided by a machine-mode shim: a [Cartesi fork](https://github.com/cartesi/opensbi) of [OpenSBI](https://github.com/riscv-software-src/opensbi), with Cartesi-specific extensions used by the kernel to talk to HTIF.
+Cartesi's RAM image `linux.bin` is an OpenSBI `fw_payload` bundle, with the kernel embedded as the payload, built from the [`machine-linux-image`](https://github.com/cartesi/machine-linux-image) repository.
+OpenSBI occupies the first 512KiB of RAM, declared as a no-map region in the devicetree so the kernel does not touch it.
+After self-initialization, OpenSBI switches to supervisor mode and cedes control to the kernel entry point.
+
+```{.lua key=dtb_bootargs_root_part replace=null}
+local cartesi = require "cartesi"
+io.write(cartesi.DTB_BOOTARGS_ROOT_PART)
+```
+
+```{.lua key=dtb_bootargs_init_part replace=null}
+local cartesi = require "cartesi"
+io.write(cartesi.DTB_BOOTARGS_INIT_PART)
+```
+
+```{.lua key=dtb_bootargs_console_part replace=null}
+local cartesi = require "cartesi"
+io.write(cartesi.DTB_BOOTARGS_CONSOLE_PART)
+```
+
+```{.lua key=dtb_bootargs_uio_part replace=null}
+local cartesi = require "cartesi"
+io.write(cartesi.DTB_BOOTARGS_UIO_PART)
+```
+
+After completing its own initialization, the kernel mounts the root file-system (by default []{replace=dtb_bootargs_root_part}) and cedes control to the program named by the&nbsp;`init=`&nbsp;parameter (by default []{replace=dtb_bootargs_init_part}).
+Cartesi's root file-system `rootfs.ext2` is built from the [`machine-guest-tools`](https://github.com/cartesi/machine-guest-tools) repository, which also installs `cartesi-init` and the rollups user-space tooling.
+See [Initialization](#initialization-1) under the Guest perspective for what `cartesi-init` does after the kernel hands off.
+
+# The blockchain perspective
+
+This section describes the Cartesi Machine from the perspective of the blockchain.
+Using the Cartesi platform, smart contracts gain a new ability.
+They can get their users to agree on the results of computations that cannot be performed natively as smart contracts: computations that either involve too much data, are too computationally demanding, or require a sophisticated software infrastructure that is simply not available for use on-chain.
+
+Users that have a stake in a given computation are represented off-chain by Cartesi Nodes under their control.
+Cartesi Nodes react to Cartesi-enabled smart contracts and instantiate Cartesi Machines to perform the required computations and post the result back to the blockchain.
+Since Cartesi Machines are self-contained and reproducible, the results of off-chain computations performed by honest users will agree.
+The smart contract can then make decisions of consequence that depend on these results.
+
+When the Cartesi Node representing an honest user identifies an incorrect result posted by a dishonest user, it disputes the result.
+The opposing Cartesi Nodes then engage in an automatic dispute resolution protocol presided over by the blockchain, which results in the dishonest user being proven wrong.
+The smart contract that commanded the computation can then punish the dishonest user and reward the honest one.
+
+The Cartesi Machine emulator is one of a kind.
+It doesn't simply emulate the RISC-V ISA to the extent that it can boot a performant operating system based on Linux.
+It does so in a way that allows smart contracts to specify computations, replace their inputs, inspect their outputs, and direct the dispute resolution protocol.
+
+## Hash-view of state
+
+One of the key goals of moving computations off-chain is to allow them to manipulate vast amounts of data: so much data that it becomes economically prohibitive to explicitly store them in the blockchain.
+Nevertheless, for smart contracts to delegate computations off-chain, they must be able to specify the computations, their inputs, and then reason over their outputs.
+The key to reconciling these seemingly contradictory goals is the clever use of cryptographic hashes.
+
+Cartesi Machines are transparent in the sense that their entire state is exposed for external inspection.
+This includes the RAM, all flash drives and NVRAMs, general purpose registers, control and status registers, and even the internal state of all devices.
+In fact, the entire machine state is mapped into the 64-bit physical memory address space of the Cartesi Machine.
+(The exact mapping is given in the [system architecture](#system-architecture) section of the guest perspective.)
+This means that, right before a machine is executed, a cryptographic hash of its entire state can be generated.
+A cryptographic hash of the state of a Cartesi Machine &ldquo;completely&rdquo; specifies the computation it is about to perform.
+This is because a given state always evolves in exactly the same way (because Cartesi Machines are self-contained and reproducible) and it is infeasible to find a different machine state that produces the same cryptographic state hash.
+By the same token, once the machine is done, the state hash &ldquo;completely&rdquo; specifies the result of the computation, wherever it may reside within the address space.
+
+:::info
+The same caveat applies to &ldquo;completely&rdquo; here as to &ldquo;only&rdquo; earlier (see [State hashes](#state-hashes)).
+There are vastly more possible machine states than 256-bit state hashes, so collisions must exist, but finding one is infeasible for a cryptographic hash function such as Keccak-256.
+:::
+
+The state hash of a Cartesi Machine is the root hash of a Merkle tree.
+Merkle trees are binary trees where a leaf node is labeled with the hash of a data block and an inner node is labeled with the hash of the concatenated labels of its two child nodes.
+In the case of Cartesi Machines, a block is simply one of the 2<sup>[]{replace=hash_tree_constants/log2_leaf_count code=no}</sup> aligned []{replace=hash_tree_constants/word_size code=no}-byte blocks in the machine's physical memory address space.
+The root hash can be obtained from the `machine:get_root_hash()` method.
+On the command line, the options `--initial-hash` and `--final-hash` of the `cartesi-machine` utility cause it to output the root hash of the Merkle tree as it is before the emulator starts running and after it is done running, respectively.
+
+The machine can be configured to use the `"keccak256"` hash function (for use with the uarch) or the `"sha256"` hash function (for use with ZK).
+In theory, the Merkle tree of the entire machine state could be built from these primitives and [external state access](#external-state-access) to the machine instance.
+In practice, most of the state is unused and implicitly filled with zeros, and this allows the Merkle tree computation to skip large swaths of the state by using precomputed hashes for subtrees that span zeroed out regions of all power-of-2 sizes.
+The computation is also smart enough to only update the parts of the tree that changed between invocations.
+
+<picture>
+  <source media="(prefers-color-scheme: dark)" srcset="images/state-tree-dark.svg">
+  <img alt="A machine's state hash-tree over its address space" src="images/state-tree-light.svg">
+</picture>
+
+The figure above shows the state Merkle tree of a machine, drawn over its 64-bit address space.
+Each memory range is a complete subtree, shown as a blue triangle rooted at one tree node.
+The address space between ranges is pristine, shown as pale triangles, and a single pristine gap may take more than one subtree to span.
+A tree node is blue when everything below it is a memory range, pale when all of it is pristine, and gray when it mixes the two.
+The state hash is the root, at the far left.
+
+Tree hashes are used instead of linear hashes because they support a variety of operations that are unavailable from linear hashes.
+
+### Slicing and splicing
+
+In the Merkle tree of a Cartesi Machine state, the labels of each of the 2<sup>D</sup> nodes at a depth *D* can be seen as the root hashes for Merkle *subtrees* corresponding to adjacent intervals of *2<sup>L</sup>* bytes in the address space, where *L=64-D*.
+Each of these nodes can be identified by an address *A* and the log *L* of the length of the interval it spans, where *A* is aligned to a *2<sup>L</sup>* boundary.
+
+Consider a scenario in which a smart contract knows *only* the state hash *M* for a certain Cartesi Machine.
+Using Merkle trees makes the following key operations possible:
+1. *Slicing* &mdash; A user with access to the Merkle tree of *M* can provide data the blockchain can use to prove that the word at a given address has a given value. More generally, the user can provide data the blockchain can use to prove that a node with a given address and length in the tree has a given label;
+1. *Splicing* &mdash; A user with access to the Merkle tree of *M* can provide data the blockchain can use to prove that writing a given word at a given address results in a Cartesi Machine with a given state hash *M'*.  More generally, the user can provide data the blockchain can use to prove that replacing a node of given length at a given address with another node of equal length and a given label results in a Cartesi Machine with a given state hash *M'*.
+
+To understand how the slicing proof works, notice that the path from the Merkle tree node at depth *D>0* (i.e., with log length *L=64-D*) and address *A* goes through *D* nodes: *n<sub>D</sub>*, *n<sub>D-1</sub>*, &hellip;, *n<sub>1</sub>* until it reaches the root *n<sub>0</sub>*.
+The labels associated to all these nodes can be produced as follows.
+If *n<sub>D</sub>* is a leaf node, its []{replace=hash_tree_constants/word_size}-byte contents must be provided and the label is the hash of those bytes.
+Otherwise, if it is a general node, its label must be provided.
+The label of *n<sub>D-1</sub>* can then be obtained by hashing together the label of node *n<sub>D</sub>* and the label of its sibling.
+The order between these two siblings is available from the *D*th most significant bit in address *A*.
+If it is clear, *n<sub>D</sub>*'s label comes first; otherwise, its sibling's label comes first.
+It should be obvious that, when labels for *all siblings* in the path from the target node to the root are provided, this process can be repeated until the label of *n<sub>0</sub>* itself is obtained.
+This must match the value *M* known to the smart contract.
+In fact, due to the properties of cryptographic hashes, it is infeasible for the label so obtained to match *M* *unless all the data provided is true*.
+
+The data needed for the proofs can be produced by the `machine:get_proof(<address>, <log2_target_size>[, <log2_root_size>])` method of a Cartesi Machine instance.
+The contents of the proof returned are described in the [Lua interface](#state-value-proofs-1).
+That section uses the same small `hash-tree` module, whose three helpers are shown alongside the prose below.
+
+The workhorse is `roll_hash_up_tree(<proof>, <new_target_hash>)`:
+```{.lua replace=proof_module/source/roll_hash_up_tree title="hash-tree.lua (excerpt)"}
+```
+In the first iteration of the loop, the function uses the bit with value 2<sup>`proof.log2_target_size`</sup> in `proof.target_address` to determine if the sibling of the target node comes before or after it in the address space of the Cartesi Machine.
+It then computes the hash of the concatenation of the target node's hash and its sibling's hash (in the correct order).
+To do so, it uses the `cartesi.keccak256(<hash1>, <hash2>)` function.
+The result must be the hash of the parent node to the target and its sibling.
+The loop then goes up the `proof.sibling_hashes` array, and obtains the sibling of this parent node.
+This is again concatenated with the just-calculated hash of the parent node (in the correct order) to obtain what must be the hash of the grandparent node.
+This process is repeated until the hash of what must be the root node is found and returned.
+Function `verify_slice(<proof>)` then compares this to `proof.root_hash`.
+If they match, the proof passes.
+Otherwise, something is amiss.
+
+The slicing check `verify_slice` wires this walk into the proof structure returned by `machine:get_proof()`:
+```{.lua replace=proof_module/source/verify_slice title="hash-tree.lua (excerpt)"}
+```
+To verify a slicing operation, the code first checks the root hash *M* against the one found in the proof.
+Then, it uses `roll_hash_up_tree` to recompute the root hash from the path between the target node and root.
+Any mismatch triggers an assertion.
+
+Verifying a splicing operation is just as easy.
+First, the code verifies that the slicing operation is valid.
+This ensures that the sibling hashes are correct.
+Then, it uses `roll_hash_up_tree` to compute the root hash from the path between the target node and root.
+Only this time it starts from the new target node hash.
+The resulting root hash is the hash of a tree with the old node replaced by the new.
+This is exactly what `verify_splice` does:
+```{.lua replace=proof_module/source/verify_splice title="hash-tree.lua (excerpt)"}
+```
+
+### Template instantiation
+
+The most important use for the splicing operation is template instantiation.
+From the blockchain perspective, a [Cartesi Machine template](#cartesi-machine-templates) is simply a state hash *M*.
+Instantiating the Cartesi Machine with a given input is simply the process of obtaining the state hash *M'* that results from replacing one or more of its input NVRAMs.
+Each replacement is the result of a splicing operation as described above.
+The splicing operation is particularly convenient if the input range length is a power of 2 and its start is aligned according to its length.
+This is why, by default, the Cartesi Machine positions flash drives and NVRAMs respecting these constraints.
+
+The following script performs the same operation in two distinct ways, an off-chain way and a blockchain way, and checks that the two agree.
+Off-chain, it instantiates the `calculator-template` concretely, modifies its input NVRAM with the contents of a mathematical expression, and then asks for the state hash *M'* of the modified machine.
+```{.lua key=splice_calculator_with_new_drive include=splice-calculator-with-new-drive.lua title="splice-calculator-with-new-drive.lua"}
+```
+
+On chain, instantiating the machine like this would be impossible.
+Nevertheless, the script can obtain the same state hash *M'* using proofs.
+For this, it needs only the pristine input proof and the root hash of the modified input NVRAM.
+The splicing operation bubbles that root hash up the tree to recover the state hash, which the script then compares against the one obtained off-chain.
+
+Since the input NVRAM starts completely filled with zeros, only the mathematical expression is needed to describe its modified contents.
+Its root hash is computed by `hash_tree.get_root_hash(<data>, <log2_root_size>)`, which lays `<data>` at the base of a 2<sup>`<log2_root_size>`</sup>-byte subtree and returns its root.
+```{.lua replace=proof_module/source/get_root_hash title="hash-tree.lua (excerpt)"}
+```
+The leaves are the []{replace=hash_tree_constants/word_size code=no}-byte words of `<data>`, each hashed with `cartesi.keccak256`, and a trailing partial word is zero-padded.
+Each inner node is the hash of its two children.
+Every node that `<data>` does not reach takes its level's pristine hash, the root of an all-zero subtree, obtained by hashing the previous level's pristine hash with itself.
+In this way, the function recovers the drive's root hash efficiently, without ever accessing its unmodified regions.
+
+Running the script with the command-line
+```{.bash key=lua_splice_calculator_with_new_drive vars=template->calc_template/calculator-template/path,proofs_pristine_run depends=splice_calculator_with_new_drive,proof_module replace=source}
+ln -sf "$template" .
+ln -sf "$proofs_pristine_run/pristine-input-proof.lua" .
+ln -sf "$RECIPES_DIR/splice-calculator-with-new-drive.lua" .
+# docs:begin
+lua5.4 splice-calculator-with-new-drive.lua "6*2^1024 + 3*2^512"
+# docs:end
+```
+produces the output
+```{replace=lua_splice_calculator_with_new_drive}
+```
+
+### Result extraction
+
+The most important use for the slicing operation is retrieving computation results.
+In a typical scenario, a user posts the final state hash of an instantiated Cartesi Machine that has been run until it halted.
+When the other users agree with this final state hash, slicing operations can be used to convince the blockchain of the contents of the halted Cartesi Machine's state.
+This can be the value of a single word in an output flash drive or NVRAM, or it can be the Merkle tree root for its entire contents.
+
+The following script performs the same operation in two distinct ways, an off-chain way and a blockchain way, and checks that the two agree.
+Off-chain, it instantiates the `calculator-template` concretely, writes a mathematical expression into its input NVRAM, runs the machine until it halts, reads the result string from its output NVRAM, and saves the state hash *M'* of the halted machine.
+```{.lua key=slice_calculator_output include=slice-calculator-output.lua title="slice-calculator-output.lua"}
+```
+
+On chain, the blockchain wants to verify the result of the computation.
+This is possible when all interested parties agree on the final state hash *M'* of the Cartesi Machine they ran off-chain.
+Assuming this to be the case, and in possession of the output proof and the result, the blockchain reconstructs the root hash of the output NVRAM from the result with `hash_tree.get_root_hash`, the same function the previous example used for the input drive.
+It then passes the output proof, this reconstructed hash, and the agreed hash *M'* to `verify_splice`, which confirms that an output NVRAM with exactly this content sits in the machine whose state hash is *M'*.
+In other words, once everyone agrees on *M'*, the result really is there.
+```{.bash key=lua_slice_calculator_output vars=template->calc_template/calculator-template/path,output_raw_proof depends=slice_calculator_output,proof_module replace=source}
+ln -sf "$template" .
+ln -sf "$output_raw_proof/output-proof.lua" .
+ln -sf "$RECIPES_DIR/slice-calculator-output.lua" .
+# docs:begin
+lua5.4 slice-calculator-output.lua "6*2^1024 + 3*2^512"
+# docs:end
+```
+produces the output
+```{replace=lua_slice_calculator_output}
+```
+
+### The output hashes tree
+
+The operations so far concern the word-leaf tree of the machine state.
+The same slicing idea applies to another Merkle tree the project uses, the *output hashes tree*, introduced under [Rolling Cartesi Machines and Cartesi Rollups](#rolling-cartesi-machines-and-cartesi-rollups).
+Its leaves are output hashes, each one `cartesi.keccak256` of a single output, rather than the bytes of a fixed address range.
+Its height is fixed at []{replace=hash_tree_constants/log2_max_output_count code=no}, so it can hold up to 2<sup>[]{replace=hash_tree_constants/log2_max_output_count code=no}</sup> outputs.
+A leaf for an output not yet produced is pristine, literally []{replace=hash_tree_constants/hash_size code=no} zero bytes, rather than the hash of a pristine word.
+A Rolling Cartesi Machine grows this one tree from genesis, across all of its epochs, one output at a time.
+
+Every operation the output hashes tree needs can be carried out from a compact summary of it, called a *frontier*, without ever materializing the whole tree.
+This matters at both ends of the system.
+Inside the Cartesi Machine, outputs accumulate across an unbounded number of epochs, so holding the complete tree would eventually exhaust the memory available to the guest.
+Outside, as we will see, even the output proofs can be generated holding only the frontier.
+The outputs themselves and their proofs are kept outside the machine, by the Cartesi Node.
+The machine state commits to them through the output hashes root hash alone.
+
+The frontier after *c* outputs captures the complete left subtrees standing over the leaves in the range [0, *c*), each by its root hash.
+Writing *c* in binary, such a subtree spans 2<sup>*l*</sup> leaves and is present exactly when bit *l* of *c* is set.
+These subtrees tile the leaves left to right, largest first, so the frontier holds one root hash per set bit of *c*, and *c* itself can be read back from which entries are present.
+The module stores it as a fixed-length array with one slot per level, holding that level's subtree root hash, or `false` where its bit is clear.
+
+The accessor `frontier_node` reads the hash of a node at one level from three regions that sit left to right in the tree (the frontier, an active region of nodes being worked on, and pristine padding):
+```{.lua replace=proof_module/source/frontier_node title="hash-tree.lua (excerpt)"}
+```
+A node index that falls to the left of the active region is supplied by the frontier, a complete left subtree's root hash.
+One that falls to the right is the root hash of an all-pristine subtree.
+One inside is taken straight from the active region.
+In the excerpt, `<index>` is the node's position within the level, `<base>` is where the active region begins and `<active>` holds its nodes, and `<frontier_entry>` and `<pristine_entry>` are that level's frontier and pristine subtree roots.
+Both maintaining the frontier and emitting proofs go through this accessor.
+
+![Output hashes tree partitioned into frontier, active region, and pristine padding](images/outputs-tree.svg)
+
+The figure shows the tree mid-stream, scaled down to height four while the real output hashes tree has height []{replace=hash_tree_constants/log2_max_output_count code=no}.
+Six earlier outputs sit to the left under the frontier, which holds them as two complete subtrees, one of four leaves and one of two, filled blue at their roots.
+The three new outputs of this epoch form the active region in the middle, filled green.
+The seven leaves to the right are pristine padding, held as a four-leaf, a two-leaf, and a single-leaf subtree, filled gray at their roots.
+Only the hashes actually held are filled, so every node below a frontier or pristine root is left empty, outlined in its subtree's color, because the frontier keeps each whole subtree as that one root hash and never materializes the leaves under it.
+
+The function `frontier_push_back` folds one new output leaf into the frontier:
+```{.lua replace=proof_module/source/frontier_push_back title="hash-tree.lua (excerpt)"}
+```
+Adding an output advances the leaf count from *c* to *c*+1.
+In binary that clears a run of low set bits and sets the next one up, an ordinary carry.
+The function mirrors the carry, combining the new leaf with the present low levels from the bottom up to the first empty one, clearing each, and storing the resulting hash at that first empty level.
+It is the root of the subtree covering exactly the leaves ending at the new output, the frontier entry the carry creates.
+A level is combined only once every 2<sup>*l*</sup> outputs, so a long run of outputs costs constant work each, amortized.
+
+The function `frontier_get_root_hash` returns the root hash of the tree, padded with zero leaves to completion:
+```{.lua replace=proof_module/source/frontier_get_root_hash title="hash-tree.lua (excerpt)"}
+```
+Every leaf the outputs have not reached is pristine.
+The function climbs level by level, combining each present frontier entry on the left with pristine padding on the right.
+The [Output proofs](#output-proofs) example uses these two together while processing an epoch, pushing each accepted output and then rooting the frontier to check it against the output hashes root hash the guest reported.
+
+The constructor is `frontier`, which produces the frontier an epoch begins from:
+```{.lua replace=proof_module/source/frontier title="hash-tree.lua (excerpt)"}
+```
+It distinguishes two cases with `is_proof`, which checks whether the argument is a proof table rather than a height.
+Given the tree height, it returns the empty frontier of a genesis epoch, the all-`false` frontier for the given height.
+Given the previous epoch's last output proof instead, it rebuilds the frontier as it stood after that output.
+The last output is the rightmost leaf in the range [0, *c*), so at every level where *c* has a set bit that leaf is a right child, and its proof sibling there is exactly the root hash the frontier stores for that level.
+The lowest such entry is recovered by rolling the leaf up through its siblings below.
+A single proof, the one already saved for an epoch's last output, is therefore all the next epoch needs to resume the same genesis-rooted tree.
+
+Finally, `frontier_next_proofs` produces an epoch's output proofs:
+```{.lua replace=proof_module/source/frontier_next_proofs title="hash-tree.lua (excerpt)"}
+```
+Given the starting frontier and the output hashes accepted during the epoch, in order, it returns one proof per new output, all against the single final root.
+The only thing a new output's proof needs from the earlier leaves in the range [0, *c*) is the frontier.
+A left sibling on a new leaf's path to the root always ends at an aligned boundary at or before *c*, so it is a complete subtree whose root hash the frontier already holds, never an individual old leaf.
+The function sweeps the new leaves up one level at a time, reading each proof sibling through `frontier_node`, which supplies a frontier entry or pristine padding at the boundaries.
+The proofs are built together, in one batch at the end of the epoch, because an early output's low siblings are later outputs of the same epoch.
+Note that proofs issued for outputs in previous epochs were produced and stored by the Cartesi Node as soon as those epochs were finalized.
+They are checked against the state hash (and output hashes root hash) finalized then, not against what gets finalized in later epochs.
+
+Generating these proofs is shown in the Lua [Output proofs](#output-proofs) section.
+Checking an output against them, from a settled machine state hash alone, is shown under [Output verification](#output-verification) below.
+
+### Output verification
+
+The slicing and splicing operations above extract a result from a halted machine, whose entire output occupies a single NVRAM.
+A Rolling Cartesi Machine instead emits outputs one at a time and keeps running.
+The analogous operation is to verify the contents of a given output it produced.
+This is possible between epochs, once the state hash of the machine is agreed upon.
+From that state hash, a slicing operation recovers the output hashes root hash from the machine's CMIO tx buffer.
+As described under [Output proofs](#output-proofs), this is the root of a Merkle tree.
+Its leaves are the hashes of all outputs ever produced, in order.
+A second slicing operation, in that tree, then proves the output's hash is one of its leaves.
+
+When the [Rolling Cartesi Machine calculator](#rolling-cartesi-machines) processed its first epoch, it saved more than the outputs themselves.
+For each accepted input, it saved a proof that the output hashes root hash occupied the CMIO tx buffer.
+For each output, it saved an output proof.
+Through `--final-hash`, it also saved the machine state hash the epoch settled on.
+The output proofs are built against the epoch's final output hashes root hash.
+They therefore pair with the output hashes root hash proof from the last accepted input, input 3.
+The following script verifies output 0 from the settled state hash and those artifacts alone, without instantiating any machine.
+```{.lua key=verify_output_proof include=verify-output-proof.lua title="verify-output-proof.lua"}
+```
+The script first confirms the output proof's root equals the value the output hashes root hash proof locates in the tx-buffer word.
+That joins the two trees.
+It then hashes the output's bytes and matches the resulting hash against the leaf the output proof locates, pinning down this exact output.
+
+Running the script over the artifacts the Rolling Cartesi Machine calculator saved
+```{.bash key=lua_verify_output_proof vars=rolling_calc_run depends=verify_output_proof replace=source}
+ln -sf $rolling_calc_run/epoch-1-state-hash.bin .
+ln -sf $rolling_calc_run/input-3-output-hashes-root-hash-proof.lua .
+ln -sf $rolling_calc_run/output-0-input-1-proof.lua .
+ln -sf $rolling_calc_run/output-0-input-1.bin .
+ln -sf "$RECIPES_DIR/verify-output-proof.lua" .
+# docs:begin
+lua5.4 verify-output-proof.lua \
+    epoch-1-state-hash.bin \
+    input-3-output-hashes-root-hash-proof.lua \
+    output-0-input-1-proof.lua \
+    output-0-input-1.bin
+# docs:end
+```
+produces the output
+```{replace=lua_verify_output_proof}
+```
+
+
+## Verification game
+
+The question now becomes how the blockchain can identify the honest party when there are two opinions on the final state hash of a Cartesi Machine, for a computation the blockchain itself is unable to perform.
+This is the role of the verification game, an [established technique](https://doi.org/10.1016/j.ic.2013.03.003) on which our original [whitepaper](https://cartesi.io/cartesi_whitepaper.pdf) builds.
+It rests on one assumption, that at least one of the two parties is honest.
+
+The `verification-game.lua` recipe is a self-contained model of it.
+A referee, standing in for the Cartesi contracts deployed on the blockchain, mediates a dispute between two players, each standing in for a Cartesi Node that ran the computation off-chain.
+The three are separate processes that communicate over the network, which here stands in for blockchain transactions.
+The referee never trusts a player.
+The two players run identical code and differ only in the machine they hold.
+One is honest; the other cheats past a chosen point by switching to a machine that ran a different expression.
+
+The game opens with each player committing the final state hash of its machine, obtained by running it until it halts.
+If the two hashes agree there is no dispute and the result can be extracted directly.
+When they disagree the referee settles the dispute before accepting the result.
+```{.lua key=vg_run_referee include=verification-game.lua/run_referee title="verification-game.lua (excerpt)"}
+```
+
+### Settling a dispute
+
+The dispute is settled in two bisections.
+The first ranges over `mcycle` and isolates the disputed main processor instruction; the second ranges over `uarch_cycle` and isolates the single uarch step within it.
+```{.lua key=vg_adjudicate include=verification-game.lua/adjudicate_dispute title="verification-game.lua (excerpt)"}
+```
+
+### One bisection level
+
+Each bisection narrows the disagreement to the single transition responsible for it, repeatedly asking both players for the state hash at the midpoint of an interval of cycles and keeping the half where they still disagree.
+```{.lua key=vg_bisect_level include=verification-game.lua/bisect_level title="verification-game.lua (excerpt)"}
+```
+The main processor has a fixed-point property once the machine halts.
+Running it for more `mcycle`s leaves the state, and therefore the hash, unchanged.
+Likewise, the uarch has a fixed-point property once it halts.
+Running it for more `uarch_cycle`s leaves the state unchanged, until a reset begins the next main processor instruction.
+This is what lets each bisection range over the full cycle ceiling without knowing in advance where either machine halts.
+A midpoint past a halt simply repeats the final hash, and the disagreement is still found at the cycle where the two computations diverge.
+
+### Verifying the state transition
+
+Once a single `uarch_cycle` is in dispute, the referee asks the player on the disagreeing side for the access log of the transition out of it, and verifies that log without ever instantiating a machine.
+This stands for a Cartesi contract that can verify such logs directly on the blockchain.
+The transition is either an ordinary uarch step or the terminal reset that begins the next main processor instruction.
+Which one it is depends only on the agreed cycle, since the only transition out of `cartesi.UARCH_CYCLE_MAX - 1` is the reset, so the referee checks the log with `verify_reset_uarch` at that boundary and `verify_step_uarch` everywhere else.
+If the log proves that the agreed before-hash advances to the player's committed after-hash, that player was honest; otherwise, the other one is assumed to be.
+```{.lua key=vg_verify_transition include=verification-game.lua/verify_state_transition title="verification-game.lua (excerpt)"}
+```
+
+### Verifying the result
+
+Naming the winner settles which final state hash is the true one.
+The referee asks both players for a result and accepts the first that verifies against that hash.
+```{.lua key=vg_wait_for_result include=verification-game.lua/wait_for_result title="verification-game.lua (excerpt)"}
+```
+A posted result verifies, by the same slicing operation shown earlier, only if its bytes hash to the proof's target, the target sits at the output drive's address, and the proof rolls up to the winner's final hash.
+```{.lua key=vg_verify_output include=verification-game.lua/verify_output title="verification-game.lua (excerpt)"}
+```
+A result that does not verify, whether it comes from the dishonest player or anyone else, is rejected.
+This keeps the result phase decoupled from the dispute: the parties who settle it are not the parties who later rely on the finalized hash to prove the result.
+
+### Running the game
+
+To run the whole game, start the referee, the server the players connect to:
+```{.bash key=vg_run vars=template->calc_template/calculator-template/path depends=vg_verify_output outputs=referee replace=source/server}
+ln -sf "$template" .
+ln -sf "$RECIPES_DIR/verification-game.lua" .
+ln -sf "$RECIPES_DIR/dishonest.lua" .
+{
+# docs:begin server
+lua5.4 verification-game.lua referee 127.0.0.1:8087 "6*2^1024 + 3*2^512"
+# docs:end server
+} > /dev/null 2>&1 &
+while ! netstat -ntl 2>&1 | grep '[.:]8087[[:space:]]' > /dev/null; do sleep 1; done
+{
+# docs:begin honest
+lua5.4 verification-game.lua honest 127.0.0.1:8087 "6*2^1024 + 3*2^512"
+# docs:end honest
+} > /dev/null 2>&1 &
+# make sure honest is player 1 and dishonest player 2 (match the port column, not any "8087" substring)
+while ! netstat -nt 2>&1 | grep '[.:]8087[[:space:]]' > /dev/null; do sleep 1; done
+{
+# docs:begin dishonest
+lua5.4 verification-game.lua dishonest 127.0.0.1:8087 "6*2^1024 + 3*2^512" 25 7 "2+2"
+# docs:end dishonest
+} > /dev/null 2>&1 &
+wait
+# The referee leaves one file per narration phase. Show the short phases whole and reduce each
+# long bisection to its first and last three rounds.
+{
+cat commitments
+head -n 3 bisect_mcycle
+echo ...
+tail -n 3 bisect_mcycle
+head -n 3 bisect_uarch_cycle
+echo ...
+tail -n 3 bisect_uarch_cycle
+cat verdict
+cat output
+} > referee
+```
+then the honest player, which evaluates the public expression:
+```{.bash replace=vg_run/source/honest}
+```
+and the dishonest player, which cheats at an early cycle by switching to a different expression:
+```{.bash replace=vg_run/source/dishonest}
+```
+The referee narrates the dispute from start to finish:
+```{replace=vg_run/referee}
+```
+The bisection converges on the cheat point, the disputed step verifies in the honest player's favor, and the cheater's result is rejected before the true one is accepted.
+
+```{.lua key=vg_uarch_cycle_max replace=null}
+local cartesi = require("cartesi")
+print(cartesi.UARCH_CYCLE_MAX) -- stdout is read by the vg_run_reset recipe as $uarch_cycle_max
+```
+That dispute resolved on an ordinary uarch step, since the cheat point fell early in the disputed instruction's uarch cycles.
+Cheating instead at the last uarch cycle, `cartesi.UARCH_CYCLE_MAX - 1`, moves the disagreement onto the terminal reset that begins the next instruction, the case the referee checks with `verify_reset_uarch`:
+```{.bash key=vg_run_reset vars=template->calc_template/calculator-template/path,uarch_cycle_max->vg_uarch_cycle_max/stdout depends=vg_run outputs=referee replace=source/dishonest}
+ln -sf "$template" .
+ln -sf "$RECIPES_DIR/verification-game.lua" .
+ln -sf "$RECIPES_DIR/dishonest.lua" .
+{
+lua5.4 verification-game.lua referee 127.0.0.1:8088 "6*2^1024 + 3*2^512"
+} > /dev/null 2>&1 &
+while ! netstat -ntl 2>&1 | grep '[.:]8088[[:space:]]' > /dev/null; do sleep 1; done
+{
+lua5.4 verification-game.lua honest 127.0.0.1:8088 "6*2^1024 + 3*2^512"
+} > /dev/null 2>&1 &
+last_uarch_cycle=$(( $uarch_cycle_max - 1 ))
+# make sure honest is player 1 and dishonest player 2 (match the port column, not any "8088" substring)
+while ! netstat -nt 2>&1 | grep '[.:]8088[[:space:]]' > /dev/null; do sleep 1; done
+{
+# docs:begin dishonest
+lua5.4 verification-game.lua dishonest 127.0.0.1:8088 "6*2^1024 + 3*2^512" 25 "$last_uarch_cycle" "2+2"
+# docs:end dishonest
+} > /dev/null 2>&1 &
+wait
+# Show only what differs from the step run: the uarch bisection climbing to the reset
+# boundary, then the verdict.
+{
+head -n 3 bisect_uarch_cycle
+echo ...
+tail -n 3 bisect_uarch_cycle
+cat verdict
+} > referee
+```
+This time the uarch bisection climbs to the reset boundary and the honest player's reset log verifies just the same:
+```{replace=vg_run_reset/referee}
+```
+
+For simplicity this model uses only two players, but the same idea is the basis for efficient algorithms that resolve disputes among many players.
+Our implementation has since moved on to use our [Permissionless Refereed Tournaments](https://arxiv.org/abs/2212.12439).
+For an even better algorithm, see our [Dave: A Decentralized, Secure, and Lively Fraud-Proof Algorithm](https://doi.org/10.1145/3734698).
+
+[modeline]: # ( vim: set filetype=markdown spell spelllang=en: )
+
diff --git a/doc/alerts.lua b/doc/alerts.lua
new file mode 100644
index 000000000..a54a0686f
--- /dev/null
+++ b/doc/alerts.lua
@@ -0,0 +1,46 @@
+-- Pandoc Lua filter: convert docusaurus-style admonition fenced divs to
+-- GitHub alert blockquotes (> [!TYPE] ...) for gfm and other non-html output,
+-- or to github-markdown-css-compatible divs for html output.
+--
+-- Docusaurus classes and their GitHub alert equivalents:
+local MAP = {
+    note = "NOTE",
+    info = "NOTE", -- shares NOTE with note
+    tip = "TIP",
+    warning = "WARNING",
+    caution = "CAUTION",
+    danger = "WARNING", -- shares WARNING with warning
+}
+
+-- Turns a Div carrying a class listed in MAP into an alert; returns nil for
+-- any other Div, which leaves that element as it is.
+function Div(el)
+    local alert
+    for _, class in ipairs(el.classes) do
+        alert = alert or MAP[class] -- the first mapped class wins
+    end
+    if not alert then
+        return nil
+    end
+
+    -- Each alert opens with a head block whose form depends on the output format.
+    local as_html = FORMAT:match("^html") ~= nil
+    local head
+    if as_html then
+        local label = alert:sub(1, 1) .. alert:sub(2):lower()
+        head = pandoc.RawBlock("html", '<p class="markdown-alert-title">' .. label .. "</p>")
+    else
+        -- A raw "markdown" inline goes through the gfm writer unescaped, so the
+        -- brackets of the [!TYPE] marker reach GitHub intact.
+        head = pandoc.Para({ pandoc.RawInline("markdown", "[!" .. alert .. "]") })
+    end
+    -- The Div's own blocks follow the head in their original order.
+    local blocks = { head }
+    for _, block in ipairs(el.content) do
+        table.insert(blocks, block)
+    end
+    if as_html then
+        return pandoc.Div(blocks, pandoc.Attr("", { "markdown-alert", "markdown-alert-" .. alert:lower() }))
+    end
+    return pandoc.BlockQuote(blocks)
+end
diff --git a/doc/Doxyfile b/doc/doxygen/Doxyfile
similarity index 100%
rename from doc/Doxyfile
rename to doc/doxygen/Doxyfile
diff --git a/doc/github.template.html b/doc/github.template.html
new file mode 100644
index 000000000..2f90347f3
--- /dev/null
+++ b/doc/github.template.html
@@ -0,0 +1,22 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>$title$</title>
+<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/github-markdown-css/5.8.1/github-markdown.min.css">
+<style>
+  body { box-sizing: border-box; min-width: 200px; max-width: 980px; margin: 0 auto; padding: 45px; }
+  @media (max-width: 767px) { body { padding: 15px; } }
+</style>
+</head>
+<body class="markdown-body">
+$include-before$
+$if(toc)$
+<nav id="TOC" role="doc-toc">
+$toc$
+</nav>
+$endif$
+$body$
+</body>
+</html>
diff --git a/doc/github.template.md b/doc/github.template.md
new file mode 100644
index 000000000..17a233f2e
--- /dev/null
+++ b/doc/github.template.md
@@ -0,0 +1,13 @@
+$for(include-before)$
+$include-before$
+
+$endfor$
+$if(toc)$
+$table-of-contents$
+
+$endif$
+$body$
+$for(include-after)$
+
+$include-after$
+$endfor$
diff --git a/doc/images/outputs-tree.dot b/doc/images/outputs-tree.dot
new file mode 100644
index 000000000..1fe741d05
--- /dev/null
+++ b/doc/images/outputs-tree.dot
@@ -0,0 +1,60 @@
+// Height-4 outputs tree (16 leaves), a stand-in for the real, much taller tree.
+// Node positions are pinned for a perfectly symmetric binary tree (dot's own layout
+// leaves it skewed); render with "neato -n", which uses the positions and runs no
+// layout. leaf_count=6 entering: the frontier (blue) holds a complete 4-leaf subtree and a
+// complete 2-leaf subtree. Three new outputs form the active region (green). The last seven
+// leaves are pristine padding (gray): left to right, a 1-leaf, a 2-leaf, and a 4-leaf subtree.
+// Only the hashes actually held are filled (five subtree roots, active region); the rest are empty.
+digraph outputs_tree {
+  graph [bgcolor=transparent];
+  node [shape=circle, fixedsize=true, width=0.34, label="", style=filled, color="#555555", penwidth=2];
+  edge [arrowhead=none, color="#555555"];
+
+  N1 [fillcolor="#8fd16f", color="#8fd16f", pos="345.0,256!"];
+  N2 [fillcolor="#8fd16f", color="#8fd16f", pos="161.0,192!"];
+  N3 [fillcolor="#8fd16f", color="#8fd16f", pos="529.0,192!"];
+  N4 [fillcolor="#5b9bf0", color="#5b9bf0", pos="69.0,128!"];
+  N5 [fillcolor="#8fd16f", color="#8fd16f", pos="253.0,128!"];
+  N6 [fillcolor="#8fd16f", color="#8fd16f", pos="437.0,128!"];
+  N7 [fillcolor="#888888", color="#888888", pos="621.0,128!"];
+  N8 [fillcolor="none", color="#5b9bf0", pos="23.0,64!"];
+  N9 [fillcolor="none", color="#5b9bf0", pos="115.0,64!"];
+  N10 [fillcolor="#5b9bf0", color="#5b9bf0", pos="207.0,64!"];
+  N11 [fillcolor="#8fd16f", color="#8fd16f", pos="299.0,64!"];
+  N12 [fillcolor="#8fd16f", color="#8fd16f", pos="391.0,64!"];
+  N13 [fillcolor="#888888", color="#888888", pos="483.0,64!"];
+  N14 [fillcolor="none", color="#888888", pos="575.0,64!"];
+  N15 [fillcolor="none", color="#888888", pos="667.0,64!"];
+  N16 [fillcolor="none", color="#5b9bf0", pos="0.0,0!"];
+  N17 [fillcolor="none", color="#5b9bf0", pos="46.0,0!"];
+  N18 [fillcolor="none", color="#5b9bf0", pos="92.0,0!"];
+  N19 [fillcolor="none", color="#5b9bf0", pos="138.0,0!"];
+  N20 [fillcolor="none", color="#5b9bf0", pos="184.0,0!"];
+  N21 [fillcolor="none", color="#5b9bf0", pos="230.0,0!"];
+  N22 [fillcolor="#8fd16f", color="#8fd16f", pos="276.0,0!"];
+  N23 [fillcolor="#8fd16f", color="#8fd16f", pos="322.0,0!"];
+  N24 [fillcolor="#8fd16f", color="#8fd16f", pos="368.0,0!"];
+  N25 [fillcolor="#888888", color="#888888", pos="414.0,0!"];
+  N26 [fillcolor="none", color="#888888", pos="460.0,0!"];
+  N27 [fillcolor="none", color="#888888", pos="506.0,0!"];
+  N28 [fillcolor="none", color="#888888", pos="552.0,0!"];
+  N29 [fillcolor="none", color="#888888", pos="598.0,0!"];
+  N30 [fillcolor="none", color="#888888", pos="644.0,0!"];
+  N31 [fillcolor="none", color="#888888", pos="690.0,0!"];
+
+  N1 -> N2; N1 -> N3;
+  N2 -> N4; N2 -> N5;
+  N3 -> N6; N3 -> N7;
+  N4 -> N8; N4 -> N9;
+  N5 -> N10; N5 -> N11;
+  N6 -> N12; N6 -> N13;
+  N7 -> N14; N7 -> N15;
+  N8 -> N16; N8 -> N17;
+  N9 -> N18; N9 -> N19;
+  N10 -> N20; N10 -> N21;
+  N11 -> N22; N11 -> N23;
+  N12 -> N24; N12 -> N25;
+  N13 -> N26; N13 -> N27;
+  N14 -> N28; N14 -> N29;
+  N15 -> N30; N15 -> N31;
+}
diff --git a/doc/images/outputs-tree.svg b/doc/images/outputs-tree.svg
new file mode 100644
index 000000000..3e9747e17
--- /dev/null
+++ b/doc/images/outputs-tree.svg
@@ -0,0 +1,317 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<!DOCTYPE svg PUBLIC "-//W3C//DTD SVG 1.1//EN"
+ "http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd">
+<!-- Generated by graphviz version 12.2.1 (20241206.2353)
+ -->
+<!-- Title: outputs_tree Pages: 1 -->
+<svg width="722pt" height="288pt"
+ viewBox="0.00 0.00 722.48 288.48" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink">
+<g id="graph0" class="graph" transform="scale(1 1) rotate(0) translate(4 284.48)">
+<title>outputs_tree</title>
+<!-- N1 -->
+<g id="node1" class="node">
+<title>N1</title>
+<ellipse fill="#8fd16f" stroke="#8fd16f" stroke-width="2" cx="357.24" cy="-268.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N2 -->
+<g id="node2" class="node">
+<title>N2</title>
+<ellipse fill="#8fd16f" stroke="#8fd16f" stroke-width="2" cx="173.24" cy="-204.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N1&#45;&gt;N2 -->
+<g id="edge1" class="edge">
+<title>N1&#45;&gt;N2</title>
+<path fill="none" stroke="#555555" d="M344.88,-263.94C311.36,-252.28 219,-220.16 185.54,-208.52"/>
+</g>
+<!-- N3 -->
+<g id="node3" class="node">
+<title>N3</title>
+<ellipse fill="#8fd16f" stroke="#8fd16f" stroke-width="2" cx="541.24" cy="-204.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N1&#45;&gt;N3 -->
+<g id="edge2" class="edge">
+<title>N1&#45;&gt;N3</title>
+<path fill="none" stroke="#555555" d="M369.6,-263.94C403.12,-252.28 495.48,-220.16 528.94,-208.52"/>
+</g>
+<!-- N4 -->
+<g id="node4" class="node">
+<title>N4</title>
+<ellipse fill="#5b9bf0" stroke="#5b9bf0" stroke-width="2" cx="81.24" cy="-140.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N2&#45;&gt;N4 -->
+<g id="edge3" class="edge">
+<title>N2&#45;&gt;N4</title>
+<path fill="none" stroke="#555555" d="M162.69,-196.9C145.03,-184.62 109.71,-160.05 91.95,-147.69"/>
+</g>
+<!-- N5 -->
+<g id="node5" class="node">
+<title>N5</title>
+<ellipse fill="#8fd16f" stroke="#8fd16f" stroke-width="2" cx="265.24" cy="-140.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N2&#45;&gt;N5 -->
+<g id="edge4" class="edge">
+<title>N2&#45;&gt;N5</title>
+<path fill="none" stroke="#555555" d="M183.79,-196.9C201.45,-184.62 236.77,-160.05 254.53,-147.69"/>
+</g>
+<!-- N6 -->
+<g id="node6" class="node">
+<title>N6</title>
+<ellipse fill="#8fd16f" stroke="#8fd16f" stroke-width="2" cx="449.24" cy="-140.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N3&#45;&gt;N6 -->
+<g id="edge5" class="edge">
+<title>N3&#45;&gt;N6</title>
+<path fill="none" stroke="#555555" d="M530.69,-196.9C513.03,-184.62 477.71,-160.05 459.95,-147.69"/>
+</g>
+<!-- N7 -->
+<g id="node7" class="node">
+<title>N7</title>
+<ellipse fill="#888888" stroke="#888888" stroke-width="2" cx="633.24" cy="-140.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N3&#45;&gt;N7 -->
+<g id="edge6" class="edge">
+<title>N3&#45;&gt;N7</title>
+<path fill="none" stroke="#555555" d="M551.79,-196.9C569.45,-184.62 604.77,-160.05 622.53,-147.69"/>
+</g>
+<!-- N8 -->
+<g id="node8" class="node">
+<title>N8</title>
+<ellipse fill="none" stroke="#5b9bf0" stroke-width="2" cx="35.24" cy="-76.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N4&#45;&gt;N8 -->
+<g id="edge7" class="edge">
+<title>N4&#45;&gt;N8</title>
+<path fill="none" stroke="#555555" d="M73.64,-129.67C65.07,-117.74 51.21,-98.46 42.69,-86.61"/>
+</g>
+<!-- N9 -->
+<g id="node9" class="node">
+<title>N9</title>
+<ellipse fill="none" stroke="#5b9bf0" stroke-width="2" cx="127.24" cy="-76.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N4&#45;&gt;N9 -->
+<g id="edge8" class="edge">
+<title>N4&#45;&gt;N9</title>
+<path fill="none" stroke="#555555" d="M88.84,-129.67C97.41,-117.74 111.27,-98.46 119.79,-86.61"/>
+</g>
+<!-- N10 -->
+<g id="node10" class="node">
+<title>N10</title>
+<ellipse fill="#5b9bf0" stroke="#5b9bf0" stroke-width="2" cx="219.24" cy="-76.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N5&#45;&gt;N10 -->
+<g id="edge9" class="edge">
+<title>N5&#45;&gt;N10</title>
+<path fill="none" stroke="#555555" d="M257.64,-129.67C249.07,-117.74 235.21,-98.46 226.69,-86.61"/>
+</g>
+<!-- N11 -->
+<g id="node11" class="node">
+<title>N11</title>
+<ellipse fill="#8fd16f" stroke="#8fd16f" stroke-width="2" cx="311.24" cy="-76.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N5&#45;&gt;N11 -->
+<g id="edge10" class="edge">
+<title>N5&#45;&gt;N11</title>
+<path fill="none" stroke="#555555" d="M272.84,-129.67C281.41,-117.74 295.27,-98.46 303.79,-86.61"/>
+</g>
+<!-- N12 -->
+<g id="node12" class="node">
+<title>N12</title>
+<ellipse fill="#8fd16f" stroke="#8fd16f" stroke-width="2" cx="403.24" cy="-76.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N6&#45;&gt;N12 -->
+<g id="edge11" class="edge">
+<title>N6&#45;&gt;N12</title>
+<path fill="none" stroke="#555555" d="M441.64,-129.67C433.07,-117.74 419.21,-98.46 410.69,-86.61"/>
+</g>
+<!-- N13 -->
+<g id="node13" class="node">
+<title>N13</title>
+<ellipse fill="#888888" stroke="#888888" stroke-width="2" cx="495.24" cy="-76.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N6&#45;&gt;N13 -->
+<g id="edge12" class="edge">
+<title>N6&#45;&gt;N13</title>
+<path fill="none" stroke="#555555" d="M456.84,-129.67C465.41,-117.74 479.27,-98.46 487.79,-86.61"/>
+</g>
+<!-- N14 -->
+<g id="node14" class="node">
+<title>N14</title>
+<ellipse fill="none" stroke="#888888" stroke-width="2" cx="587.24" cy="-76.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N7&#45;&gt;N14 -->
+<g id="edge13" class="edge">
+<title>N7&#45;&gt;N14</title>
+<path fill="none" stroke="#555555" d="M625.64,-129.67C617.07,-117.74 603.21,-98.46 594.69,-86.61"/>
+</g>
+<!-- N15 -->
+<g id="node15" class="node">
+<title>N15</title>
+<ellipse fill="none" stroke="#888888" stroke-width="2" cx="679.24" cy="-76.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N7&#45;&gt;N15 -->
+<g id="edge14" class="edge">
+<title>N7&#45;&gt;N15</title>
+<path fill="none" stroke="#555555" d="M640.84,-129.67C649.41,-117.74 663.27,-98.46 671.79,-86.61"/>
+</g>
+<!-- N16 -->
+<g id="node16" class="node">
+<title>N16</title>
+<ellipse fill="none" stroke="#5b9bf0" stroke-width="2" cx="12.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N8&#45;&gt;N16 -->
+<g id="edge15" class="edge">
+<title>N8&#45;&gt;N16</title>
+<path fill="none" stroke="#555555" d="M30.81,-63.9C26.73,-52.57 20.73,-35.86 16.66,-24.54"/>
+</g>
+<!-- N17 -->
+<g id="node17" class="node">
+<title>N17</title>
+<ellipse fill="none" stroke="#5b9bf0" stroke-width="2" cx="58.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N8&#45;&gt;N17 -->
+<g id="edge16" class="edge">
+<title>N8&#45;&gt;N17</title>
+<path fill="none" stroke="#555555" d="M39.67,-63.9C43.75,-52.57 49.75,-35.86 53.82,-24.54"/>
+</g>
+<!-- N18 -->
+<g id="node18" class="node">
+<title>N18</title>
+<ellipse fill="none" stroke="#5b9bf0" stroke-width="2" cx="104.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N9&#45;&gt;N18 -->
+<g id="edge17" class="edge">
+<title>N9&#45;&gt;N18</title>
+<path fill="none" stroke="#555555" d="M122.81,-63.9C118.73,-52.57 112.73,-35.86 108.66,-24.54"/>
+</g>
+<!-- N19 -->
+<g id="node19" class="node">
+<title>N19</title>
+<ellipse fill="none" stroke="#5b9bf0" stroke-width="2" cx="150.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N9&#45;&gt;N19 -->
+<g id="edge18" class="edge">
+<title>N9&#45;&gt;N19</title>
+<path fill="none" stroke="#555555" d="M131.67,-63.9C135.75,-52.57 141.75,-35.86 145.82,-24.54"/>
+</g>
+<!-- N20 -->
+<g id="node20" class="node">
+<title>N20</title>
+<ellipse fill="none" stroke="#5b9bf0" stroke-width="2" cx="196.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N10&#45;&gt;N20 -->
+<g id="edge19" class="edge">
+<title>N10&#45;&gt;N20</title>
+<path fill="none" stroke="#555555" d="M214.81,-63.9C210.73,-52.57 204.73,-35.86 200.66,-24.54"/>
+</g>
+<!-- N21 -->
+<g id="node21" class="node">
+<title>N21</title>
+<ellipse fill="none" stroke="#5b9bf0" stroke-width="2" cx="242.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N10&#45;&gt;N21 -->
+<g id="edge20" class="edge">
+<title>N10&#45;&gt;N21</title>
+<path fill="none" stroke="#555555" d="M223.67,-63.9C227.75,-52.57 233.75,-35.86 237.82,-24.54"/>
+</g>
+<!-- N22 -->
+<g id="node22" class="node">
+<title>N22</title>
+<ellipse fill="#8fd16f" stroke="#8fd16f" stroke-width="2" cx="288.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N11&#45;&gt;N22 -->
+<g id="edge21" class="edge">
+<title>N11&#45;&gt;N22</title>
+<path fill="none" stroke="#555555" d="M306.81,-63.9C302.73,-52.57 296.73,-35.86 292.66,-24.54"/>
+</g>
+<!-- N23 -->
+<g id="node23" class="node">
+<title>N23</title>
+<ellipse fill="#8fd16f" stroke="#8fd16f" stroke-width="2" cx="334.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N11&#45;&gt;N23 -->
+<g id="edge22" class="edge">
+<title>N11&#45;&gt;N23</title>
+<path fill="none" stroke="#555555" d="M315.67,-63.9C319.75,-52.57 325.75,-35.86 329.82,-24.54"/>
+</g>
+<!-- N24 -->
+<g id="node24" class="node">
+<title>N24</title>
+<ellipse fill="#8fd16f" stroke="#8fd16f" stroke-width="2" cx="380.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N12&#45;&gt;N24 -->
+<g id="edge23" class="edge">
+<title>N12&#45;&gt;N24</title>
+<path fill="none" stroke="#555555" d="M398.81,-63.9C394.73,-52.57 388.73,-35.86 384.66,-24.54"/>
+</g>
+<!-- N25 -->
+<g id="node25" class="node">
+<title>N25</title>
+<ellipse fill="#888888" stroke="#888888" stroke-width="2" cx="426.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N12&#45;&gt;N25 -->
+<g id="edge24" class="edge">
+<title>N12&#45;&gt;N25</title>
+<path fill="none" stroke="#555555" d="M407.67,-63.9C411.75,-52.57 417.75,-35.86 421.82,-24.54"/>
+</g>
+<!-- N26 -->
+<g id="node26" class="node">
+<title>N26</title>
+<ellipse fill="none" stroke="#888888" stroke-width="2" cx="472.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N13&#45;&gt;N26 -->
+<g id="edge25" class="edge">
+<title>N13&#45;&gt;N26</title>
+<path fill="none" stroke="#555555" d="M490.81,-63.9C486.73,-52.57 480.73,-35.86 476.66,-24.54"/>
+</g>
+<!-- N27 -->
+<g id="node27" class="node">
+<title>N27</title>
+<ellipse fill="none" stroke="#888888" stroke-width="2" cx="518.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N13&#45;&gt;N27 -->
+<g id="edge26" class="edge">
+<title>N13&#45;&gt;N27</title>
+<path fill="none" stroke="#555555" d="M499.67,-63.9C503.75,-52.57 509.75,-35.86 513.82,-24.54"/>
+</g>
+<!-- N28 -->
+<g id="node28" class="node">
+<title>N28</title>
+<ellipse fill="none" stroke="#888888" stroke-width="2" cx="564.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N14&#45;&gt;N28 -->
+<g id="edge27" class="edge">
+<title>N14&#45;&gt;N28</title>
+<path fill="none" stroke="#555555" d="M582.81,-63.9C578.73,-52.57 572.73,-35.86 568.66,-24.54"/>
+</g>
+<!-- N29 -->
+<g id="node29" class="node">
+<title>N29</title>
+<ellipse fill="none" stroke="#888888" stroke-width="2" cx="610.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N14&#45;&gt;N29 -->
+<g id="edge28" class="edge">
+<title>N14&#45;&gt;N29</title>
+<path fill="none" stroke="#555555" d="M591.67,-63.9C595.75,-52.57 601.75,-35.86 605.82,-24.54"/>
+</g>
+<!-- N30 -->
+<g id="node30" class="node">
+<title>N30</title>
+<ellipse fill="none" stroke="#888888" stroke-width="2" cx="656.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N15&#45;&gt;N30 -->
+<g id="edge29" class="edge">
+<title>N15&#45;&gt;N30</title>
+<path fill="none" stroke="#555555" d="M674.81,-63.9C670.73,-52.57 664.73,-35.86 660.66,-24.54"/>
+</g>
+<!-- N31 -->
+<g id="node31" class="node">
+<title>N31</title>
+<ellipse fill="none" stroke="#888888" stroke-width="2" cx="702.24" cy="-12.24" rx="12.24" ry="12.24"/>
+</g>
+<!-- N15&#45;&gt;N31 -->
+<g id="edge30" class="edge">
+<title>N15&#45;&gt;N31</title>
+<path fill="none" stroke="#555555" d="M683.67,-63.9C687.75,-52.57 693.75,-35.86 697.82,-24.54"/>
+</g>
+</g>
+</svg>
diff --git a/doc/images/state-tree-dark.svg b/doc/images/state-tree-dark.svg
new file mode 100644
index 000000000..ff37d4b71
--- /dev/null
+++ b/doc/images/state-tree-dark.svg
@@ -0,0 +1,178 @@
+<svg xmlns="http://www.w3.org/2000/svg" width="670.6" height="1008.59" font-family="-apple-system,BlinkMacSystemFont,'Segoe UI',Helvetica,Arial,sans-serif">
+<text x="207" y="22" font-size="14" font-weight="bold" text-anchor="middle" fill="#e6edf3">State hash-tree</text>
+<text x="541.3" y="22" font-size="14" font-weight="bold" text-anchor="middle" fill="#e6edf3">Address space</text>
+<g transform="translate(34,34)">
+<line x1="332" y1="62" x2="364" y2="44" stroke="#b9c2cf"/>
+<line x1="332" y1="62" x2="364" y2="80" stroke="#b9c2cf"/>
+<line x1="332" y1="126.05" x2="364" y2="113.3" stroke="#b9c2cf"/>
+<line x1="332" y1="126.05" x2="364" y2="138.8" stroke="#b9c2cf"/>
+<line x1="282" y1="94.0251" x2="332" y2="62" stroke="#b9c2cf"/>
+<line x1="282" y1="94.0251" x2="332" y2="126.05" stroke="#b9c2cf"/>
+<line x1="232" y1="128.552" x2="282" y2="94.0251" stroke="#b9c2cf"/>
+<line x1="232" y1="128.552" x2="364" y2="163.078" stroke="#b9c2cf"/>
+<line x1="332" y1="211.805" x2="364" y2="192.457" stroke="#b9c2cf"/>
+<line x1="332" y1="211.805" x2="364" y2="231.154" stroke="#b9c2cf"/>
+<line x1="282" y1="244.878" x2="332" y2="211.805" stroke="#b9c2cf"/>
+<line x1="282" y1="244.878" x2="364" y2="277.951" stroke="#b9c2cf"/>
+<line x1="182" y1="186.715" x2="232" y2="128.552" stroke="#b9c2cf"/>
+<line x1="182" y1="186.715" x2="282" y2="244.878" stroke="#b9c2cf"/>
+<line x1="132" y1="252.172" x2="182" y2="186.715" stroke="#b9c2cf"/>
+<line x1="132" y1="252.172" x2="364" y2="317.63" stroke="#b9c2cf"/>
+<line x1="332" y1="412.904" x2="364" y2="388.791" stroke="#b9c2cf"/>
+<line x1="332" y1="412.904" x2="364" y2="437.017" stroke="#b9c2cf"/>
+<line x1="332" y1="501.342" x2="364" y2="485.244" stroke="#b9c2cf"/>
+<line x1="332" y1="501.342" x2="364" y2="517.441" stroke="#b9c2cf"/>
+<line x1="282" y1="457.123" x2="332" y2="412.904" stroke="#b9c2cf"/>
+<line x1="282" y1="457.123" x2="332" y2="501.342" stroke="#b9c2cf"/>
+<line x1="232" y1="497.116" x2="282" y2="457.123" stroke="#b9c2cf"/>
+<line x1="232" y1="497.116" x2="364" y2="537.108" stroke="#b9c2cf"/>
+<line x1="332" y1="575.585" x2="364" y2="558.883" stroke="#b9c2cf"/>
+<line x1="332" y1="575.585" x2="364" y2="592.287" stroke="#b9c2cf"/>
+<line x1="182" y1="536.351" x2="232" y2="497.116" stroke="#b9c2cf"/>
+<line x1="182" y1="536.351" x2="332" y2="575.585" stroke="#b9c2cf"/>
+<line x1="132" y1="443" x2="364" y2="349.649" stroke="#b9c2cf"/>
+<line x1="132" y1="443" x2="182" y2="536.351" stroke="#b9c2cf"/>
+<line x1="82" y1="347.586" x2="132" y2="252.172" stroke="#b9c2cf"/>
+<line x1="82" y1="347.586" x2="132" y2="443" stroke="#b9c2cf"/>
+<line x1="332" y1="670.587" x2="364" y2="642.687" stroke="#b9c2cf"/>
+<line x1="332" y1="670.587" x2="364" y2="698.487" stroke="#b9c2cf"/>
+<line x1="282" y1="712.887" x2="332" y2="670.587" stroke="#b9c2cf"/>
+<line x1="282" y1="712.887" x2="364" y2="755.187" stroke="#b9c2cf"/>
+<line x1="332" y1="828.871" x2="364" y2="809.187" stroke="#b9c2cf"/>
+<line x1="332" y1="828.871" x2="364" y2="848.554" stroke="#b9c2cf"/>
+<line x1="232" y1="770.879" x2="282" y2="712.887" stroke="#b9c2cf"/>
+<line x1="232" y1="770.879" x2="332" y2="828.871" stroke="#b9c2cf"/>
+<line x1="182" y1="824.55" x2="232" y2="770.879" stroke="#b9c2cf"/>
+<line x1="182" y1="824.55" x2="364" y2="878.22" stroke="#b9c2cf"/>
+<line x1="32" y1="586.068" x2="82" y2="347.586" stroke="#b9c2cf"/>
+<line x1="32" y1="586.068" x2="182" y2="824.55" stroke="#b9c2cf"/>
+<line x1="-18" y1="756.111" x2="32" y2="586.068" stroke="#b9c2cf"/>
+<line x1="-18" y1="756.111" x2="364" y2="926.154" stroke="#b9c2cf"/>
+<rect x="390" y="26" width="22" height="36" fill="#2f6fb3" stroke="#b9c2cf"/>
+<text x="420" y="30" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000000000000</text>
+<text x="420" y="48" font-size="13" fill="#5b9bf0">shadow state <tspan fill="#9aa4b2" font-size="10">(2^15 bytes)</tspan></text>
+<rect x="390" y="62" width="22" height="36" fill="#ffffff" stroke="#b9c2cf"/>
+<text x="420" y="66" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000000008000</text>
+<text x="420" y="84" font-size="12" font-style="italic" fill="#ffffff">pristine</text>
+<rect x="390" y="98" width="22" height="30.6" fill="#2f6fb3" stroke="#b9c2cf"/>
+<text x="420" y="102" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000000010000</text>
+<text x="420" y="117.3" font-size="13" fill="#5b9bf0">PMAs <tspan fill="#9aa4b2" font-size="10">(2^12 bytes)</tspan></text>
+<rect x="390" y="128.6" width="22" height="48.5565" fill="#ffffff" stroke="#b9c2cf"/>
+<text x="420" y="132.6" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000000011000</text>
+<text x="420" y="156.878" font-size="12" font-style="italic" fill="#ffffff">pristine</text>
+<rect x="390" y="177.157" width="22" height="30.6" fill="#2f6fb3" stroke="#b9c2cf"/>
+<text x="420" y="181.157" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000000400000</text>
+<text x="420" y="196.457" font-size="13" fill="#5b9bf0">shadow uarch state <tspan fill="#9aa4b2" font-size="10">(2^12 bytes)</tspan></text>
+<rect x="390" y="207.757" width="22" height="46.7949" fill="#ffffff" stroke="#b9c2cf"/>
+<text x="420" y="211.757" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000000401000</text>
+<text x="420" y="235.154" font-size="12" font-style="italic" fill="#ffffff">pristine</text>
+<rect x="390" y="254.551" width="22" height="46.8" fill="#2f6fb3" stroke="#b9c2cf"/>
+<text x="420" y="258.551" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000000600000</text>
+<text x="420" y="281.951" font-size="13" fill="#5b9bf0">uarch RAM <tspan fill="#9aa4b2" font-size="10">(2^21 bytes)</tspan></text>
+<rect x="390" y="301.351" width="22" height="64.0394" fill="#ffffff" stroke="#b9c2cf"/>
+<text x="420" y="305.351" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000000800000</text>
+<text x="420" y="337.371" font-size="12" font-style="italic" fill="#ffffff">pristine</text>
+<rect x="390" y="365.391" width="22" height="46.8" fill="#2f6fb3" stroke="#b9c2cf"/>
+<text x="420" y="369.391" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000060000000</text>
+<text x="420" y="392.791" font-size="13" fill="#5b9bf0">CMIO rx buffer <tspan fill="#9aa4b2" font-size="10">(2^21 bytes)</tspan></text>
+<rect x="390" y="412.191" width="22" height="49.6529" fill="#ffffff" stroke="#b9c2cf"/>
+<text x="420" y="416.191" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000060200000</text>
+<text x="420" y="441.017" font-size="12" font-style="italic" fill="#ffffff">pristine</text>
+<rect x="390" y="461.844" width="22" height="46.8" fill="#2f6fb3" stroke="#b9c2cf"/>
+<text x="420" y="465.844" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000060800000</text>
+<text x="420" y="489.244" font-size="13" fill="#5b9bf0">CMIO tx buffer <tspan fill="#9aa4b2" font-size="10">(2^21 bytes)</tspan></text>
+<rect x="390" y="508.644" width="22" height="61.1436" fill="#ffffff" stroke="#b9c2cf"/>
+<text x="420" y="512.644" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000060a00000</text>
+<text x="420" y="543.216" font-size="12" font-style="italic" fill="#ffffff">pristine</text>
+<rect x="390" y="569.787" width="22" height="45" fill="#2f6fb3" stroke="#b9c2cf"/>
+<text x="420" y="573.787" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x000007ff00000</text>
+<text x="420" y="596.287" font-size="13" fill="#5b9bf0">DTB <tspan fill="#9aa4b2" font-size="10">(2^20 bytes)</tspan></text>
+<rect x="390" y="614.787" width="22" height="55.8" fill="#2f6fb3" stroke="#b9c2cf"/>
+<text x="420" y="618.787" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000080000000</text>
+<text x="420" y="646.687" font-size="13" fill="#5b9bf0">RAM <tspan fill="#9aa4b2" font-size="10">(2^26 bytes)</tspan></text>
+<rect x="390" y="670.587" width="22" height="55.8" fill="#ffffff" stroke="#b9c2cf"/>
+<text x="420" y="674.587" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000084000000</text>
+<text x="420" y="702.487" font-size="12" font-style="italic" fill="#ffffff">pristine</text>
+<rect x="390" y="726.387" width="22" height="57.6" fill="#2f6fb3" stroke="#b9c2cf"/>
+<text x="420" y="730.387" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000088000000</text>
+<text x="420" y="759.187" font-size="13" fill="#5b9bf0">flash drive 0 <tspan fill="#9aa4b2" font-size="10">(2^27 bytes)</tspan></text>
+<rect x="390" y="783.987" width="22" height="50.4" fill="#2f6fb3" stroke="#b9c2cf"/>
+<text x="420" y="787.987" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000090000000</text>
+<text x="420" y="813.187" font-size="13" fill="#5b9bf0">nvram 0 <tspan fill="#9aa4b2" font-size="10">(2^23 bytes)</tspan></text>
+<rect x="390" y="834.387" width="22" height="124.2" fill="#ffffff" stroke="#b9c2cf"/>
+<text x="420" y="838.387" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">0x0000090800000</text>
+<text x="420" y="900.487" font-size="12" font-style="italic" fill="#ffffff">pristine</text>
+<text x="420" y="962.587" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#9aa4b2">2^64</text>
+<polygon points="364,44 382,26.5 382,61.5" fill="#2f6fb3" stroke="#b9c2cf"/>
+<circle cx="364" cy="44" r="3.5" fill="#2f6fb3" stroke="#b9c2cf"/>
+<polygon points="364,80 382,62.5 382,97.5" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="80" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,113.3 382,98.5 382,128.1" fill="#2f6fb3" stroke="#b9c2cf"/>
+<circle cx="364" cy="113.3" r="3.5" fill="#2f6fb3" stroke="#b9c2cf"/>
+<polygon points="364,138.8 382,129.1 382,148.5" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="138.8" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,163.078 382,149.5 382,176.657" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="163.078" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,192.457 382,177.657 382,207.257" fill="#2f6fb3" stroke="#b9c2cf"/>
+<circle cx="364" cy="192.457" r="3.5" fill="#2f6fb3" stroke="#b9c2cf"/>
+<polygon points="364,231.154 382,208.257 382,254.051" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="231.154" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,277.951 382,255.051 382,300.851" fill="#2f6fb3" stroke="#b9c2cf"/>
+<circle cx="364" cy="277.951" r="3.5" fill="#2f6fb3" stroke="#b9c2cf"/>
+<polygon points="364,317.63 382,301.851 382,333.408" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="317.63" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,349.649 382,334.408 382,364.891" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="349.649" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,388.791 382,365.891 382,411.691" fill="#2f6fb3" stroke="#b9c2cf"/>
+<circle cx="364" cy="388.791" r="3.5" fill="#2f6fb3" stroke="#b9c2cf"/>
+<polygon points="364,437.017 382,412.691 382,461.344" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="437.017" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,485.244 382,462.344 382,508.144" fill="#2f6fb3" stroke="#b9c2cf"/>
+<circle cx="364" cy="485.244" r="3.5" fill="#2f6fb3" stroke="#b9c2cf"/>
+<polygon points="364,517.441 382,509.144 382,525.738" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="517.441" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,537.108 382,526.738 382,547.479" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="537.108" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,558.883 382,548.479 382,569.287" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="558.883" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,592.287 382,570.287 382,614.287" fill="#2f6fb3" stroke="#b9c2cf"/>
+<circle cx="364" cy="592.287" r="3.5" fill="#2f6fb3" stroke="#b9c2cf"/>
+<polygon points="364,642.687 382,615.287 382,670.087" fill="#2f6fb3" stroke="#b9c2cf"/>
+<circle cx="364" cy="642.687" r="3.5" fill="#2f6fb3" stroke="#b9c2cf"/>
+<polygon points="364,698.487 382,671.087 382,725.887" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="698.487" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,755.187 382,726.887 382,783.487" fill="#2f6fb3" stroke="#b9c2cf"/>
+<circle cx="364" cy="755.187" r="3.5" fill="#2f6fb3" stroke="#b9c2cf"/>
+<polygon points="364,809.187 382,784.487 382,833.887" fill="#2f6fb3" stroke="#b9c2cf"/>
+<circle cx="364" cy="809.187" r="3.5" fill="#2f6fb3" stroke="#b9c2cf"/>
+<polygon points="364,848.554 382,834.887 382,862.22" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="848.554" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,878.22 382,863.22 382,893.22" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="878.22" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<polygon points="364,926.154 382,894.22 382,958.087" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="364" cy="926.154" r="3.5" fill="#ffffff" stroke="#b9c2cf"/>
+<circle cx="332" cy="62" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="332" cy="126.05" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="282" cy="94.0251" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="232" cy="128.552" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="332" cy="211.805" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="282" cy="244.878" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="182" cy="186.715" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="132" cy="252.172" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="332" cy="412.904" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="332" cy="501.342" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="282" cy="457.123" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="232" cy="497.116" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="332" cy="575.585" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="182" cy="536.351" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="132" cy="443" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="82" cy="347.586" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="332" cy="670.587" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="282" cy="712.887" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="332" cy="828.871" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="232" cy="770.879" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="182" cy="824.55" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="32" cy="586.068" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+<circle cx="-18" cy="756.111" r="3.5" fill="#8b949e" stroke="#b9c2cf"/>
+</g>
+</svg>
diff --git a/doc/images/state-tree-light.svg b/doc/images/state-tree-light.svg
new file mode 100644
index 000000000..6b44f011f
--- /dev/null
+++ b/doc/images/state-tree-light.svg
@@ -0,0 +1,178 @@
+<svg xmlns="http://www.w3.org/2000/svg" width="670.6" height="1008.59" font-family="-apple-system,BlinkMacSystemFont,'Segoe UI',Helvetica,Arial,sans-serif">
+<text x="207" y="22" font-size="14" font-weight="bold" text-anchor="middle" fill="#1f2328">State hash-tree</text>
+<text x="541.3" y="22" font-size="14" font-weight="bold" text-anchor="middle" fill="#1f2328">Address space</text>
+<g transform="translate(34,34)">
+<line x1="332" y1="62" x2="364" y2="44" stroke="#57606a"/>
+<line x1="332" y1="62" x2="364" y2="80" stroke="#57606a"/>
+<line x1="332" y1="126.05" x2="364" y2="113.3" stroke="#57606a"/>
+<line x1="332" y1="126.05" x2="364" y2="138.8" stroke="#57606a"/>
+<line x1="282" y1="94.0251" x2="332" y2="62" stroke="#57606a"/>
+<line x1="282" y1="94.0251" x2="332" y2="126.05" stroke="#57606a"/>
+<line x1="232" y1="128.552" x2="282" y2="94.0251" stroke="#57606a"/>
+<line x1="232" y1="128.552" x2="364" y2="163.078" stroke="#57606a"/>
+<line x1="332" y1="211.805" x2="364" y2="192.457" stroke="#57606a"/>
+<line x1="332" y1="211.805" x2="364" y2="231.154" stroke="#57606a"/>
+<line x1="282" y1="244.878" x2="332" y2="211.805" stroke="#57606a"/>
+<line x1="282" y1="244.878" x2="364" y2="277.951" stroke="#57606a"/>
+<line x1="182" y1="186.715" x2="232" y2="128.552" stroke="#57606a"/>
+<line x1="182" y1="186.715" x2="282" y2="244.878" stroke="#57606a"/>
+<line x1="132" y1="252.172" x2="182" y2="186.715" stroke="#57606a"/>
+<line x1="132" y1="252.172" x2="364" y2="317.63" stroke="#57606a"/>
+<line x1="332" y1="412.904" x2="364" y2="388.791" stroke="#57606a"/>
+<line x1="332" y1="412.904" x2="364" y2="437.017" stroke="#57606a"/>
+<line x1="332" y1="501.342" x2="364" y2="485.244" stroke="#57606a"/>
+<line x1="332" y1="501.342" x2="364" y2="517.441" stroke="#57606a"/>
+<line x1="282" y1="457.123" x2="332" y2="412.904" stroke="#57606a"/>
+<line x1="282" y1="457.123" x2="332" y2="501.342" stroke="#57606a"/>
+<line x1="232" y1="497.116" x2="282" y2="457.123" stroke="#57606a"/>
+<line x1="232" y1="497.116" x2="364" y2="537.108" stroke="#57606a"/>
+<line x1="332" y1="575.585" x2="364" y2="558.883" stroke="#57606a"/>
+<line x1="332" y1="575.585" x2="364" y2="592.287" stroke="#57606a"/>
+<line x1="182" y1="536.351" x2="232" y2="497.116" stroke="#57606a"/>
+<line x1="182" y1="536.351" x2="332" y2="575.585" stroke="#57606a"/>
+<line x1="132" y1="443" x2="364" y2="349.649" stroke="#57606a"/>
+<line x1="132" y1="443" x2="182" y2="536.351" stroke="#57606a"/>
+<line x1="82" y1="347.586" x2="132" y2="252.172" stroke="#57606a"/>
+<line x1="82" y1="347.586" x2="132" y2="443" stroke="#57606a"/>
+<line x1="332" y1="670.587" x2="364" y2="642.687" stroke="#57606a"/>
+<line x1="332" y1="670.587" x2="364" y2="698.487" stroke="#57606a"/>
+<line x1="282" y1="712.887" x2="332" y2="670.587" stroke="#57606a"/>
+<line x1="282" y1="712.887" x2="364" y2="755.187" stroke="#57606a"/>
+<line x1="332" y1="828.871" x2="364" y2="809.187" stroke="#57606a"/>
+<line x1="332" y1="828.871" x2="364" y2="848.554" stroke="#57606a"/>
+<line x1="232" y1="770.879" x2="282" y2="712.887" stroke="#57606a"/>
+<line x1="232" y1="770.879" x2="332" y2="828.871" stroke="#57606a"/>
+<line x1="182" y1="824.55" x2="232" y2="770.879" stroke="#57606a"/>
+<line x1="182" y1="824.55" x2="364" y2="878.22" stroke="#57606a"/>
+<line x1="32" y1="586.068" x2="82" y2="347.586" stroke="#57606a"/>
+<line x1="32" y1="586.068" x2="182" y2="824.55" stroke="#57606a"/>
+<line x1="-18" y1="756.111" x2="32" y2="586.068" stroke="#57606a"/>
+<line x1="-18" y1="756.111" x2="364" y2="926.154" stroke="#57606a"/>
+<rect x="390" y="26" width="22" height="36" fill="#2f6fb3" stroke="#57606a"/>
+<text x="420" y="30" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000000000000</text>
+<text x="420" y="48" font-size="13" fill="#0969da">shadow state <tspan fill="#6e7781" font-size="10">(2^15 bytes)</tspan></text>
+<rect x="390" y="62" width="22" height="36" fill="#eaeef2" stroke="#57606a"/>
+<text x="420" y="66" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000000008000</text>
+<text x="420" y="84" font-size="12" font-style="italic" fill="#eaeef2">pristine</text>
+<rect x="390" y="98" width="22" height="30.6" fill="#2f6fb3" stroke="#57606a"/>
+<text x="420" y="102" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000000010000</text>
+<text x="420" y="117.3" font-size="13" fill="#0969da">PMAs <tspan fill="#6e7781" font-size="10">(2^12 bytes)</tspan></text>
+<rect x="390" y="128.6" width="22" height="48.5565" fill="#eaeef2" stroke="#57606a"/>
+<text x="420" y="132.6" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000000011000</text>
+<text x="420" y="156.878" font-size="12" font-style="italic" fill="#eaeef2">pristine</text>
+<rect x="390" y="177.157" width="22" height="30.6" fill="#2f6fb3" stroke="#57606a"/>
+<text x="420" y="181.157" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000000400000</text>
+<text x="420" y="196.457" font-size="13" fill="#0969da">shadow uarch state <tspan fill="#6e7781" font-size="10">(2^12 bytes)</tspan></text>
+<rect x="390" y="207.757" width="22" height="46.7949" fill="#eaeef2" stroke="#57606a"/>
+<text x="420" y="211.757" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000000401000</text>
+<text x="420" y="235.154" font-size="12" font-style="italic" fill="#eaeef2">pristine</text>
+<rect x="390" y="254.551" width="22" height="46.8" fill="#2f6fb3" stroke="#57606a"/>
+<text x="420" y="258.551" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000000600000</text>
+<text x="420" y="281.951" font-size="13" fill="#0969da">uarch RAM <tspan fill="#6e7781" font-size="10">(2^21 bytes)</tspan></text>
+<rect x="390" y="301.351" width="22" height="64.0394" fill="#eaeef2" stroke="#57606a"/>
+<text x="420" y="305.351" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000000800000</text>
+<text x="420" y="337.371" font-size="12" font-style="italic" fill="#eaeef2">pristine</text>
+<rect x="390" y="365.391" width="22" height="46.8" fill="#2f6fb3" stroke="#57606a"/>
+<text x="420" y="369.391" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000060000000</text>
+<text x="420" y="392.791" font-size="13" fill="#0969da">CMIO rx buffer <tspan fill="#6e7781" font-size="10">(2^21 bytes)</tspan></text>
+<rect x="390" y="412.191" width="22" height="49.6529" fill="#eaeef2" stroke="#57606a"/>
+<text x="420" y="416.191" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000060200000</text>
+<text x="420" y="441.017" font-size="12" font-style="italic" fill="#eaeef2">pristine</text>
+<rect x="390" y="461.844" width="22" height="46.8" fill="#2f6fb3" stroke="#57606a"/>
+<text x="420" y="465.844" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000060800000</text>
+<text x="420" y="489.244" font-size="13" fill="#0969da">CMIO tx buffer <tspan fill="#6e7781" font-size="10">(2^21 bytes)</tspan></text>
+<rect x="390" y="508.644" width="22" height="61.1436" fill="#eaeef2" stroke="#57606a"/>
+<text x="420" y="512.644" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000060a00000</text>
+<text x="420" y="543.216" font-size="12" font-style="italic" fill="#eaeef2">pristine</text>
+<rect x="390" y="569.787" width="22" height="45" fill="#2f6fb3" stroke="#57606a"/>
+<text x="420" y="573.787" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x000007ff00000</text>
+<text x="420" y="596.287" font-size="13" fill="#0969da">DTB <tspan fill="#6e7781" font-size="10">(2^20 bytes)</tspan></text>
+<rect x="390" y="614.787" width="22" height="55.8" fill="#2f6fb3" stroke="#57606a"/>
+<text x="420" y="618.787" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000080000000</text>
+<text x="420" y="646.687" font-size="13" fill="#0969da">RAM <tspan fill="#6e7781" font-size="10">(2^26 bytes)</tspan></text>
+<rect x="390" y="670.587" width="22" height="55.8" fill="#eaeef2" stroke="#57606a"/>
+<text x="420" y="674.587" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000084000000</text>
+<text x="420" y="702.487" font-size="12" font-style="italic" fill="#eaeef2">pristine</text>
+<rect x="390" y="726.387" width="22" height="57.6" fill="#2f6fb3" stroke="#57606a"/>
+<text x="420" y="730.387" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000088000000</text>
+<text x="420" y="759.187" font-size="13" fill="#0969da">flash drive 0 <tspan fill="#6e7781" font-size="10">(2^27 bytes)</tspan></text>
+<rect x="390" y="783.987" width="22" height="50.4" fill="#2f6fb3" stroke="#57606a"/>
+<text x="420" y="787.987" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000090000000</text>
+<text x="420" y="813.187" font-size="13" fill="#0969da">nvram 0 <tspan fill="#6e7781" font-size="10">(2^23 bytes)</tspan></text>
+<rect x="390" y="834.387" width="22" height="124.2" fill="#eaeef2" stroke="#57606a"/>
+<text x="420" y="838.387" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">0x0000090800000</text>
+<text x="420" y="900.487" font-size="12" font-style="italic" fill="#eaeef2">pristine</text>
+<text x="420" y="962.587" font-size="10" font-family="ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" fill="#6e7781">2^64</text>
+<polygon points="364,44 382,26.5 382,61.5" fill="#2f6fb3" stroke="#57606a"/>
+<circle cx="364" cy="44" r="3.5" fill="#2f6fb3" stroke="#57606a"/>
+<polygon points="364,80 382,62.5 382,97.5" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="80" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,113.3 382,98.5 382,128.1" fill="#2f6fb3" stroke="#57606a"/>
+<circle cx="364" cy="113.3" r="3.5" fill="#2f6fb3" stroke="#57606a"/>
+<polygon points="364,138.8 382,129.1 382,148.5" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="138.8" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,163.078 382,149.5 382,176.657" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="163.078" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,192.457 382,177.657 382,207.257" fill="#2f6fb3" stroke="#57606a"/>
+<circle cx="364" cy="192.457" r="3.5" fill="#2f6fb3" stroke="#57606a"/>
+<polygon points="364,231.154 382,208.257 382,254.051" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="231.154" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,277.951 382,255.051 382,300.851" fill="#2f6fb3" stroke="#57606a"/>
+<circle cx="364" cy="277.951" r="3.5" fill="#2f6fb3" stroke="#57606a"/>
+<polygon points="364,317.63 382,301.851 382,333.408" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="317.63" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,349.649 382,334.408 382,364.891" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="349.649" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,388.791 382,365.891 382,411.691" fill="#2f6fb3" stroke="#57606a"/>
+<circle cx="364" cy="388.791" r="3.5" fill="#2f6fb3" stroke="#57606a"/>
+<polygon points="364,437.017 382,412.691 382,461.344" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="437.017" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,485.244 382,462.344 382,508.144" fill="#2f6fb3" stroke="#57606a"/>
+<circle cx="364" cy="485.244" r="3.5" fill="#2f6fb3" stroke="#57606a"/>
+<polygon points="364,517.441 382,509.144 382,525.738" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="517.441" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,537.108 382,526.738 382,547.479" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="537.108" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,558.883 382,548.479 382,569.287" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="558.883" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,592.287 382,570.287 382,614.287" fill="#2f6fb3" stroke="#57606a"/>
+<circle cx="364" cy="592.287" r="3.5" fill="#2f6fb3" stroke="#57606a"/>
+<polygon points="364,642.687 382,615.287 382,670.087" fill="#2f6fb3" stroke="#57606a"/>
+<circle cx="364" cy="642.687" r="3.5" fill="#2f6fb3" stroke="#57606a"/>
+<polygon points="364,698.487 382,671.087 382,725.887" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="698.487" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,755.187 382,726.887 382,783.487" fill="#2f6fb3" stroke="#57606a"/>
+<circle cx="364" cy="755.187" r="3.5" fill="#2f6fb3" stroke="#57606a"/>
+<polygon points="364,809.187 382,784.487 382,833.887" fill="#2f6fb3" stroke="#57606a"/>
+<circle cx="364" cy="809.187" r="3.5" fill="#2f6fb3" stroke="#57606a"/>
+<polygon points="364,848.554 382,834.887 382,862.22" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="848.554" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,878.22 382,863.22 382,893.22" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="878.22" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<polygon points="364,926.154 382,894.22 382,958.087" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="364" cy="926.154" r="3.5" fill="#eaeef2" stroke="#57606a"/>
+<circle cx="332" cy="62" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="332" cy="126.05" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="282" cy="94.0251" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="232" cy="128.552" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="332" cy="211.805" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="282" cy="244.878" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="182" cy="186.715" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="132" cy="252.172" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="332" cy="412.904" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="332" cy="501.342" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="282" cy="457.123" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="232" cy="497.116" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="332" cy="575.585" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="182" cy="536.351" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="132" cy="443" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="82" cy="347.586" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="332" cy="670.587" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="282" cy="712.887" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="332" cy="828.871" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="232" cy="770.879" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="182" cy="824.55" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="32" cy="586.068" r="3.5" fill="#8b949e" stroke="#57606a"/>
+<circle cx="-18" cy="756.111" r="3.5" fill="#8b949e" stroke="#57606a"/>
+</g>
+</svg>
diff --git a/doc/images/state-tree.lua b/doc/images/state-tree.lua
new file mode 100644
index 000000000..0762dd7fe
--- /dev/null
+++ b/doc/images/state-tree.lua
@@ -0,0 +1,301 @@
+-- Renders the machine state as a Merkle tree over the address space, as an SVG themed for a
+-- dark (default) or light background. Every complete subtree is a filled triangle with a root
+-- node at its apex: blue for a named memory range, white (light gray in the light theme) for
+-- an elided pristine subtree. Internal nodes are circles joined by edges, colored by what
+-- their subtree holds: blue if all ranges, white if all pristine, gray if mixed. A gap that
+-- straddles a split boundary is two triangles (one from above, one from below) sharing a
+-- single band in the bar. Band height grows linearly with log2 of the whole span; a shared
+-- band splits it between its triangles by each one's log2 span (log2(B + C) is not log2(B) +
+-- log2(C), so the parts are scaled to add up). Run: `lua5.4 state-tree.lua [dark|light] > out.svg`.
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+local m = cartesi.machine({ -- sample machine; its memory ranges are what the diagram shows
+    ram = { length = 64 << 20 }, -- 64 MiB = 2^26 bytes
+    flash_drive = { { length = 128 << 20 } }, -- one drive of 128 MiB = 2^27 bytes
+    nvram = { { length = 8 << 20 } }, -- one region of 8 MiB = 2^23 bytes
+})
+local TWO64 = 2.0 ^ 64 -- end of the address space; a float because 2^64 exceeds Lua's 64-bit integers
+local function lg(value) -- base-2 logarithm of value
+    return math.log(value, 2)
+end
+local function rowh(extent) -- band height in SVG units: 9 plus 1.8 per doubling of the byte extent
+    return 1.8 * lg(extent) + 9
+end
+local function hex(addr) -- "0x" plus 13 zero-padded hex digits; prints 0 when addr has no integer form
+    return ("0x%013x"):format(math.tointeger(addr) or math.tointeger(math.floor(addr)) or 0)
+end
+
+local FONT = "-apple-system,BlinkMacSystemFont,'Segoe UI',Helvetica,Arial,sans-serif" -- default font-family set on <svg>
+local MONO = "ui-monospace,SFMono-Regular,Menlo,Consolas,monospace" -- font-family of the address labels
+-- Palette per theme. The first argument selects "light" or "dark"; anything else (or no
+-- argument) falls back to dark, so a <picture> in the page can serve the variant matching the
+-- reader's theme. BLUE (range fill) and GRAY (mixed node) read on both backgrounds; the rest flip.
+local THEMES = { -- FG: headers, MUT: addresses and sizes, EDGE: strokes, WHITE: pristine fill, BLUE_T: range names
+    dark = { FG = "#e6edf3", MUT = "#9aa4b2", EDGE = "#b9c2cf", WHITE = "#ffffff", BLUE_T = "#5b9bf0" },
+    light = { FG = "#1f2328", MUT = "#6e7781", EDGE = "#57606a", WHITE = "#eaeef2", BLUE_T = "#0969da" },
+}
+local theme = THEMES[arg[1]] or THEMES.dark
+local FG, MUT, EDGE, WHITE, BLUE_T = theme.FG, theme.MUT, theme.EDGE, theme.WHITE, theme.BLUE_T
+local BLUE, GRAY = "#2f6fb3", "#8b949e"
+
+local ranges = {} -- the machine's memory ranges as { start, len, desc }, sorted by start address
+for _, entry in ipairs(m:get_address_ranges()) do
+    if entry.is_memory then -- address ranges not flagged as memory are left out of the picture
+        table.insert(ranges, { start = entry.start, len = entry.length, desc = entry.description })
+    end
+end
+table.sort(ranges, function(lhs, rhs)
+    return rhs.start > lhs.start
+end)
+
+-- Returns, in their sorted order, the entries of `ranges` lying entirely inside [lo, hi).
+local function rangesin(lo, hi)
+    local inside = {}
+    for _, rng in ipairs(ranges) do
+        if not (rng.start < lo or rng.start + rng.len > hi) then
+            table.insert(inside, rng)
+        end
+    end
+    return inside
+end
+
+-- Binary Merkle tree by address bisection, contracting all-pristine subtrees to one triangle.
+-- A leaf is either a memory range, or a pristine interval { tlo, thi }.
+local function build(lo, hi)
+    local upper, lower, core -- pristine spans peeled off above / below, and the subtree between them
+    while true do
+        local within = rangesin(lo, hi)
+        if #within == 0 then -- no range fits in [lo, hi): the whole interval is one pristine leaf
+            core = { tlo = lo, thi = hi }
+            break
+        end
+        if #within == 1 and within[1].start == lo and within[1].start + within[1].len == hi then
+            core = within[1] -- a single range covering [lo, hi) exactly is a range leaf
+            break
+        end
+        local mid = lo + (hi - lo) / 2
+        local nl, nr = 0, 0 -- contained ranges starting below mid / at or above mid
+        for _, r in ipairs(within) do
+            if r.start < mid then
+                nl = nl + 1
+            else
+                nr = nr + 1
+            end
+        end
+        if nl > 0 and nr > 0 then -- both halves hold ranges: internal node, recurse into each half
+            core = { l = build(lo, mid), r = build(mid, hi) }
+            break
+        elseif nr == 0 then -- nothing starts in the upper half: grow `upper` down to mid, keep the lower half
+            upper = { tlo = mid, thi = upper and upper.thi or hi }
+            hi = mid
+        else -- nothing starts in the lower half: grow `lower` up to mid, keep the upper half
+            lower = { tlo = lower and lower.tlo or lo, thi = mid }
+            lo = mid
+        end
+    end
+    if upper then -- re-attach the peeled spans: upper pairs with core first, then lower goes on the left
+        core = { l = core, r = upper }
+    end
+    if lower then
+        core = { l = lower, r = core }
+    end
+    return core
+end
+local tree = build(0, TWO64) -- the whole 64-bit address space
+
+-- Node color: blue if its subtree holds only ranges, white if only pristine, gray if mixed.
+-- classify reports the two facts behind that: (holds a range, holds a pristine interval).
+local function classify(node)
+    if node.desc then -- range leaf
+        return true, false
+    elseif node.tlo then -- pristine leaf
+        return false, true
+    end
+    local left_range, left_pristine = classify(node.l)
+    local right_range, right_pristine = classify(node.r)
+    return left_range or right_range, left_pristine or right_pristine
+end
+local function colorof(node) -- fill color for the dot of an internal node
+    local has_range, has_pristine = classify(node)
+    if not has_range then
+        return WHITE -- nothing but pristine below
+    elseif has_pristine then
+        return GRAY -- ranges and pristine mixed
+    else
+        return BLUE -- nothing but ranges below
+    end
+end
+
+local function is_leaf(node) -- true for a range leaf (has desc) or a pristine leaf (has tlo)
+    return not (node.desc == nil and node.tlo == nil)
+end
+local rows = {} -- the tree's leaves from lowest to highest address, one per drawn triangle
+local function inorder(node) -- left-to-right walk that appends every leaf to rows
+    if not is_leaf(node) then
+        inorder(node.l)
+        inorder(node.r)
+    else
+        table.insert(rows, node)
+    end
+end
+inorder(tree)
+
+local TOP, BAR_W, DX, TRI_W = 26, 22, 50, 18 -- y of the first band, bar width, tree column spacing, leaf triangle width
+local BAR_X = 40 + 7 * DX -- x of the address-space bar's left edge
+local GAP = 8 -- horizontal gap so leaf triangles do not touch the address-space bar
+local X_LEAF = BAR_X - GAP -- x of the leaf triangles' base; their apex sits TRI_W to the left
+
+-- Geometry. A band is as tall as rowh of its whole span; when consecutive pristine triangles
+-- share one band, that height is divided among them in proportion to each one's log2 span.
+local bands = {}
+local y, i = TOP, 1
+while i <= #rows do
+    local leaf = rows[i]
+    if not leaf.tlo then
+        leaf.h = rowh(leaf.len)
+        leaf.y0, leaf.cy = y, y + leaf.h / 2
+        table.insert(bands, { range = leaf })
+        y = y + leaf.h
+        i = i + 1
+    else
+        local last = i -- index of the final leaf in this run of adjacent pristine leaves
+        while last < #rows and rows[last + 1].tlo do
+            last = last + 1
+        end
+        local band_top = y
+        local band_h = rowh(rows[last].thi - rows[i].tlo)
+        local total = 0
+        for k = i, last do
+            total = total + lg(rows[k].thi - rows[k].tlo)
+        end
+        for k = i, last do
+            local share = band_h * lg(rows[k].thi - rows[k].tlo) / total
+            rows[k].y0, rows[k].h, rows[k].cy = y, share, y + share / 2
+            y = y + share
+        end
+        table.insert(bands, { pristine = true, top = band_top, bot = y, start = rows[i].tlo })
+        i = last + 1
+    end
+end
+local BAR_BOT = y
+
+-- Positions the tree right-to-left: a node's column is one further left than its deeper child.
+local edges, dots = {}, {}
+local function layout(node) -- returns x, y and height (0 for a leaf); records edges and dots as it goes
+    if is_leaf(node) then
+        return X_LEAF - TRI_W, node.cy, 0
+    end
+    local left_x, left_y, left_depth = layout(node.l)
+    local right_x, right_y, right_depth = layout(node.r)
+    local depth = 1 + math.max(left_depth, right_depth)
+    local x, mid_y = X_LEAF - depth * DX, (left_y + right_y) / 2
+    table.insert(edges, { x, mid_y, left_x, left_y })
+    table.insert(edges, { x, mid_y, right_x, right_y })
+    table.insert(dots, { x = x, y = mid_y, color = colorof(node) })
+    return x, mid_y, depth
+end
+local rootx = layout(tree)
+
+-- Bounds: the root is the leftmost point and the range labels reach furthest right. Measure
+-- that extent, then shift the drawing into a padded viewport that leaves room for the headers.
+local TX = BAR_X + BAR_W + 8
+local maxr = TX + 60
+for _, band in ipairs(bands) do
+    if band.range then
+        local caption = ("%s (2^%d bytes)"):format(band.range.desc, util.ilog2(band.range.len))
+        maxr = math.max(maxr, TX + #caption * 6.6) -- rough width estimate: 6.6 units per character
+    end
+end
+local PAD, HEADER = 16, 34
+local SHIFT = PAD - rootx
+local W, H = SHIFT + maxr + 12, HEADER + BAR_BOT + 16
+
+local s = {} -- output lines of the SVG, joined with newlines when written
+local function p(...) -- formats its arguments with string.format and appends the result to s
+    table.insert(s, string.format(...))
+end
+p('<svg xmlns="http://www.w3.org/2000/svg" width="%g" height="%g" font-family="%s">', W, H, FONT)
+p( -- left header, centered between the root and the leaf apexes
+    '<text x="%g" y="22" font-size="14" font-weight="bold" text-anchor="middle" fill="%s">State hash-tree</text>',
+    SHIFT + (rootx + X_LEAF - TRI_W) / 2,
+    FG
+)
+p( -- right header, centered between the bar's left edge and the estimated right edge of the labels
+    '<text x="%g" y="22" font-size="14" font-weight="bold" text-anchor="middle" fill="%s">Address space</text>',
+    SHIFT + (BAR_X + maxr) / 2,
+    FG
+)
+p('<g transform="translate(%g,%g)">', SHIFT, HEADER) -- the rest is emitted in layout coordinates inside this group
+for _, e in ipairs(edges) do -- edges go first so that the triangles and dots emitted later paint over them
+    p('<line x1="%g" y1="%g" x2="%g" y2="%g" stroke="%s"/>', e[1], e[2], e[3], e[4], EDGE)
+end
+for _, b in ipairs(bands) do -- one bar segment per band, with its start address and a caption
+    if b.pristine then
+        p(
+            '<rect x="%g" y="%g" width="%g" height="%g" fill="%s" stroke="%s"/>',
+            BAR_X,
+            b.top,
+            BAR_W,
+            b.bot - b.top,
+            WHITE,
+            EDGE
+        )
+        p(
+            '<text x="%g" y="%g" font-size="10" font-family="%s" fill="%s">%s</text>',
+            TX,
+            b.top + 4,
+            MONO,
+            MUT,
+            hex(b.start)
+        )
+        p(
+            '<text x="%g" y="%g" font-size="12" font-style="italic" fill="%s">pristine</text>',
+            TX,
+            (b.top + b.bot) / 2 + 4,
+            theme == THEMES.light and MUT or WHITE -- light WHITE (#eaeef2) is unreadable as text on a light page
+        )
+    else
+        local lf = b.range
+        p('<rect x="%g" y="%g" width="%g" height="%g" fill="%s" stroke="%s"/>', BAR_X, lf.y0, BAR_W, lf.h, BLUE, EDGE)
+        p(
+            '<text x="%g" y="%g" font-size="10" font-family="%s" fill="%s">%s</text>',
+            TX,
+            lf.y0 + 4,
+            MONO,
+            MUT,
+            hex(lf.start)
+        )
+        p( -- range name in BLUE_T followed by its size as a power of two in MUT
+            '<text x="%g" y="%g" font-size="13" fill="%s">%s '
+                .. '<tspan fill="%s" font-size="10">(2^%d bytes)</tspan></text>',
+            TX,
+            lf.cy + 4,
+            BLUE_T,
+            lf.desc,
+            MUT,
+            util.ilog2(lf.len)
+        )
+    end
+end
+p('<text x="%g" y="%g" font-size="10" font-family="%s" fill="%s">2^64</text>', TX, BAR_BOT + 4, MONO, MUT)
+for _, leaf in ipairs(rows) do -- one triangle per leaf: apex toward the tree, base facing the bar
+    local paint = leaf.tlo and WHITE or BLUE
+    p(
+        '<polygon points="%g,%g %g,%g %g,%g" fill="%s" stroke="%s"/>',
+        X_LEAF - TRI_W,
+        leaf.cy,
+        X_LEAF,
+        leaf.y0 + 0.5,
+        X_LEAF,
+        leaf.y0 + leaf.h - 0.5,
+        paint,
+        EDGE
+    )
+    p('<circle cx="%g" cy="%g" r="3.5" fill="%s" stroke="%s"/>', X_LEAF - TRI_W, leaf.cy, paint, EDGE)
+end
+for _, dot in ipairs(dots) do -- internal nodes, emitted last inside the group
+    p('<circle cx="%g" cy="%g" r="3.5" fill="%s" stroke="%s"/>', dot.x, dot.y, dot.color, EDGE)
+end
+p("</g>")
+p("</svg>")
+io.write(table.concat(s, "\n"), "\n")
diff --git a/doc/recipes/Dockerfile.rootfs-docs b/doc/recipes/Dockerfile.rootfs-docs
new file mode 100644
index 000000000..274bf9ee2
--- /dev/null
+++ b/doc/recipes/Dockerfile.rootfs-docs
@@ -0,0 +1,103 @@
+ARG UBUNTU_TAG=24.04
+ARG UBUNTU_DIGEST=sha256:c4a8d5503dfb2a3eb8ab5f807da5bc69a85730fb49b5cfca2330194ebcc41c7b
+ARG RUST_TAG=1.83-slim
+ARG RUST_DIGEST=sha256:540c902e99c384163b688bbd8b5b8520e94e7731b27f7bd0eaa56ae1960627ab
+ARG GO_TAG=1.23-bookworm
+ARG GO_DIGEST=sha256:167053a2bb901972bf2c1611f8f52c44d5fe7e762e5cab213708d82c421614db
+ARG UBUNTU_SNAPSHOT=20260421T000000Z
+ARG MACHINE_GUEST_TOOLS_VERSION=0.18.0-test4
+ARG MACHINE_GUEST_TOOLS_DEB_SHA256=066ce57d039eada31159dce3a1e0704f3e7518f4828e66339b2a326d73a2e928
+ARG MACHINE_GUEST_TOOLS_TARGZ_SHA256=65b0a076a9b8a362b300eae2636cca0abe9500eeabfaee13e5cfa7723af5a0c0
+ARG DEBIAN_FRONTEND=noninteractive
+
+# Stage 1: cross-compile the C and C++ programs natively on the build platform ($BUILDPLATFORM), without emulation.
+FROM --platform=$BUILDPLATFORM ubuntu:${UBUNTU_TAG}@${UBUNTU_DIGEST} AS c-cpp-builder
+ARG DEBIAN_FRONTEND
+ARG MACHINE_GUEST_TOOLS_VERSION
+ARG MACHINE_GUEST_TOOLS_TARGZ_SHA256
+ARG UBUNTU_SNAPSHOT
+RUN apt-get update && \
+    apt-get install -y --no-install-recommends ca-certificates && \
+    apt-get update --snapshot=${UBUNTU_SNAPSHOT} && \
+    apt-get install -y --no-install-recommends g++-14-riscv64-linux-gnu && \
+    rm -rf /var/lib/apt/lists/*
+ADD --checksum=sha256:${MACHINE_GUEST_TOOLS_TARGZ_SHA256} \
+    https://github.com/cartesi/machine-guest-tools/releases/download/v${MACHINE_GUEST_TOOLS_VERSION}/machine-guest-tools_riscv64.tar.gz \
+    /tmp/machine-guest-tools_riscv64.tar.gz
+RUN mkdir -p /sysroot && \
+    tar -xzf /tmp/machine-guest-tools_riscv64.tar.gz -C /sysroot && \
+    rm -f /tmp/machine-guest-tools_riscv64.tar.gz
+COPY hello/hello.c   /work/hello.c
+COPY hello/hello.cpp /work/hello.cpp
+COPY puppet.c        /work/puppet.c
+RUN riscv64-linux-gnu-gcc-14 -O2 -std=c17   -o /work/hello-c   /work/hello.c && \
+    riscv64-linux-gnu-g++-14 -O2 -std=c++23 -o /work/hello-cpp /work/hello.cpp && \
+    riscv64-linux-gnu-gcc-14 -O2 -std=c17 \
+        -I/sysroot/usr/include -L/sysroot/usr/lib \
+        -o /work/puppet /work/puppet.c -lcmt
+
+# Stage 2: cross-compile the Rust program natively on the build platform ($BUILDPLATFORM), without emulation.
+FROM --platform=$BUILDPLATFORM rust:${RUST_TAG}@${RUST_DIGEST} AS rust-builder
+ARG DEBIAN_FRONTEND
+RUN apt-get update && \
+    apt-get install -y --no-install-recommends gcc-riscv64-linux-gnu libc6-dev-riscv64-cross && \
+    rm -rf /var/lib/apt/lists/* && \
+    rustup target add riscv64gc-unknown-linux-gnu
+WORKDIR /work
+RUN cargo init --name hello-rust --vcs none .
+COPY hello/hello.rs /work/src/main.rs
+ENV CARGO_TARGET_RISCV64GC_UNKNOWN_LINUX_GNU_LINKER=riscv64-linux-gnu-gcc
+RUN cargo build --release --target riscv64gc-unknown-linux-gnu
+
+# Stage 3: cross-compile the Go program natively on the build platform ($BUILDPLATFORM), without emulation.
+FROM --platform=$BUILDPLATFORM golang:${GO_TAG}@${GO_DIGEST} AS go-builder
+WORKDIR /work
+COPY hello/hello.go /work/hello.go
+ENV GOARCH=riscv64 GOOS=linux CGO_ENABLED=0
+RUN go build -ldflags="-s -w" -o /work/hello-go /work/hello.go
+
+# Stage 4: assemble the rootfs. This is the only stage that runs emulated (riscv64 through binfmt+QEMU),
+# because it has no --platform of its own and takes `--platform=linux/riscv64` from the buildx invocation.
+FROM ubuntu:${UBUNTU_TAG}@${UBUNTU_DIGEST} AS rootfs
+ARG DEBIAN_FRONTEND
+ARG MACHINE_GUEST_TOOLS_VERSION
+ARG MACHINE_GUEST_TOOLS_DEB_SHA256
+ARG UBUNTU_SNAPSHOT
+ADD --checksum=sha256:${MACHINE_GUEST_TOOLS_DEB_SHA256} \
+    https://github.com/cartesi/machine-guest-tools/releases/download/v${MACHINE_GUEST_TOOLS_VERSION}/machine-guest-tools_riscv64.deb \
+    /tmp/
+RUN apt-get update && \
+    apt-get install -y --no-install-recommends ca-certificates && \
+    apt-get update --snapshot=${UBUNTU_SNAPSHOT} && \
+    apt-get install -y --no-install-recommends \
+        /tmp/machine-guest-tools_riscv64.deb \
+        libstdc++6 \
+        bc curl device-tree-compiler gforth jq lua5.4 lua-socket \
+        python3-minimal tcl && \
+    apt-get purge -y --auto-remove ca-certificates && \
+    rm -f /var/cache/ldconfig/aux-cache && \
+    rm -rf /var/log/* && \
+    rm -rf /var/lib/apt/lists/* /tmp/machine-guest-tools_riscv64.deb
+
+# RUN apt-get update && \
+#     apt-get install -y --no-install-recommends nodejs ruby php-cli && \
+#     rm -rf /var/lib/apt/lists/*
+
+COPY --from=c-cpp-builder /work/hello-c                                               /home/dapp/hello-c
+COPY --from=c-cpp-builder /work/hello-cpp                                             /home/dapp/hello-cpp
+COPY --from=c-cpp-builder /work/puppet                                                /home/dapp/puppet
+COPY --from=rust-builder  /work/target/riscv64gc-unknown-linux-gnu/release/hello-rust /home/dapp/hello-rust
+COPY --from=go-builder    /work/hello-go                                              /home/dapp/hello-go
+COPY hello/hello.4th /home/dapp/hello.4th
+COPY hello/hello.awk /home/dapp/hello.awk
+COPY hello/hello.js  /home/dapp/hello.js
+COPY hello/hello.lua /home/dapp/hello.lua
+COPY hello/hello.pl  /home/dapp/hello.pl
+COPY hello/hello.php /home/dapp/hello.php
+COPY hello/hello.py  /home/dapp/hello.py
+COPY hello/hello.rb  /home/dapp/hello.rb
+COPY hello/hello.sh  /home/dapp/hello.sh
+COPY hello/hello.tcl /home/dapp/hello.tcl
+COPY hello/all.sh    /home/dapp/all.sh
+RUN chmod +x /home/dapp/hello-c /home/dapp/hello-cpp /home/dapp/hello-rust /home/dapp/hello-go /home/dapp/puppet /home/dapp/hello.* /home/dapp/all.sh && \
+    chown -R dapp:dapp /home/dapp
diff --git a/doc/recipes/all-cycles.sh b/doc/recipes/all-cycles.sh
new file mode 100755
index 000000000..25faa6b5b
--- /dev/null
+++ b/doc/recipes/all-cycles.sh
@@ -0,0 +1,2 @@
+#!/bin/bash
+grep -oP 'Cycles: \K[0-9]+'  # stdin filter: print only the digits after each "Cycles: " (\K drops the prefix)
diff --git a/doc/recipes/all-hashes.sh b/doc/recipes/all-hashes.sh
new file mode 100755
index 000000000..c58865649
--- /dev/null
+++ b/doc/recipes/all-hashes.sh
@@ -0,0 +1,2 @@
+#!/bin/bash
+grep -oP '[0-9]+: \K[a-fA-F0-9]{64}'  # stdin filter: print each 64-hex-digit value that follows "<digits>: "
diff --git a/doc/recipes/build-rootfs-docs-license.sh b/doc/recipes/build-rootfs-docs-license.sh
new file mode 100755
index 000000000..f156503e0
--- /dev/null
+++ b/doc/recipes/build-rootfs-docs-license.sh
@@ -0,0 +1,47 @@
+#!/bin/sh
+set -eu
+
+# Generate a package and license report for rootfs-docs.ext2 in markdown,
+# the same way machine-guest-tools does for its rootfs. Instead of
+# rebuilding the rootfs docker image (which would require riscv64
+# emulation), the committed ext2 is converted into a docker image with
+# "docker import", which executes nothing. The report therefore describes
+# the exact committed artifact. It goes to stdout, diagnostics to stderr.
+
+image=cartesi/rootfs-docs
+
+# The scanner resolves package lists against the archive snapshot the image was
+# built from, so source-package URIs stay stable. Abort if it cannot be read.
+APT_SNAPSHOT=$(sed -n 's/^ARG UBUNTU_SNAPSHOT=//p' Dockerfile.rootfs-docs)
+export APT_SNAPSHOT="${APT_SNAPSHOT:?UBUNTU_SNAPSHOT not found in Dockerfile.rootfs-docs}"
+
+# scan-local.sh builds this same scanner image again later (cached). It is
+# built here first because it is also where the ext2 is unpacked, by root,
+# on a Linux filesystem, so ownership and permissions survive into the tar.
+docker buildx build --load -t repo-info:local-dpkg \
+    -f third-party/repo-info/Dockerfile.local-dpkg \
+    third-party/repo-info 1>&2
+
+docker run --rm -v "$PWD/rootfs-docs.ext2:/rootfs.ext2:ro" repo-info:local-dpkg \
+    sh -c 'mkdir /x && debugfs -R "rdump / /x" /rootfs.ext2 1>&2 && \
+           tar -C /x --exclude=./lost+found -cf - .' |
+    docker import --platform linux/riscv64 - "$image" 1>&2
+
+# Whether docker inspect can format scan-local.sh's metadata template for
+# an imported image depends on the image store. The containerd store keeps
+# a sparse config that fails the template (only its leading newline is
+# printed), while the classic store renders the full section. Some of its
+# fields are also not byte-stable across regenerations. The filter below
+# drops the whole Docker Metadata section, restoring the blank line the
+# failed template would have left, so the report comes out the same in
+# both cases.
+# Capture the scan before filtering so a scanner failure (e.g. an
+# unresolvable repository source, see gather-dpkg.sh) aborts under set -e
+# instead of being masked by the awk at the tail of a pipeline.
+report=$(cd third-party/repo-info && ./scan-local.sh "$image" linux/riscv64)
+printf '%s\n' "$report" |
+    awk '
+        /^## Docker Metadata$/ { skip = 1; next }
+        skip && /^## / { skip = 0; print "" }
+        !skip
+    '
diff --git a/doc/recipes/build-rootfs-docs.sh b/doc/recipes/build-rootfs-docs.sh
new file mode 100755
index 000000000..c499f6180
--- /dev/null
+++ b/doc/recipes/build-rootfs-docs.sh
@@ -0,0 +1,17 @@
+#!/bin/sh
+set -eu  # stop at the first failing command or unset variable
+
+# Cross-compile the dapp and assemble the rootfs as a flattened tarball.
+docker buildx build --platform=linux/riscv64 \
+    --output type=tar,dest=rootfs-docs.tar \
+    -f Dockerfile.rootfs-docs .
+
+# Convert the tarball into an ext2 image.
+xgenext2fs -fzB 4096 -i 4096 -r +4000 \
+    -a rootfs-docs.tar -L docs rootfs-docs.ext2
+rm -f rootfs-docs.tar  # the tarball is only an intermediate artifact
+
+# docs:begin null
+# Embed the recipe-input fingerprint, used to detect a stale image.
+e2cp rootfs-docs.inputs.sha256 rootfs-docs.ext2:/var/log/rootfs-docs.inputs.sha256
+# docs:end null
diff --git a/doc/recipes/calc.sh b/doc/recipes/calc.sh
new file mode 100755
index 000000000..951fea684
--- /dev/null
+++ b/doc/recipes/calc.sh
@@ -0,0 +1,22 @@
+#!/bin/bash
+# Rollup loop: evaluate each request payload with bc and emit the result, accepting on success.
+set -o pipefail
+
+declare -A emit=([advance_state]=notice [inspect_state]=report)  # output kind per request type
+reqfile=$(mktemp /tmp/calc.XXXXXX)
+trap 'rm -f "$reqfile"' EXIT  # the loop below never finishes, so clean up when the shell exits
+status="accept"
+while :; do
+  rollup "$status" > "$reqfile"
+  request_type=$(jq -j .request_type < "$reqfile")
+  status="reject"  # stays "reject" unless every stage of the pipeline below succeeds
+  jq -j '.data.payload' < "$reqfile" | \
+    hex --decode | \
+      bc | \
+        grep . | \
+          tr -d '\\\n' | \
+            hex --encode | \
+              jq -R '{ payload: . }' | \
+                rollup "${emit[$request_type]}" > /dev/null && \
+                  status="accept"
+done
diff --git a/doc/recipes/cartesi-rollup-data.lua b/doc/recipes/cartesi-rollup-data.lua
new file mode 100755
index 000000000..535175f37
--- /dev/null
+++ b/doc/recipes/cartesi-rollup-data.lua
@@ -0,0 +1,200 @@
+#!/usr/bin/env lua5.4
+-- Host-side mirror of /usr/bin/rollup.
+-- Encodes advance/inspect requests for the CMIO rx buffer; decodes
+-- voucher/notice/report/exception/delegate-call-voucher records from
+-- the CMIO tx buffer.
+
+local evmu = require("cartesi.evmu")
+local json = require("dkjson")
+
+local EVM_ADVANCE = "EvmAdvance(uint256,address,address,uint256,uint256,uint256,uint256,bytes)" -- advance requests
+local VOUCHER = "Voucher(address,uint256,bytes)" -- used by "decode voucher"
+local DELEGATE = "DelegateCallVoucher(address,bytes)" -- used by "decode delegate-call-voucher"
+local NOTICE = "Notice(bytes)" -- used by "decode notice"
+
+local USAGE = [[Usage:
+    cartesi-rollup-data.lua <direction> <type>
+
+Reads from stdin and writes to stdout. Encoding subcommands take a
+JSON description and write the binary record. Decoding subcommands
+take the binary record and write a JSON description.
+
+  encode <type>    JSON stdin -> binary stdout
+
+    encode advance
+      encode an advance-state request as binary EvmAdvance calldata.
+      The JSON object must contain chain_id, app_contract, msg_sender,
+      block_number, block_timestamp, prev_randao, index, and payload
+      fields.
+
+    encode inspect
+      write the raw inspect-state query payload bytes to stdout. The
+      JSON object must contain a single payload field.
+
+  decode <type>    binary stdin -> JSON stdout
+
+    decode advance
+      decode an advance-state request, printing a JSON object with
+      chain_id, app_contract, msg_sender, block_number, block_timestamp,
+      prev_randao, index, and payload fields.
+
+    decode inspect
+      wrap the raw query payload bytes in a JSON object with a single
+      payload field.
+
+    decode voucher
+      decode a voucher, printing destination, value, and payload.
+
+    decode delegate-call-voucher
+      decode a delegate-call voucher, printing destination and payload.
+
+    decode notice
+      decode a notice, printing the payload.
+
+    decode report
+    decode exception
+      print a JSON object with a single payload field carrying the raw
+      payload bytes hex-encoded.
+
+  where
+    chain_id, block_number, block_timestamp, and index are non-negative
+      integers,
+    app_contract and msg_sender are 20-byte EVM addresses in hex,
+    prev_randao is a big-endian 32-byte unsigned integer in hex, and
+    payload fields are 0x-prefixed hex strings.
+
+]]
+
+-- Convert a uint256 bint to a 0x-prefixed 64-character hex string. evmu.bint is a 512-bit
+-- instance, so tobe() returns 64 bytes, of which only the last 32 are the uint256 value.
+local function uint256_to_hex(v)
+    local be = evmu.bint.tobe(v)
+    return evmu.encode_hex(be:sub(33))
+end
+
+local function read_json_stdin()
+    -- Read all of stdin and decode it; a decode error message becomes a Lua error.
+    local decoded, _, problem = json.decode(io.read("a"))
+    if problem then
+        error("invalid JSON on stdin: " .. problem)
+    end
+    return decoded
+end
+
+local function write_json(t, order)
+    local text = json.encode(t, { indent = true, keyorder = order }) -- order is passed on as keyorder
+    io.write(text, "\n")
+end
+
+local function require_field(t, key)
+    local v = t[key]
+    if v ~= nil then
+        return v -- false counts as present; only nil is "missing"
+    end
+    error("missing required field: " .. key)
+end
+
+local encoders = {}
+local decoders = {}
+
+function encoders.advance()
+    -- Numeric fields go through bint.new; addresses and payload are passed on as given.
+    local req, big = read_json_stdin(), evmu.bint.new
+    local calldata = evmu.encode_calldata(EVM_ADVANCE, {
+        big(require_field(req, "chain_id")),
+        require_field(req, "app_contract"),
+        require_field(req, "msg_sender"),
+        big(require_field(req, "block_number")),
+        big(require_field(req, "block_timestamp")),
+        big(require_field(req, "prev_randao")),
+        big(require_field(req, "index")),
+        require_field(req, "payload"),
+    })
+    io.write(calldata)
+end
+
+function encoders.inspect()
+    local hex = require_field(read_json_stdin(), "payload") -- hex text of the query payload
+    io.write(assert(evmu.decode_hex(hex)))
+end
+
+function decoders.advance()
+    local args = evmu.decode_calldata(EVM_ADVANCE, io.read("a")) -- positional, in signature order
+    local order = {
+        "chain_id",
+        "app_contract",
+        "msg_sender",
+        "block_number",
+        "block_timestamp",
+        "prev_randao",
+        "index",
+        "payload",
+    }
+    write_json({
+        chain_id = evmu.bint.touinteger(args[1]),
+        app_contract = args[2],
+        msg_sender = args[3],
+        block_number = evmu.bint.touinteger(args[4]),
+        block_timestamp = evmu.bint.touinteger(args[5]),
+        prev_randao = uint256_to_hex(args[6]),
+        index = evmu.bint.touinteger(args[7]),
+        payload = args[8],
+    }, order)
+end
+
+decoders.inspect = function()
+    write_json({ payload = evmu.encode_hex(io.read("a")) }, { "payload" }) -- raw query bytes, hex-encoded
+end
+
+function decoders.voucher()
+    -- Decode a Voucher record read from stdin. The decoded arguments are positional and
+    -- follow the Voucher(address,uint256,bytes) signature.
+    local args = evmu.decode_calldata(VOUCHER, io.read("a"))
+    -- The uint256 value is rendered through uint256_to_hex.
+    local record = { destination = args[1], value = uint256_to_hex(args[2]), payload = args[3] }
+    write_json(record, { "destination", "value", "payload" })
+end
+
+decoders["delegate-call-voucher"] = function()
+    -- Decode a DelegateCallVoucher record read from stdin.
+    local args = evmu.decode_calldata(DELEGATE, io.read("a"))
+    -- Arguments are positional: destination first, payload second.
+    local record = { destination = args[1], payload = args[2] }
+    write_json(record, { "destination", "payload" })
+end
+
+function decoders.notice()
+    local payload = evmu.decode_calldata(NOTICE, io.read("a"))[1] -- Notice(bytes) has one argument
+    write_json({ payload = payload }, { "payload" })
+end
+
+local function decode_raw_payload()
+    local raw = io.read("a") -- the record is the payload itself, with no envelope to decode
+    write_json({ payload = evmu.encode_hex(raw) }, { "payload" })
+end
+decoders.report, decoders.exception = decode_raw_payload, decode_raw_payload
+
+-- Usage errors: print the help text to stderr and exit with status 1.
+local function fail()
+    io.stderr:write(USAGE)
+    os.exit(1)
+end
+
+local direction = arg[1]
+if direction == "-h" or direction == "--help" then
+    io.stderr:write(USAGE)
+    os.exit(0)
+elseif not direction then
+    fail()
+end
+
+-- The direction selects the handler table; the record type selects the handler in it.
+local handlers = ({ encode = encoders, decode = decoders })[direction]
+if not handlers then
+    fail()
+end
+local h = handlers[arg[2] or ""]
+if not h then
+    fail()
+end
+h()
diff --git a/doc/recipes/cycle-of.sh b/doc/recipes/cycle-of.sh
new file mode 100755
index 000000000..920a915e7
--- /dev/null
+++ b/doc/recipes/cycle-of.sh
@@ -0,0 +1,7 @@
+#!/bin/bash
+# Print the cycle count from the first "Cycles:" line after the Nth line matching PATTERN.
+# Usage: cycle-of.sh PATTERN [N]   (N defaults to 1)
+awk -v pat="$1" -v n="${2:-1}" '
+    ($0 ~ pat) && (++seen == n) { armed = 1; next }
+    armed && $1 == "Cycles:" { print $2; exit }
+'
diff --git a/doc/recipes/dishonest.lua b/doc/recipes/dishonest.lua
new file mode 100644
index 000000000..e83903c92
--- /dev/null
+++ b/doc/recipes/dishonest.lua
@@ -0,0 +1,91 @@
+-- A composite presents the machine interface backed by two machines and switches from the
+-- first to the second at a given point (mcycle, uarch_cycle), reporting the first up to and
+-- including the point and the second after. run pins the step's mcycle, since the uarch
+-- advances mcycle on its own and a live read mid-step would place the switch wrong. Only the
+-- active machine advances, the second having been run to the switch mcycle once at
+-- construction. Forking forks both. Only the switching methods are defined below, the rest
+-- fall through to the active machine.
+-- First access caches the result on the instance, so later accesses skip __index. A defined
+-- method copies over as is. An undefined key naming a function on the active machine becomes a
+-- forwarding method, built once and shared on composite_meta. Any other value passes through
+-- uncached, since it may change.
+local composite_meta = {}
+composite_meta.__index = function(self, key)
+    local handler = composite_meta[key]
+    if not handler then
+        local target = self.active[key]
+        if type(target) ~= "function" then
+            return target -- plain value: passed through uncached, since it may change
+        end
+        -- Build the forwarder once and share it through composite_meta.
+        handler = function(this, ...)
+            return this.active[key](this.active, ...)
+        end
+        composite_meta[key] = handler
+    end
+    self[key] = handler
+    return handler
+end
+
+-- True when (mcycle, uarch_cycle) lies strictly after the cheat point, comparing mcycle first.
+local function past_cheat(self, mcycle, uarch_cycle)
+    if mcycle == self.cheat_mcycle then
+        return uarch_cycle > self.cheat_uarch_cycle
+    end
+    return mcycle > self.cheat_mcycle
+end
+
+local function new_composite_machine(real_machine, cheat_mcycle, cheat_uarch_cycle, cheat_machine)
+    -- The second machine is run to the switch mcycle once, here.
+    cheat_machine:run(cheat_mcycle)
+    -- The composite starts on the first machine, with its pinned mcycle at 0.
+    local composite = setmetatable({ active = real_machine, mcycle = 0 }, composite_meta)
+    -- The remaining fields are plain assignments: composite_meta defines no __newindex.
+    composite.real_machine, composite.cheat_machine = real_machine, cheat_machine
+    -- The switch point is kept as the pair (cheat_mcycle, cheat_uarch_cycle).
+    composite.cheat_mcycle, composite.cheat_uarch_cycle = cheat_mcycle, cheat_uarch_cycle
+    return composite
+end
+
+function composite_meta.fork_server(self)
+    local real, cheat = assert(self.real_machine:fork_server()), assert(self.cheat_machine:fork_server())
+    return setmetatable({
+        real_machine = real,
+        cheat_machine = cheat,
+        active = real, -- a fork always starts on its first machine, whatever self.active is
+        mcycle = self.mcycle,
+        cheat_mcycle = self.cheat_mcycle,
+        cheat_uarch_cycle = self.cheat_uarch_cycle,
+    }, composite_meta)
+end
+
+function composite_meta.run(self, m)
+    self.mcycle = m -- pinned here; run_uarch judges the switch against this value
+    self.active = past_cheat(self, m, 0) and self.cheat_machine or self.real_machine
+    return self.active:run(m) -- hand back the active machine's result, as the forwarded methods do
+end
+
+-- The uarch stays within the pinned mcycle, so the switch is judged against that, not the
+-- live mcycle the uarch advances. Returns whatever the active machine's run_uarch returns.
+function composite_meta.run_uarch(self, u)
+    self.active = past_cheat(self, self.mcycle, u) and self.cheat_machine or self.real_machine
+    return self.active:run_uarch(u)
+end
+
+function composite_meta.shutdown_server(self)
+    self.real_machine:shutdown_server() -- both servers are shut down, not only the active one
+    self.cheat_machine:shutdown_server()
+end
+
+-- The log methods always report the second machine, rolled to the current position. self is
+-- always an ephemeral fork here, so rolling it forward in place is fine.
+-- Both methods share one body; only the logging call made on the second machine differs.
+for _, name in ipairs({ "log_step_uarch", "log_reset_uarch" }) do
+    composite_meta[name] = function(self, log_type)
+        local cheat = self.cheat_machine
+        cheat:run_uarch(self.active:read_reg("uarch_cycle"))
+        return cheat[name](cheat, log_type)
+    end
+end
+
+return { new_composite_machine = new_composite_machine }
diff --git a/doc/recipes/dump-default-config.lua b/doc/recipes/dump-default-config.lua
new file mode 100644
index 000000000..c6cdcba9c
--- /dev/null
+++ b/doc/recipes/dump-default-config.lua
@@ -0,0 +1,10 @@
+-- Load the Cartesi module and utilities
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+
+-- Obtain the default machine configuration
+local default_config = cartesi.machine:get_default_config()
+
+-- Pretty-print it to stdout, prefixed with "return " so the output reads as a Lua chunk
+io.write("return ")
+util.dump_table(default_config, io.stdout)
diff --git a/doc/recipes/dump-uarch-step.lua b/doc/recipes/dump-uarch-step.lua
new file mode 100644
index 000000000..585fbfb87
--- /dev/null
+++ b/doc/recipes/dump-uarch-step.lua
@@ -0,0 +1,20 @@
+-- Load the Cartesi modules
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+
+-- Instantiate machine from configuration (arg[1] is a module name resolved by require, not a file path)
+local config = require(arg[1])
+local machine = cartesi.machine(config)
+
+-- Advance to the requested mcycle and uarch_cycle, failing if either target is not reached
+local mcycle = assert(tonumber(arg[2]), "missing mcycle")
+local ucycle = assert(tonumber(arg[3]), "missing uarch_cycle")
+machine:run(mcycle)
+assert(machine:read_reg("mcycle") == mcycle, "machine halted or yielded early")
+machine:run_uarch(ucycle)
+assert(machine:read_reg("uarch_cycle") == ucycle, "uarch halted before target")
+
+-- Obtain access log and dump it to stderr
+local log = machine:log_step_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS)
+io.stderr:write(string.format("\nAccess log of uarch step at mcycle=%u uarch_cycle=%u:\n\n", mcycle, ucycle))
+util.print_log(log, io.stderr)
diff --git a/doc/recipes/find-hash.sh b/doc/recipes/find-hash.sh
new file mode 100755
index 000000000..5ec15410d
--- /dev/null
+++ b/doc/recipes/find-hash.sh
@@ -0,0 +1,2 @@
+#!/bin/bash
+grep -oP "\"*$1\"*: \"*\K[a-fA-F0-9]{64}" | head -1  # first 64-hex-digit value after key $1 (quotes optional) and ": "
diff --git a/doc/recipes/find-htif-putchar.lua b/doc/recipes/find-htif-putchar.lua
new file mode 100644
index 000000000..f6eda5143
--- /dev/null
+++ b/doc/recipes/find-htif-putchar.lua
@@ -0,0 +1,15 @@
+local cartesi = require("cartesi")
+
+local config = require("config-nothing-to-do")
+local runtime = { console = { output_destination = "to_buffer", output_flush_mode = "every_line" } }
+local machine = cartesi.machine(config, runtime)
+
+-- Consume console output until the 8th console-output break, then write mcycle - 1 to stderr.
+local remaining = 8
+while remaining > 0 and machine:run() == cartesi.BREAK_REASON_CONSOLE_OUTPUT do
+    machine:read_console_output()
+    remaining = remaining - 1
+end
+if remaining == 0 then
+    io.stderr:write(machine:read_reg("mcycle") - 1)
+end
diff --git a/doc/recipes/find-lua-val.sh b/doc/recipes/find-lua-val.sh
new file mode 100755
index 000000000..de9bdd01b
--- /dev/null
+++ b/doc/recipes/find-lua-val.sh
@@ -0,0 +1,2 @@
+#!/bin/bash
+grep -oP "\"*$1\"* = \"*\K(0x[0-9a-fA-F]+|-?[0-9]+)" | head -1  # first hex (0x...) or decimal integer after key $1 and " = "
diff --git a/doc/recipes/find-uarch-putchar-ecall.lua b/doc/recipes/find-uarch-putchar-ecall.lua
new file mode 100644
index 000000000..3e156e76d
--- /dev/null
+++ b/doc/recipes/find-uarch-putchar-ecall.lua
@@ -0,0 +1,25 @@
+local cartesi = require("cartesi")
+
+local target_mcycle = assert(tonumber(arg[1]), "missing argument: mcycle")
+local machine = cartesi.machine(require("config-nothing-to-do"))
+machine:run(target_mcycle)
+
+-- True when the word at uarch_pc is an ecall and uarch_x17 selects the putchar function.
+local ECALL_WORD = 0x00000073
+local function at_putchar_ecall()
+    local word = string.unpack("<I4", machine:read_memory(machine:read_reg("uarch_pc"), 4))
+    return word == ECALL_WORD and machine:read_reg("uarch_x17") == cartesi.UARCH_ECALL_FN_PUTCHAR
+end
+
+while machine:read_reg("uarch_halt_flag") == 0 do
+    local cycle = machine:read_reg("uarch_cycle")
+    if at_putchar_ecall() then
+        io.stderr:write(cycle)
+        return
+    end
+    machine:run_uarch(cycle + 1)
+    if cycle % 100000 == 0 then
+        collectgarbage("collect")
+    end
+end
+error("putchar ecall not found before uarch halt")
diff --git a/doc/recipes/hash-of.sh b/doc/recipes/hash-of.sh
new file mode 100755
index 000000000..f70040961
--- /dev/null
+++ b/doc/recipes/hash-of.sh
@@ -0,0 +1,7 @@
+#!/bin/bash
+# After the first line matching PATTERN, print the second field of the Nth two-field line
+# whose second field is 64 characters long. Usage: hash-of.sh PATTERN [N]   (N defaults to 1)
+awk -v pat="$1" -v n="${2:-1}" '
+    found && NF == 2 && length($2) == 64 && (++seen == n) { print $2; exit }
+    !found && ($0 ~ pat) { found = 1 }
+'
diff --git a/doc/recipes/hello.ext2 b/doc/recipes/hello.ext2
new file mode 100644
index 000000000..0d7d0731f
Binary files /dev/null and b/doc/recipes/hello.ext2 differ
diff --git a/doc/recipes/hello/all.sh b/doc/recipes/hello/all.sh
new file mode 100755
index 000000000..6091d95f1
--- /dev/null
+++ b/doc/recipes/hello/all.sh
@@ -0,0 +1,18 @@
+#!/bin/sh
+# Run the hello-world samples from the directory this script lives in.
+cd "$(dirname "$0")" || exit 1
+
+./hello-c
+./hello-cpp
+./hello-rust
+./hello-go
+gforth hello.4th
+./hello.awk
+./hello.lua
+./hello.pl
+./hello.py
+./hello.sh
+./hello.tcl
+#./hello.js
+#./hello.rb
+#./hello.php
diff --git a/doc/recipes/hello/hello-cpp b/doc/recipes/hello/hello-cpp
new file mode 100755
index 000000000..f53929ce1
Binary files /dev/null and b/doc/recipes/hello/hello-cpp differ
diff --git a/doc/recipes/hello/hello.4th b/doc/recipes/hello/hello.4th
new file mode 100755
index 000000000..2a2dc862f
--- /dev/null
+++ b/doc/recipes/hello/hello.4th
@@ -0,0 +1,2 @@
+: main 6 1 do i 0 .r ." : Hello world from Forth!" cr loop ; \ i runs 1..5; "0 .r" prints it without padding
+main bye \ run main, then leave the interpreter
diff --git a/doc/recipes/hello/hello.awk b/doc/recipes/hello/hello.awk
new file mode 100644
index 000000000..1e62dcf7b
--- /dev/null
+++ b/doc/recipes/hello/hello.awk
@@ -0,0 +1,6 @@
+#!/usr/bin/awk -f
+BEGIN {
+    # Five numbered greetings; no input is read.
+    for (n = 0; n < 5; n++)
+        printf("%d: Hello world from AWK!\n", n + 1)
+}
diff --git a/doc/recipes/hello/hello.c b/doc/recipes/hello/hello.c
new file mode 100644
index 000000000..292d41137
--- /dev/null
+++ b/doc/recipes/hello/hello.c
@@ -0,0 +1,7 @@
+#include <stdio.h>
+
+int main(void) {
+    /* Print five numbered greetings. */
+    for (int n = 0; n < 5; ++n)
+        printf("%d: Hello world from C!\n", n + 1);
+}
diff --git a/doc/recipes/hello/hello.cpp b/doc/recipes/hello/hello.cpp
new file mode 100644
index 000000000..b9a6a7af2
--- /dev/null
+++ b/doc/recipes/hello/hello.cpp
@@ -0,0 +1,7 @@
+#include <print>
+
+int main() {
+    // Print five numbered greetings.
+    for (int n = 0; n < 5; ++n)
+        std::println("{}: Hello world from C++!", n + 1);
+}
diff --git a/doc/recipes/hello/hello.go b/doc/recipes/hello/hello.go
new file mode 100644
index 000000000..b41c12c7c
--- /dev/null
+++ b/doc/recipes/hello/hello.go
@@ -0,0 +1,9 @@
+package main
+
+import "fmt"
+
+func main() {
+	for n := 0; n < 5; n++ { // five numbered greetings
+		fmt.Printf("%d: Hello world from Go!\n", n+1)
+	}
+}
diff --git a/doc/recipes/hello/hello.js b/doc/recipes/hello/hello.js
new file mode 100755
index 000000000..506e12cf0
--- /dev/null
+++ b/doc/recipes/hello/hello.js
@@ -0,0 +1,5 @@
+#!/usr/bin/env node
+
+for (var i = 0; i < 5; i++) {
+    console.log((i+1) + ": Hello world from JavaScript!")
+}
diff --git a/doc/recipes/hello/hello.lua b/doc/recipes/hello/hello.lua
new file mode 100755
index 000000000..3352c8fb3
--- /dev/null
+++ b/doc/recipes/hello/hello.lua
@@ -0,0 +1,5 @@
+#!/usr/bin/env lua5.4
+
+for n = 1, 5 do
+    io.write(n, ": Hello world from Lua!\n")
+end
diff --git a/doc/recipes/hello/hello.php b/doc/recipes/hello/hello.php
new file mode 100755
index 000000000..4ce88a488
--- /dev/null
+++ b/doc/recipes/hello/hello.php
@@ -0,0 +1,6 @@
+#!/usr/bin/env php
+<?php
+foreach (range(1, 5) as $n) {
+    echo "$n: Hello world from PHP!\n";
+}
+?>
diff --git a/doc/recipes/hello/hello.pl b/doc/recipes/hello/hello.pl
new file mode 100755
index 000000000..4c736ff78
--- /dev/null
+++ b/doc/recipes/hello/hello.pl
@@ -0,0 +1,5 @@
+#!/usr/bin/env perl
+
+foreach my $n (1..5) {
+	printf("%d: Hello world from Perl!\n", $n);
+}
diff --git a/doc/recipes/hello/hello.py b/doc/recipes/hello/hello.py
new file mode 100755
index 000000000..e854f7d47
--- /dev/null
+++ b/doc/recipes/hello/hello.py
@@ -0,0 +1,4 @@
+#!/usr/bin/env python3
+
+for i in range(0,5):
+    print("{}: Hello world from Python3".format(i+1))
diff --git a/doc/recipes/hello/hello.rb b/doc/recipes/hello/hello.rb
new file mode 100755
index 000000000..72b16dade
--- /dev/null
+++ b/doc/recipes/hello/hello.rb
@@ -0,0 +1,5 @@
+#!/usr/bin/env ruby
+
+for i in 1..5 do
+    puts "%d: Hello world from Ruby!" % i
+end
diff --git a/doc/recipes/hello/hello.rs b/doc/recipes/hello/hello.rs
new file mode 100644
index 000000000..4290f3bfb
--- /dev/null
+++ b/doc/recipes/hello/hello.rs
@@ -0,0 +1,5 @@
+fn main() {
+    for n in 1..=5 {
+        println!("{n}: Hello world from Rust!");
+    }
+}
diff --git a/doc/recipes/hello/hello.sh b/doc/recipes/hello/hello.sh
new file mode 100755
index 000000000..5d3ee4d73
--- /dev/null
+++ b/doc/recipes/hello/hello.sh
@@ -0,0 +1,5 @@
+#!/bin/sh
+
+for i in 1 2 3 4 5; do
+    echo "$i: Hello world from sh!"
+done
diff --git a/doc/recipes/hello/hello.tcl b/doc/recipes/hello/hello.tcl
new file mode 100755
index 000000000..0cb7e907f
--- /dev/null
+++ b/doc/recipes/hello/hello.tcl
@@ -0,0 +1,5 @@
+#!/usr/bin/env tclsh
+
+foreach i {1 2 3 4 5} {
+    puts "$i: Hello world from TCL!"
+}
diff --git a/doc/recipes/last-cycles.sh b/doc/recipes/last-cycles.sh
new file mode 100755
index 000000000..749e388f0
--- /dev/null
+++ b/doc/recipes/last-cycles.sh
@@ -0,0 +1,2 @@
+#!/bin/bash
+grep -oP 'Cycles: \K[0-9]+' | tail -1  # stdin filter: print the digits after the last "Cycles: " seen
diff --git a/doc/recipes/load-cat-foo-bar.lua b/doc/recipes/load-cat-foo-bar.lua
new file mode 100644
index 000000000..4ff102666
--- /dev/null
+++ b/doc/recipes/load-cat-foo-bar.lua
@@ -0,0 +1,10 @@
+-- Load the Cartesi module
+local cartesi = require("cartesi")
+
+-- Instantiate machine from persistent state directory
+local machine = cartesi.machine("cat-foo-bar")
+
+-- Run the machine until it halts or yields manually, resuming after any other break reason
+repeat
+    local break_reason = machine:run(math.maxinteger)
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
diff --git a/doc/recipes/minimal-config.lua b/doc/recipes/minimal-config.lua
new file mode 100644
index 000000000..095b42f3e
--- /dev/null
+++ b/doc/recipes/minimal-config.lua
@@ -0,0 +1,71 @@
+-- Reads a stored Lua machine config from the file given as argument, strips
+-- every field equal to the corresponding default value (recursively), removes
+-- subtables that become empty, and prints the result to stdout. Mirrors the
+-- equality test cartesi-machine.lua uses to annotate "-- default" lines.
+-- When the default has no entry for a field (typically a flash drive or NVRAM
+-- entry added by the user), an empty string or `false` value on the given
+-- config side is treated as default and dropped too.
+
+local cartesi = require("cartesi")
+
+local function prune(t, def)
+    if type(t) == "table" then
+        for k, v in pairs(t) do
+            local d = def and def[k]
+            local drop
+            if type(v) == "table" then
+                prune(v, type(d) == "table" and d or nil)
+                drop = next(v) == nil -- subtable emptied by pruning
+            else
+                drop = v == d or (d == nil and (v == "" or v == false))
+            end
+            if drop then
+                t[k] = nil -- clearing an existing field during traversal is allowed
+            end
+        end
+    end
+    return t
+end
+
+local function dump(out, what, indent)
+    if type(what) ~= "table" then
+        local fmt = math.type(what) == "integer" and "0x%x" or "%q" -- integers in hex, the rest via %q
+        out:write(string.format(fmt, what))
+        return
+    end
+    local keys = {}
+    for k in pairs(what) do
+        table.insert(keys, k)
+    end
+    if next(keys) == nil then
+        out:write("{}")
+        return
+    end
+    -- Numeric keys sort before string keys; within one type, ascending order.
+    table.sort(keys, function(a, b)
+        if type(a) ~= type(b) then
+            return type(a) == "number"
+        end
+        return a < b
+    end)
+    local inner = indent .. "  "
+    out:write("{\n")
+    for i = 1, #keys do
+        local k = keys[i]
+        if type(k) == "string" then
+            out:write(inner, k, " = ")
+        else
+            out:write(inner)
+        end
+        dump(out, what[k], inner)
+        out:write(",\n")
+    end
+    out:write(indent, "}")
+end
+
+local config_path = assert(arg[1], "usage: minimal-config.lua <config.lua>")
+local chunk = assert(loadfile(config_path, "t")) -- mode "t": text chunks only
+local config = chunk()
+local pruned = prune(config, cartesi.machine:get_default_config())
+io.write("return ")
+dump(io.stdout, pruned, "")
+io.write("\n")
diff --git a/doc/recipes/puppet.c b/doc/recipes/puppet.c
new file mode 100644
index 000000000..8455e0308
--- /dev/null
+++ b/doc/recipes/puppet.c
@@ -0,0 +1,78 @@
+/* Puppet: a libcmt rollup target driven by its inputs.
+ *
+ * Each advance-state payload is a command of the form "verb:data" (or
+ * a bare verb without a colon).  The verb selects the libcmt call; the
+ * data after the colon is the bytes the call receives.
+ *
+ *   notice:<data>     -> cmt_rollup_emit_notice(data), accept
+ *   report:<data>     -> cmt_rollup_emit_report(data), accept
+ *   voucher:<data>    -> cmt_rollup_emit_voucher(msg_sender, 0, data),
+ *                        accept
+ *   exception:<data>  -> cmt_rollup_emit_exception(data); halts
+ *   exit              -> break out of the loop and return from main;
+ *                        the machine halts on its own
+ *   <anything else>   -> reject the advance; the host rolls the state
+ *                        back
+ *
+ * An inspect-state query is echoed back as a single report, accepted.
+ */
+
+#include <string.h>
+#include "libcmt/rollup.h"
+
+/* Tests whether payload is the bare verb or starts with "verb:".
+ * On a match returns 1 and sets *data to the bytes after the colon
+ * (NULL with length 0 for a bare verb); otherwise returns 0 and
+ * leaves *data untouched. */
+static int verb_match(const cmt_abi_bytes_t *payload, const char *verb, cmt_abi_bytes_t *data) {
+    const size_t n = strlen(verb);
+    const char *bytes = (const char *) payload->data;
+    if (payload->length < n || memcmp(bytes, verb, n) != 0) return 0;
+    const int bare = payload->length == n;
+    if (!bare && bytes[n] != ':') return 0; /* e.g. "notices" is not "notice" */
+    data->data = bare ? NULL : (char *) payload->data + n + 1;
+    data->length = bare ? 0 : payload->length - n - 1;
+    return 1;
+}
+
+/* Entry point. Initialises libcmt and issues the first finish, then handles
+ * one request per iteration until an "exit" command arrives or a libcmt
+ * read/finish call fails. Returns 1 only when start-up fails; every other
+ * path calls cmt_rollup_fini and returns 0. */
+int main(void) {
+    cmt_rollup_t rollup;
+    cmt_rollup_finish_t finish = { .accept_previous_request = true };
+    if (cmt_rollup_init(&rollup) < 0 || cmt_rollup_finish(&rollup, &finish) < 0) return 1;
+
+    do {
+        /* Accept by default; only an unrecognised advance command rejects. */
+        finish.accept_previous_request = true;
+        if (finish.next_request_type == HTIF_YIELD_REASON_ADVANCE_STATE) {
+            cmt_rollup_advance_t advance;
+            cmt_abi_bytes_t data;
+            if (cmt_rollup_read_advance_state(&rollup, &advance) < 0) break;
+            const cmt_abi_bytes_t *cmd = &advance.payload;
+            if (verb_match(cmd, "notice", &data)) {
+                cmt_rollup_emit_notice(&rollup, &data, NULL);
+            } else if (verb_match(cmd, "report", &data)) {
+                cmt_rollup_emit_report(&rollup, &data);
+            } else if (verb_match(cmd, "voucher", &data)) {
+                cmt_abi_u256_t value = {{0}}; /* voucher carries a zero value */
+                cmt_rollup_emit_voucher(&rollup, &advance.msg_sender, &value, &data, NULL);
+            } else if (verb_match(cmd, "exception", &data)) {
+                cmt_rollup_emit_exception(&rollup, &data);
+            } else if (verb_match(cmd, "exit", &data) && data.length == 0) {
+                break; /* leave the loop without issuing another finish */
+            } else {
+                finish.accept_previous_request = false;
+            }
+        } else if (finish.next_request_type == HTIF_YIELD_REASON_INSPECT_STATE) {
+            cmt_rollup_inspect_t inspect;
+            if (cmt_rollup_read_inspect_state(&rollup, &inspect) < 0) break;
+            cmt_rollup_emit_report(&rollup, &inspect.payload); /* echo the query */
+        }
+    } while (cmt_rollup_finish(&rollup, &finish) >= 0);
+
+    cmt_rollup_fini(&rollup);
+    return 0;
+}
diff --git a/doc/recipes/rootfs-docs.ext2 b/doc/recipes/rootfs-docs.ext2
new file mode 100644
index 000000000..1513d314f
--- /dev/null
+++ b/doc/recipes/rootfs-docs.ext2
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fe62e2afa2d46eb85b79380f7fce5e47c9852c0b4c93ca751fe96923b555843c
+size 156131328
diff --git a/doc/recipes/rootfs-docs.licenses.md b/doc/recipes/rootfs-docs.licenses.md
new file mode 100644
index 000000000..6bc8b2f6c
--- /dev/null
+++ b/doc/recipes/rootfs-docs.licenses.md
@@ -0,0 +1,2308 @@
+# `cartesi/rootfs-docs`
+
+
+## `dpkg` (`.deb`-based packages)
+
+### `dpkg` source package: `acl=2.3.2-1build1.1`
+
+Binary Packages:
+
+- `libacl1:riscv64=2.3.2-1build1.1`
+
+Licenses: (parsed from: `/usr/share/doc/libacl1/copyright`)
+
+- `GPL-2`
+- `GPL-2+`
+- `LGPL-2+`
+- `LGPL-2.1`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris acl=2.3.2-1build1.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/acl/acl_2.3.2.orig.tar.xz' acl_2.3.2.orig.tar.xz 371680
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/acl/acl_2.3.2.orig.tar.xz.asc' acl_2.3.2.orig.tar.xz.asc 833
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/acl/acl_2.3.2-1build1.1.debian.tar.xz' acl_2.3.2-1build1.1.debian.tar.xz 23472
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/acl/acl_2.3.2-1build1.1.dsc' acl_2.3.2-1build1.1.dsc 2616
+```
+
+### `dpkg` source package: `apt=2.8.3`
+
+Binary Packages:
+
+- `apt:riscv64=2.8.3`
+- `libapt-pkg6.0t64:riscv64=2.8.3`
+
+Licenses: (parsed from: `/usr/share/doc/apt/copyright`, `/usr/share/doc/libapt-pkg6.0t64/copyright`)
+
+- `BSD-3-clause`
+- `Expat`
+- `GPL-2`
+- `GPL-2+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris apt=2.8.3
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/apt/apt_2.8.3.tar.xz' apt_2.8.3.tar.xz 2354680
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/apt/apt_2.8.3.dsc' apt_2.8.3.dsc 2973
+```
+
+### `dpkg` source package: `attr=1:2.5.2-1build1.1`
+
+Binary Packages:
+
+- `libattr1:riscv64=1:2.5.2-1build1.1`
+
+Licenses: (parsed from: `/usr/share/doc/libattr1/copyright`)
+
+- `GPL-2`
+- `GPL-2+`
+- `LGPL-2+`
+- `LGPL-2.1`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris attr=1:2.5.2-1build1.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/attr/attr_2.5.2.orig.tar.xz' attr_2.5.2.orig.tar.xz 334180
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/attr/attr_2.5.2.orig.tar.xz.asc' attr_2.5.2.orig.tar.xz.asc 833
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/attr/attr_2.5.2-1build1.1.debian.tar.xz' attr_2.5.2-1build1.1.debian.tar.xz 26032
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/attr/attr_2.5.2-1build1.1.dsc' attr_2.5.2-1build1.1.dsc 2588
+```
+
+### `dpkg` source package: `audit=1:3.1.2-2.1build1.1`
+
+Binary Packages:
+
+- `libaudit-common=1:3.1.2-2.1build1.1`
+- `libaudit1:riscv64=1:3.1.2-2.1build1.1`
+
+Licenses: (parsed from: `/usr/share/doc/libaudit-common/copyright`, `/usr/share/doc/libaudit1/copyright`)
+
+- `GPL-1`
+- `GPL-2`
+- `LGPL-2.1`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris audit=1:3.1.2-2.1build1.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/audit/audit_3.1.2.orig.tar.gz' audit_3.1.2.orig.tar.gz 1219860
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/audit/audit_3.1.2-2.1build1.1.debian.tar.xz' audit_3.1.2-2.1build1.1.debian.tar.xz 18860
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/a/audit/audit_3.1.2-2.1build1.1.dsc' audit_3.1.2-2.1build1.1.dsc 2848
+```
+
+### `dpkg` source package: `base-files=13ubuntu10.4`
+
+Binary Packages:
+
+- `base-files:riscv64=13ubuntu10.4`
+
+Licenses: (parsed from: `/usr/share/doc/base-files/copyright`)
+
+- `GPL`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris base-files=13ubuntu10.4
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/base-files/base-files_13ubuntu10.4.tar.xz' base-files_13ubuntu10.4.tar.xz 94240
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/base-files/base-files_13ubuntu10.4.dsc' base-files_13ubuntu10.4.dsc 1642
+```
+
+### `dpkg` source package: `base-passwd=3.6.3build1`
+
+Binary Packages:
+
+- `base-passwd:riscv64=3.6.3build1`
+
+Licenses: (parsed from: `/usr/share/doc/base-passwd/copyright`)
+
+- `GPL-2`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris base-passwd=3.6.3build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/base-passwd/base-passwd_3.6.3build1.dsc' base-passwd_3.6.3build1.dsc 1779
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/base-passwd/base-passwd_3.6.3build1.tar.xz' base-passwd_3.6.3build1.tar.xz 58252
+```
+
+### `dpkg` source package: `bash=5.2.21-2ubuntu4`
+
+Binary Packages:
+
+- `bash:riscv64=5.2.21-2ubuntu4`
+
+Licenses: (parsed from: `/usr/share/doc/bash/copyright`)
+
+- `BSD-4-clause-UC`
+- `GFDL-1.3`
+- `GFDL-NIV-1.3`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3`
+- `GPL-3+`
+- `GPL-3+ with Bison exception`
+- `Latex2e`
+- `MIT-like`
+- `permissive`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris bash=5.2.21-2ubuntu4
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/bash/bash_5.2.21-2ubuntu4.dsc' bash_5.2.21-2ubuntu4.dsc 2437
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/bash/bash_5.2.21.orig.tar.xz' bash_5.2.21.orig.tar.xz 5598816
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/bash/bash_5.2.21-2ubuntu4.debian.tar.xz' bash_5.2.21-2ubuntu4.debian.tar.xz 94124
+```
+
+### `dpkg` source package: `bc=1.07.1-3ubuntu4`
+
+Binary Packages:
+
+- `bc:riscv64=1.07.1-3ubuntu4`
+
+Licenses: (parsed from: `/usr/share/doc/bc/copyright`)
+
+- `GPL-2`
+- `GPL-2.0+`
+- `GPL-2.0+ with Texinfo exception`
+- `X11`
+- `permissive`
+- `permissive'`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris bc=1.07.1-3ubuntu4
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/bc/bc_1.07.1-3ubuntu4.dsc' bc_1.07.1-3ubuntu4.dsc 2018
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/bc/bc_1.07.1.orig.tar.gz' bc_1.07.1.orig.tar.gz 419850
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/bc/bc_1.07.1-3ubuntu4.debian.tar.xz' bc_1.07.1-3ubuntu4.debian.tar.xz 23888
+```
+
+### `dpkg` source package: `brotli=1.1.0-2build2`
+
+Binary Packages:
+
+- `libbrotli1:riscv64=1.1.0-2build2`
+
+Licenses: (parsed from: `/usr/share/doc/libbrotli1/copyright`)
+
+- `MIT`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris brotli=1.1.0-2build2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/brotli/brotli_1.1.0-2build2.dsc' brotli_1.1.0-2build2.dsc 2401
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/brotli/brotli_1.1.0.orig.tar.gz' brotli_1.1.0.orig.tar.gz 512036
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/brotli/brotli_1.1.0-2build2.debian.tar.xz' brotli_1.1.0-2build2.debian.tar.xz 5644
+```
+
+### `dpkg` source package: `busybox=1:1.36.1-6ubuntu3.1`
+
+Binary Packages:
+
+- `busybox-static:riscv64=1:1.36.1-6ubuntu3.1`
+
+Licenses: (parsed from: `/usr/share/doc/busybox-static/copyright`)
+
+- `GPL-2`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris busybox=1:1.36.1-6ubuntu3.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/busybox/busybox_1.36.1.orig.tar.bz2' busybox_1.36.1.orig.tar.bz2 2525473
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/busybox/busybox_1.36.1.orig.tar.bz2.asc' busybox_1.36.1.orig.tar.bz2.asc 195
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/busybox/busybox_1.36.1-6ubuntu3.1.debian.tar.xz' busybox_1.36.1-6ubuntu3.1.debian.tar.xz 84488
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/busybox/busybox_1.36.1-6ubuntu3.1.dsc' busybox_1.36.1-6ubuntu3.1.dsc 2711
+```
+
+### `dpkg` source package: `bzip2=1.0.8-5.1build0.1`
+
+Binary Packages:
+
+- `libbz2-1.0:riscv64=1.0.8-5.1build0.1`
+
+Licenses: (parsed from: `/usr/share/doc/libbz2-1.0/copyright`)
+
+- `BSD-variant`
+- `GPL-2`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris bzip2=1.0.8-5.1build0.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/bzip2/bzip2_1.0.8.orig.tar.gz' bzip2_1.0.8.orig.tar.gz 810029
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/bzip2/bzip2_1.0.8-5.1build0.1.debian.tar.bz2' bzip2_1.0.8-5.1build0.1.debian.tar.bz2 26927
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/b/bzip2/bzip2_1.0.8-5.1build0.1.dsc' bzip2_1.0.8-5.1build0.1.dsc 2220
+```
+
+### `dpkg` source package: `cdebconf=0.271ubuntu3`
+
+Binary Packages:
+
+- `libdebconfclient0:riscv64=0.271ubuntu3`
+
+Licenses: (parsed from: `/usr/share/doc/libdebconfclient0/copyright`)
+
+- `BSD-2-Clause`
+- `BSD-2-clause`
+- `GPL-2`
+- `GPL-2+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris cdebconf=0.271ubuntu3
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/c/cdebconf/cdebconf_0.271ubuntu3.dsc' cdebconf_0.271ubuntu3.dsc 2910
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/c/cdebconf/cdebconf_0.271ubuntu3.tar.xz' cdebconf_0.271ubuntu3.tar.xz 285500
+```
+
+### `dpkg` source package: `coreutils=9.4-3ubuntu6.2`
+
+Binary Packages:
+
+- `coreutils:riscv64=9.4-3ubuntu6.2`
+
+Licenses: (parsed from: `/usr/share/doc/coreutils/copyright`)
+
+- `BSD-4-clause-UC`
+- `FSFULLR`
+- `GFDL-1.3`
+- `GFDL-NIV-1.3`
+- `GPL-3`
+- `GPL-3+`
+- `ISC`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris coreutils=9.4-3ubuntu6.2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/c/coreutils/coreutils_9.4.orig.tar.xz' coreutils_9.4.orig.tar.xz 5979200
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/c/coreutils/coreutils_9.4-3ubuntu6.2.debian.tar.xz' coreutils_9.4-3ubuntu6.2.debian.tar.xz 42032
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/c/coreutils/coreutils_9.4-3ubuntu6.2.dsc' coreutils_9.4-3ubuntu6.2.dsc 2030
+```
+
+### `dpkg` source package: `curl=8.5.0-2ubuntu10.9`
+
+Binary Packages:
+
+- `curl:riscv64=8.5.0-2ubuntu10.9`
+- `libcurl4t64:riscv64=8.5.0-2ubuntu10.9`
+
+Licenses: (parsed from: `/usr/share/doc/curl/copyright`, `/usr/share/doc/libcurl4t64/copyright`)
+
+- `BSD-3-Clause`
+- `BSD-3-clause`
+- `BSD-4-Clause-UC`
+- `FSFULLR`
+- `GPL-2`
+- `GPL-2+ with Autoconf-data exception`
+- `GPL-2+ with Libtool exception`
+- `GPL-3+ with Autoconf-data exception`
+- `ISC`
+- `OLDAP-2.8`
+- `X11`
+- `curl`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris curl=8.5.0-2ubuntu10.9
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/c/curl/curl_8.5.0.orig.tar.gz' curl_8.5.0.orig.tar.gz 4372979
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/c/curl/curl_8.5.0-2ubuntu10.9.debian.tar.xz' curl_8.5.0-2ubuntu10.9.debian.tar.xz 76576
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/c/curl/curl_8.5.0-2ubuntu10.9.dsc' curl_8.5.0-2ubuntu10.9.dsc 3051
+```
+
+### `dpkg` source package: `cyrus-sasl2=2.1.28+dfsg1-5ubuntu3.1`
+
+Binary Packages:
+
+- `libsasl2-2:riscv64=2.1.28+dfsg1-5ubuntu3.1`
+- `libsasl2-modules-db:riscv64=2.1.28+dfsg1-5ubuntu3.1`
+
+Licenses: (parsed from: `/usr/share/doc/libsasl2-2/copyright`, `/usr/share/doc/libsasl2-modules-db/copyright`)
+
+- `BSD-2-clause`
+- `BSD-2.2-clause`
+- `BSD-3-Clause-Attribution`
+- `BSD-3-clause`
+- `BSD-3-clause-JANET`
+- `BSD-3-clause-PADL`
+- `BSD-4-clause-UC`
+- `FSFULLR`
+- `GPL-3`
+- `GPL-3+`
+- `IBM-as-is`
+- `MIT-CMU`
+- `MIT-Export`
+- `MIT-OpenVision`
+- `OpenLDAP`
+- `RSA-MD`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris cyrus-sasl2=2.1.28+dfsg1-5ubuntu3.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/c/cyrus-sasl2/cyrus-sasl2_2.1.28%2bdfsg1.orig.tar.xz' cyrus-sasl2_2.1.28+dfsg1.orig.tar.xz 794540
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/c/cyrus-sasl2/cyrus-sasl2_2.1.28%2bdfsg1-5ubuntu3.1.debian.tar.xz' cyrus-sasl2_2.1.28+dfsg1-5ubuntu3.1.debian.tar.xz 98324
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/c/cyrus-sasl2/cyrus-sasl2_2.1.28%2bdfsg1-5ubuntu3.1.dsc' cyrus-sasl2_2.1.28+dfsg1-5ubuntu3.1.dsc 3501
+```
+
+### `dpkg` source package: `dash=0.5.12-6ubuntu5`
+
+Binary Packages:
+
+- `dash:riscv64=0.5.12-6ubuntu5`
+
+Licenses: (parsed from: `/usr/share/doc/dash/copyright`)
+
+- `BSD-3-Clause`
+- `BSD-3-clause`
+- `GPL-2`
+- `GPL-2+`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris dash=0.5.12-6ubuntu5
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/dash/dash_0.5.12-6ubuntu5.dsc' dash_0.5.12-6ubuntu5.dsc 2124
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/dash/dash_0.5.12.orig.tar.gz' dash_0.5.12.orig.tar.gz 246054
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/dash/dash_0.5.12-6ubuntu5.debian.tar.xz' dash_0.5.12-6ubuntu5.debian.tar.xz 39616
+```
+
+### `dpkg` source package: `db5.3=5.3.28+dfsg2-7`
+
+Binary Packages:
+
+- `libdb5.3t64:riscv64=5.3.28+dfsg2-7`
+
+Licenses: (parsed from: `/usr/share/doc/libdb5.3t64/copyright`)
+
+- `Artistic`
+- `BSD-3-clause`
+- `BSD-3-clause-fjord`
+- `GPL`
+- `GPL-3`
+- `MIT-old`
+- `Ms-PL`
+- `Sleepycat`
+- `TCL-like`
+- `X11`
+- `zlib`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris db5.3=5.3.28+dfsg2-7
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/db5.3/db5.3_5.3.28%2bdfsg2-7.dsc' db5.3_5.3.28+dfsg2-7.dsc 2374
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/db5.3/db5.3_5.3.28%2bdfsg2.orig.tar.xz' db5.3_5.3.28+dfsg2.orig.tar.xz 21287688
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/db5.3/db5.3_5.3.28%2bdfsg2-7.debian.tar.xz' db5.3_5.3.28+dfsg2-7.debian.tar.xz 35232
+```
+
+### `dpkg` source package: `debconf=1.5.86ubuntu1`
+
+Binary Packages:
+
+- `debconf=1.5.86ubuntu1`
+
+Licenses: (parsed from: `/usr/share/doc/debconf/copyright`)
+
+- `BSD-2-clause`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris debconf=1.5.86ubuntu1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/debconf/debconf_1.5.86ubuntu1.dsc' debconf_1.5.86ubuntu1.dsc 2030
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/debconf/debconf_1.5.86ubuntu1.tar.xz' debconf_1.5.86ubuntu1.tar.xz 574112
+```
+
+### `dpkg` source package: `debianutils=5.17build1`
+
+Binary Packages:
+
+- `debianutils:riscv64=5.17build1`
+
+Licenses: (parsed from: `/usr/share/doc/debianutils/copyright`)
+
+- `GPL-2`
+- `GPL-2+`
+- `SMAIL-GPL`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris debianutils=5.17build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/debianutils/debianutils_5.17build1.dsc' debianutils_5.17build1.dsc 1771
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/debianutils/debianutils_5.17build1.tar.xz' debianutils_5.17build1.tar.xz 80468
+```
+
+### `dpkg` source package: `device-tree-compiler=1.7.0-2build1`
+
+Binary Packages:
+
+- `device-tree-compiler:riscv64=1.7.0-2build1`
+- `libfdt1:riscv64=1.7.0-2build1`
+
+Licenses: (parsed from: `/usr/share/doc/device-tree-compiler/copyright`, `/usr/share/doc/libfdt1/copyright`)
+
+- `BSD-2-clause`
+- `GPL-2`
+- `GPL-2+`
+- `LGPL-2.1+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris device-tree-compiler=1.7.0-2build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/device-tree-compiler/device-tree-compiler_1.7.0-2build1.dsc' device-tree-compiler_1.7.0-2build1.dsc 2590
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/device-tree-compiler/device-tree-compiler_1.7.0.orig.tar.gz' device-tree-compiler_1.7.0.orig.tar.gz 211526
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/device-tree-compiler/device-tree-compiler_1.7.0-2build1.debian.tar.xz' device-tree-compiler_1.7.0-2build1.debian.tar.xz 14536
+```
+
+### `dpkg` source package: `diffutils=1:3.10-1build1`
+
+Binary Packages:
+
+- `diffutils:riscv64=1:3.10-1build1`
+
+Licenses: (parsed from: `/usr/share/doc/diffutils/copyright`)
+
+- `FSFAP`
+- `FSFULLR`
+- `GFDL-1.3`
+- `GFDL-NIV-1.3`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3`
+- `GPL-3+`
+- `GPL-3+ with autoconf exception`
+- `GPL-3+ with texinfo exception`
+- `LGPL-2`
+- `LGPL-2.0+`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+- `LGPL-3`
+- `LGPL-3.0+`
+- `X11`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris diffutils=1:3.10-1build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/diffutils/diffutils_3.10-1build1.dsc' diffutils_3.10-1build1.dsc 2192
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/diffutils/diffutils_3.10.orig.tar.xz' diffutils_3.10.orig.tar.xz 1624240
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/diffutils/diffutils_3.10.orig.tar.xz.asc' diffutils_3.10.orig.tar.xz.asc 833
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/diffutils/diffutils_3.10-1build1.debian.tar.xz' diffutils_3.10-1build1.debian.tar.xz 14068
+```
+
+### `dpkg` source package: `dpkg=1.22.6ubuntu6.5`
+
+Binary Packages:
+
+- `dpkg:riscv64=1.22.6ubuntu6.5`
+
+Licenses: (parsed from: `/usr/share/doc/dpkg/copyright`)
+
+- `GPL-2`
+- `GPL-2+`
+- `public-domain-s-s-d`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris dpkg=1.22.6ubuntu6.5
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/dpkg/dpkg_1.22.6ubuntu6.5.dsc' dpkg_1.22.6ubuntu6.5.dsc 3156
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/d/dpkg/dpkg_1.22.6ubuntu6.5.tar.xz' dpkg_1.22.6ubuntu6.5.tar.xz 5547360
+```
+
+### `dpkg` source package: `e2fsprogs=1.47.0-2.4~exp1ubuntu4.1`
+
+Binary Packages:
+
+- `e2fsprogs:riscv64=1.47.0-2.4~exp1ubuntu4.1`
+- `libcom-err2:riscv64=1.47.0-2.4~exp1ubuntu4.1`
+- `libext2fs2t64:riscv64=1.47.0-2.4~exp1ubuntu4.1`
+- `libss2:riscv64=1.47.0-2.4~exp1ubuntu4.1`
+- `logsave:riscv64=1.47.0-2.4~exp1ubuntu4.1`
+
+Licenses: (parsed from: `/usr/share/doc/e2fsprogs/copyright`, `/usr/share/doc/libcom-err2/copyright`, `/usr/share/doc/libext2fs2t64/copyright`, `/usr/share/doc/libss2/copyright`, `/usr/share/doc/logsave/copyright`)
+
+- `Apache-2`
+- `Apache-2.0`
+- `BSD-3-Clause`
+- `GPL`
+- `GPL-2`
+- `GPL-2+ with Texinfo exception`
+- `ISC`
+- `Kazlib`
+- `LGPL-2`
+- `Latex2e`
+- `MIT-US-export`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris e2fsprogs=1.47.0-2.4~exp1ubuntu4.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/e/e2fsprogs/e2fsprogs_1.47.0.orig.tar.gz' e2fsprogs_1.47.0.orig.tar.gz 9637717
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/e/e2fsprogs/e2fsprogs_1.47.0.orig.tar.gz.asc' e2fsprogs_1.47.0.orig.tar.gz.asc 488
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/e/e2fsprogs/e2fsprogs_1.47.0-2.4%7eexp1ubuntu4.1.debian.tar.xz' e2fsprogs_1.47.0-2.4~exp1ubuntu4.1.debian.tar.xz 90580
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/e/e2fsprogs/e2fsprogs_1.47.0-2.4%7eexp1ubuntu4.1.dsc' e2fsprogs_1.47.0-2.4~exp1ubuntu4.1.dsc 3294
+```
+
+### `dpkg` source package: `emacsen-common=3.0.5`
+
+Binary Packages:
+
+- `emacsen-common=3.0.5`
+
+Licenses: (parsed from: `/usr/share/doc/emacsen-common/copyright`)
+
+- `GPL`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris emacsen-common=3.0.5
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/e/emacsen-common/emacsen-common_3.0.5.dsc' emacsen-common_3.0.5.dsc 1463
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/e/emacsen-common/emacsen-common_3.0.5.tar.xz' emacsen-common_3.0.5.tar.xz 16460
+```
+
+### `dpkg` source package: `expat=2.6.1-2ubuntu0.4`
+
+Binary Packages:
+
+- `libexpat1:riscv64=2.6.1-2ubuntu0.4`
+
+Licenses: (parsed from: `/usr/share/doc/libexpat1/copyright`)
+
+- `MIT`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris expat=2.6.1-2ubuntu0.4
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/e/expat/expat_2.6.1.orig.tar.gz' expat_2.6.1.orig.tar.gz 8414649
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/e/expat/expat_2.6.1-2ubuntu0.4.debian.tar.xz' expat_2.6.1-2ubuntu0.4.debian.tar.xz 31092
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/e/expat/expat_2.6.1-2ubuntu0.4.dsc' expat_2.6.1-2ubuntu0.4.dsc 1945
+```
+
+### `dpkg` source package: `findutils=4.9.0-5build1`
+
+Binary Packages:
+
+- `findutils:riscv64=4.9.0-5build1`
+
+Licenses: (parsed from: `/usr/share/doc/findutils/copyright`)
+
+- `BSD-3-clause`
+- `BSD-3-clause and/or GPL-3+`
+- `FSFAP`
+- `FSFULLR`
+- `GFDL-1.3`
+- `GFDL-NIV-1.3+`
+- `GPL with automake exception`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-2+ with Autoconf-data exception`
+- `GPL-3`
+- `GPL-3+`
+- `GPL-3+ with Autoconf-data exception`
+- `GPL-3+ with Bison-2.2 exception`
+- `ISC`
+- `ISC and/or LGPL-2.1+`
+- `LGPL-2`
+- `LGPL-2+`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+- `LGPL-3`
+- `LGPL-3+`
+- `X11`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris findutils=4.9.0-5build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/f/findutils/findutils_4.9.0-5build1.dsc' findutils_4.9.0-5build1.dsc 2404
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/f/findutils/findutils_4.9.0.orig.tar.xz' findutils_4.9.0.orig.tar.xz 2046252
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/f/findutils/findutils_4.9.0.orig.tar.xz.asc' findutils_4.9.0.orig.tar.xz.asc 488
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/f/findutils/findutils_4.9.0-5build1.debian.tar.xz' findutils_4.9.0-5build1.debian.tar.xz 32864
+```
+
+### `dpkg` source package: `gcc-14=14.2.0-4ubuntu2~24.04.1`
+
+Binary Packages:
+
+- `gcc-14-base:riscv64=14.2.0-4ubuntu2~24.04.1`
+- `libgcc-s1:riscv64=14.2.0-4ubuntu2~24.04.1`
+- `libstdc++6:riscv64=14.2.0-4ubuntu2~24.04.1`
+
+Licenses: (parsed from: `/usr/share/doc/gcc-14-base/copyright`, `/usr/share/doc/libgcc-s1/copyright`, `/usr/share/doc/libstdc++6/copyright`)
+
+- `Artistic`
+- `GFDL-1.2`
+- `GPL`
+- `GPL-3`
+- `LGPL`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris gcc-14=14.2.0-4ubuntu2~24.04.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gcc-14/gcc-14_14.2.0.orig.tar.gz' gcc-14_14.2.0.orig.tar.gz 97158172
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gcc-14/gcc-14_14.2.0-4ubuntu2%7e24.04.1.debian.tar.xz' gcc-14_14.2.0-4ubuntu2~24.04.1.debian.tar.xz 1950432
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gcc-14/gcc-14_14.2.0-4ubuntu2%7e24.04.1.dsc' gcc-14_14.2.0-4ubuntu2~24.04.1.dsc 46930
+```
+
+### `dpkg` source package: `gforth=0.7.3+dfsg-9build4.1`
+
+Binary Packages:
+
+- `gforth:riscv64=0.7.3+dfsg-9build4.1`
+- `gforth-common=0.7.3+dfsg-9build4.1`
+- `gforth-lib:riscv64=0.7.3+dfsg-9build4.1`
+
+Licenses: (parsed from: `/usr/share/doc/gforth/copyright`, `/usr/share/doc/gforth-common/copyright`, `/usr/share/doc/gforth-lib/copyright`)
+
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3`
+- `GPL-3+`
+- `LGPL-3`
+- `LGPL-3+`
+- `PD`
+- `other-copy-share-modify`
+- `other-distribute-freely`
+- `other-distribute-freely-jhopkins`
+- `other-emacs`
+- `other-free-doc`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris gforth=0.7.3+dfsg-9build4.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/universe/g/gforth/gforth_0.7.3%2bdfsg-9build4.1.dsc' gforth_0.7.3+dfsg-9build4.1.dsc 2232
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/universe/g/gforth/gforth_0.7.3%2bdfsg.orig.tar.xz' gforth_0.7.3+dfsg.orig.tar.xz 705716
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/universe/g/gforth/gforth_0.7.3%2bdfsg-9build4.1.debian.tar.xz' gforth_0.7.3+dfsg-9build4.1.debian.tar.xz 38408
+```
+
+### `dpkg` source package: `glibc=2.39-0ubuntu8.7`
+
+Binary Packages:
+
+- `libc-bin:riscv64=2.39-0ubuntu8.7`
+- `libc6:riscv64=2.39-0ubuntu8.7`
+
+Licenses: (parsed from: `/usr/share/doc/libc-bin/copyright`, `/usr/share/doc/libc6/copyright`)
+
+- `GFDL-1.3`
+- `GPL-2`
+- `LGPL-2.1`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris glibc=2.39-0ubuntu8.7
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/glibc/glibc_2.39.orig.tar.xz' glibc_2.39.orig.tar.xz 18520988
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/glibc/glibc_2.39.orig.tar.xz.asc' glibc_2.39.orig.tar.xz.asc 833
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/glibc/glibc_2.39-0ubuntu8.7.debian.tar.xz' glibc_2.39-0ubuntu8.7.debian.tar.xz 469880
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/glibc/glibc_2.39-0ubuntu8.7.dsc' glibc_2.39-0ubuntu8.7.dsc 9257
+```
+
+### `dpkg` source package: `gmp=2:6.3.0+dfsg-2ubuntu6.1`
+
+Binary Packages:
+
+- `libgmp10:riscv64=2:6.3.0+dfsg-2ubuntu6.1`
+
+Licenses: (parsed from: `/usr/share/doc/libgmp10/copyright`)
+
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3`
+- `GPL-3+`
+- `GPL-3+ with Bison exception`
+- `LGPL-3`
+- `LGPL-3+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris gmp=2:6.3.0+dfsg-2ubuntu6.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gmp/gmp_6.3.0%2bdfsg.orig.tar.xz' gmp_6.3.0+dfsg.orig.tar.xz 1870556
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gmp/gmp_6.3.0%2bdfsg-2ubuntu6.1.debian.tar.xz' gmp_6.3.0+dfsg-2ubuntu6.1.debian.tar.xz 38908
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gmp/gmp_6.3.0%2bdfsg-2ubuntu6.1.dsc' gmp_6.3.0+dfsg-2ubuntu6.1.dsc 2345
+```
+
+### `dpkg` source package: `gnupg2=2.4.4-2ubuntu17.4`
+
+Binary Packages:
+
+- `gpgv:riscv64=2.4.4-2ubuntu17.4`
+
+Licenses: (parsed from: `/usr/share/doc/gpgv/copyright`)
+
+- `BSD-3-clause`
+- `CC0-1.0`
+- `Expat`
+- `GPL-2+`
+- `GPL-2.0`
+- `GPL-3`
+- `GPL-3+`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+- `LGPL-3`
+- `LGPL-3+`
+- `RFC-Reference`
+- `TinySCHEME`
+- `permissive`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris gnupg2=2.4.4-2ubuntu17.4
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gnupg2/gnupg2_2.4.4.orig.tar.bz2' gnupg2_2.4.4.orig.tar.bz2 7886036
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gnupg2/gnupg2_2.4.4.orig.tar.bz2.asc' gnupg2_2.4.4.orig.tar.bz2.asc 386
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gnupg2/gnupg2_2.4.4-2ubuntu17.4.debian.tar.xz' gnupg2_2.4.4-2ubuntu17.4.debian.tar.xz 97376
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gnupg2/gnupg2_2.4.4-2ubuntu17.4.dsc' gnupg2_2.4.4-2ubuntu17.4.dsc 3984
+```
+
+### `dpkg` source package: `gnutls28=3.8.3-1.1ubuntu3.5`
+
+Binary Packages:
+
+- `libgnutls30t64:riscv64=3.8.3-1.1ubuntu3.5`
+
+Licenses: (parsed from: `/usr/share/doc/libgnutls30t64/copyright`)
+
+- `Apache-2.0`
+- `BSD-3-Clause`
+- `CC0 license`
+- `Expat`
+- `GFDL-1.3`
+- `GPL`
+- `GPL-3`
+- `GPLv3+`
+- `LGPL`
+- `LGPL-3`
+- `LGPLv2.1+`
+- `LGPLv3+_or_GPLv2+`
+- `The main library is licensed under GNU Lesser`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris gnutls28=3.8.3-1.1ubuntu3.5
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gnutls28/gnutls28_3.8.3-1.1ubuntu3.5.dsc' gnutls28_3.8.3-1.1ubuntu3.5.dsc 3397
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gnutls28/gnutls28_3.8.3.orig.tar.xz' gnutls28_3.8.3.orig.tar.xz 6463720
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gnutls28/gnutls28_3.8.3.orig.tar.xz.asc' gnutls28_3.8.3.orig.tar.xz.asc 854
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gnutls28/gnutls28_3.8.3-1.1ubuntu3.5.debian.tar.xz' gnutls28_3.8.3-1.1ubuntu3.5.debian.tar.xz 109884
+```
+
+### `dpkg` source package: `grep=3.11-4build1`
+
+Binary Packages:
+
+- `grep:riscv64=3.11-4build1`
+
+Licenses: (parsed from: `/usr/share/doc/grep/copyright`)
+
+- `GPL-3`
+- `GPL-3+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris grep=3.11-4build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/grep/grep_3.11-4build1.dsc' grep_3.11-4build1.dsc 2379
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/grep/grep_3.11.orig.tar.xz' grep_3.11.orig.tar.xz 1703776
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/grep/grep_3.11.orig.tar.xz.asc' grep_3.11.orig.tar.xz.asc 833
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/grep/grep_3.11-4build1.debian.tar.xz' grep_3.11-4build1.debian.tar.xz 20584
+```
+
+### `dpkg` source package: `gzip=1.12-1ubuntu3.1`
+
+Binary Packages:
+
+- `gzip:riscv64=1.12-1ubuntu3.1`
+
+Licenses: (parsed from: `/usr/share/doc/gzip/copyright`)
+
+- `FSF-manpages`
+- `GFDL-1.3+-no-invariant`
+- `GFDL-3`
+- `GPL-3`
+- `GPL-3+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris gzip=1.12-1ubuntu3.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gzip/gzip_1.12.orig.tar.xz' gzip_1.12.orig.tar.xz 825548
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gzip/gzip_1.12-1ubuntu3.1.debian.tar.xz' gzip_1.12-1ubuntu3.1.debian.tar.xz 21180
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/g/gzip/gzip_1.12-1ubuntu3.1.dsc' gzip_1.12-1ubuntu3.1.dsc 2042
+```
+
+### `dpkg` source package: `hostname=3.23+nmu2ubuntu2`
+
+Binary Packages:
+
+- `hostname:riscv64=3.23+nmu2ubuntu2`
+
+Licenses: (parsed from: `/usr/share/doc/hostname/copyright`)
+
+- `GPL-2`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris hostname=3.23+nmu2ubuntu2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/h/hostname/hostname_3.23%2bnmu2ubuntu2.dsc' hostname_3.23+nmu2ubuntu2.dsc 1567
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/h/hostname/hostname_3.23%2bnmu2ubuntu2.tar.xz' hostname_3.23+nmu2ubuntu2.tar.xz 13276
+```
+
+### `dpkg` source package: `init-system-helpers=1.66ubuntu1`
+
+Binary Packages:
+
+- `init-system-helpers=1.66ubuntu1`
+
+Licenses: (parsed from: `/usr/share/doc/init-system-helpers/copyright`)
+
+- `BSD-3-clause`
+- `GPL-2`
+- `GPL-2+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris init-system-helpers=1.66ubuntu1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/i/init-system-helpers/init-system-helpers_1.66ubuntu1.dsc' init-system-helpers_1.66ubuntu1.dsc 2353
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/i/init-system-helpers/init-system-helpers_1.66ubuntu1.tar.xz' init-system-helpers_1.66ubuntu1.tar.xz 45100
+```
+
+### `dpkg` source package: `jq=1.7.1-3ubuntu0.24.04.2`
+
+Binary Packages:
+
+- `jq:riscv64=1.7.1-3ubuntu0.24.04.2`
+- `libjq1:riscv64=1.7.1-3ubuntu0.24.04.2`
+
+Licenses: (parsed from: `/usr/share/doc/jq/copyright`, `/usr/share/doc/libjq1/copyright`)
+
+- `CC-BY-3.0`
+- `Expat`
+- `GPL-2`
+- `GPL-2.0+`
+- `MIT`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris jq=1.7.1-3ubuntu0.24.04.2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/j/jq/jq_1.7.1.orig.tar.gz' jq_1.7.1.orig.tar.gz 1323338
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/j/jq/jq_1.7.1-3ubuntu0.24.04.2.debian.tar.xz' jq_1.7.1-3ubuntu0.24.04.2.debian.tar.xz 22008
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/j/jq/jq_1.7.1-3ubuntu0.24.04.2.dsc' jq_1.7.1-3ubuntu0.24.04.2.dsc 1965
+```
+
+### `dpkg` source package: `keyutils=1.6.3-3build1`
+
+Binary Packages:
+
+- `libkeyutils1:riscv64=1.6.3-3build1`
+
+Licenses: (parsed from: `/usr/share/doc/libkeyutils1/copyright`)
+
+- `GPL-2`
+- `GPL-2+`
+- `LGPL-2`
+- `LGPL-2+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris keyutils=1.6.3-3build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/k/keyutils/keyutils_1.6.3-3build1.dsc' keyutils_1.6.3-3build1.dsc 2211
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/k/keyutils/keyutils_1.6.3.orig.tar.gz' keyutils_1.6.3.orig.tar.gz 137022
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/k/keyutils/keyutils_1.6.3-3build1.debian.tar.xz' keyutils_1.6.3-3build1.debian.tar.xz 13456
+```
+
+### `dpkg` source package: `krb5=1.20.1-6ubuntu2.6`
+
+Binary Packages:
+
+- `libgssapi-krb5-2:riscv64=1.20.1-6ubuntu2.6`
+- `libk5crypto3:riscv64=1.20.1-6ubuntu2.6`
+- `libkrb5-3:riscv64=1.20.1-6ubuntu2.6`
+- `libkrb5support0:riscv64=1.20.1-6ubuntu2.6`
+
+Licenses: (parsed from: `/usr/share/doc/libgssapi-krb5-2/copyright`, `/usr/share/doc/libk5crypto3/copyright`, `/usr/share/doc/libkrb5-3/copyright`, `/usr/share/doc/libkrb5support0/copyright`)
+
+- `GPL-2`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris krb5=1.20.1-6ubuntu2.6
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/k/krb5/krb5_1.20.1.orig.tar.gz' krb5_1.20.1.orig.tar.gz 8661660
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/k/krb5/krb5_1.20.1.orig.tar.gz.asc' krb5_1.20.1.orig.tar.gz.asc 833
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/k/krb5/krb5_1.20.1-6ubuntu2.6.debian.tar.xz' krb5_1.20.1-6ubuntu2.6.debian.tar.xz 122284
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/k/krb5/krb5_1.20.1-6ubuntu2.6.dsc' krb5_1.20.1-6ubuntu2.6.dsc 4125
+```
+
+### `dpkg` source package: `libassuan=2.5.6-1build1`
+
+Binary Packages:
+
+- `libassuan0:riscv64=2.5.6-1build1`
+
+Licenses: (parsed from: `/usr/share/doc/libassuan0/copyright`)
+
+- `GAP`
+- `GAP~FSF`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-2+ with libtool exception`
+- `GPL-3`
+- `GPL-3+`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+- `LGPL-3`
+- `LGPL-3+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libassuan=2.5.6-1build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/liba/libassuan/libassuan_2.5.6-1build1.dsc' libassuan_2.5.6-1build1.dsc 2734
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/liba/libassuan/libassuan_2.5.6.orig.tar.bz2' libassuan_2.5.6.orig.tar.bz2 577012
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/liba/libassuan/libassuan_2.5.6.orig.tar.bz2.asc' libassuan_2.5.6.orig.tar.bz2.asc 228
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/liba/libassuan/libassuan_2.5.6-1build1.debian.tar.xz' libassuan_2.5.6-1build1.debian.tar.xz 14412
+```
+
+### `dpkg` source package: `libcap-ng=0.8.4-2build2`
+
+Binary Packages:
+
+- `libcap-ng0:riscv64=0.8.4-2build2`
+
+Licenses: (parsed from: `/usr/share/doc/libcap-ng0/copyright`)
+
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libcap-ng=0.8.4-2build2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libc/libcap-ng/libcap-ng_0.8.4-2build2.dsc' libcap-ng_0.8.4-2build2.dsc 2351
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libc/libcap-ng/libcap-ng_0.8.4.orig.tar.gz' libcap-ng_0.8.4.orig.tar.gz 59317
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libc/libcap-ng/libcap-ng_0.8.4-2build2.debian.tar.xz' libcap-ng_0.8.4-2build2.debian.tar.xz 7384
+```
+
+### `dpkg` source package: `libcap2=1:2.66-5ubuntu2.2`
+
+Binary Packages:
+
+- `libcap2:riscv64=1:2.66-5ubuntu2.2`
+
+Licenses: (parsed from: `/usr/share/doc/libcap2/copyright`)
+
+- `BSD-3-clause`
+- `GPL-2`
+- `GPL-2+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libcap2=1:2.66-5ubuntu2.2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libc/libcap2/libcap2_2.66-5ubuntu2.2.dsc' libcap2_2.66-5ubuntu2.2.dsc 2319
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libc/libcap2/libcap2_2.66.orig.tar.xz' libcap2_2.66.orig.tar.xz 181592
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libc/libcap2/libcap2_2.66-5ubuntu2.2.debian.tar.xz' libcap2_2.66-5ubuntu2.2.debian.tar.xz 23076
+```
+
+### `dpkg` source package: `libffi=3.4.6-1build1`
+
+Binary Packages:
+
+- `libffi8:riscv64=3.4.6-1build1`
+
+Licenses: (parsed from: `/usr/share/doc/libffi8/copyright`)
+
+- `Expat`
+- `GPL`
+- `GPL-2+`
+- `GPL-3+`
+- `LGPL-2.1+`
+- `MPL-1.1`
+- `X11`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libffi=3.4.6-1build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libf/libffi/libffi_3.4.6-1build1.dsc' libffi_3.4.6-1build1.dsc 2055
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libf/libffi/libffi_3.4.6.orig.tar.gz' libffi_3.4.6.orig.tar.gz 598175
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libf/libffi/libffi_3.4.6-1build1.debian.tar.xz' libffi_3.4.6-1build1.debian.tar.xz 10736
+```
+
+### `dpkg` source package: `libgcrypt20=1.10.3-2build1`
+
+Binary Packages:
+
+- `libgcrypt20:riscv64=1.10.3-2build1`
+
+Licenses: (parsed from: `/usr/share/doc/libgcrypt20/copyright`)
+
+- `GPL-2`
+- `LGPL`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libgcrypt20=1.10.3-2build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libg/libgcrypt20/libgcrypt20_1.10.3-2build1.dsc' libgcrypt20_1.10.3-2build1.dsc 2931
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libg/libgcrypt20/libgcrypt20_1.10.3.orig.tar.bz2' libgcrypt20_1.10.3.orig.tar.bz2 3783827
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libg/libgcrypt20/libgcrypt20_1.10.3.orig.tar.bz2.asc' libgcrypt20_1.10.3.orig.tar.bz2.asc 390
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libg/libgcrypt20/libgcrypt20_1.10.3-2build1.debian.tar.xz' libgcrypt20_1.10.3-2build1.debian.tar.xz 36604
+```
+
+### `dpkg` source package: `libgpg-error=1.47-3build2.1`
+
+Binary Packages:
+
+- `libgpg-error0:riscv64=1.47-3build2.1`
+
+Licenses: (parsed from: `/usr/share/doc/libgpg-error0/copyright`)
+
+- `BSD-3-clause`
+- `GPL-3`
+- `GPL-3+`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+- `g10-permissive`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libgpg-error=1.47-3build2.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libg/libgpg-error/libgpg-error_1.47.orig.tar.bz2' libgpg-error_1.47.orig.tar.bz2 1020862
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libg/libgpg-error/libgpg-error_1.47.orig.tar.bz2.asc' libgpg-error_1.47.orig.tar.bz2.asc 228
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libg/libgpg-error/libgpg-error_1.47-3build2.1.debian.tar.xz' libgpg-error_1.47-3build2.1.debian.tar.xz 18776
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libg/libgpg-error/libgpg-error_1.47-3build2.1.dsc' libgpg-error_1.47-3build2.1.dsc 3007
+```
+
+### `dpkg` source package: `libidn2=2.3.7-2build1.1`
+
+Binary Packages:
+
+- `libidn2-0:riscv64=2.3.7-2build1.1`
+
+Licenses: (parsed from: `/usr/share/doc/libidn2-0/copyright`)
+
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3`
+- `GPL-3+`
+- `LGPL-3`
+- `LGPL-3+`
+- `Unicode`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libidn2=2.3.7-2build1.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libi/libidn2/libidn2_2.3.7.orig.tar.gz' libidn2_2.3.7.orig.tar.gz 2155214
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libi/libidn2/libidn2_2.3.7.orig.tar.gz.asc' libidn2_2.3.7.orig.tar.gz.asc 228
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libi/libidn2/libidn2_2.3.7-2build1.1.debian.tar.xz' libidn2_2.3.7-2build1.1.debian.tar.xz 16468
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libi/libidn2/libidn2_2.3.7-2build1.1.dsc' libidn2_2.3.7-2build1.1.dsc 2651
+```
+
+### `dpkg` source package: `libmd=1.1.0-2build1.1`
+
+Binary Packages:
+
+- `libmd0:riscv64=1.1.0-2build1.1`
+
+Licenses: (parsed from: `/usr/share/doc/libmd0/copyright`)
+
+- `BSD-2-clause`
+- `BSD-2-clause-NetBSD`
+- `BSD-3-clause`
+- `BSD-3-clause-Aaron-D-Gifford`
+- `Beerware`
+- `ISC`
+- `public-domain-md4`
+- `public-domain-md5`
+- `public-domain-sha1`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libmd=1.1.0-2build1.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libm/libmd/libmd_1.1.0.orig.tar.xz' libmd_1.1.0.orig.tar.xz 271228
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libm/libmd/libmd_1.1.0.orig.tar.xz.asc' libmd_1.1.0.orig.tar.xz.asc 833
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libm/libmd/libmd_1.1.0-2build1.1.debian.tar.xz' libmd_1.1.0-2build1.1.debian.tar.xz 8448
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libm/libmd/libmd_1.1.0-2build1.1.dsc' libmd_1.1.0-2build1.1.dsc 2391
+```
+
+### `dpkg` source package: `libonig=6.9.9-1build1`
+
+Binary Packages:
+
+- `libonig5:riscv64=6.9.9-1build1`
+
+Licenses: (parsed from: `/usr/share/doc/libonig5/copyright`)
+
+- `BSD-2-clause`
+- `GPL-2`
+- `GPL-2+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libonig=6.9.9-1build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libo/libonig/libonig_6.9.9-1build1.dsc' libonig_6.9.9-1build1.dsc 1994
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libo/libonig/libonig_6.9.9.orig.tar.gz' libonig_6.9.9.orig.tar.gz 645616
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libo/libonig/libonig_6.9.9-1build1.debian.tar.xz' libonig_6.9.9-1build1.debian.tar.xz 9084
+```
+
+### `dpkg` source package: `libpsl=0.21.2-1.1build1`
+
+Binary Packages:
+
+- `libpsl5t64:riscv64=0.21.2-1.1build1`
+
+Licenses: (parsed from: `/usr/share/doc/libpsl5t64/copyright`)
+
+- `Chromium`
+- `MIT`
+- `gnulib`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libpsl=0.21.2-1.1build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libp/libpsl/libpsl_0.21.2-1.1build1.dsc' libpsl_0.21.2-1.1build1.dsc 2425
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libp/libpsl/libpsl_0.21.2.orig.tar.xz' libpsl_0.21.2.orig.tar.xz 1870352
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libp/libpsl/libpsl_0.21.2-1.1build1.debian.tar.xz' libpsl_0.21.2-1.1build1.debian.tar.xz 12244
+```
+
+### `dpkg` source package: `libselinux=3.5-2ubuntu2.1`
+
+Binary Packages:
+
+- `libselinux1:riscv64=3.5-2ubuntu2.1`
+
+Licenses: (parsed from: `/usr/share/doc/libselinux1/copyright`)
+
+- `GPL-2`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libselinux=3.5-2ubuntu2.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libselinux/libselinux_3.5.orig.tar.gz' libselinux_3.5.orig.tar.gz 211453
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libselinux/libselinux_3.5.orig.tar.gz.asc' libselinux_3.5.orig.tar.gz.asc 981
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libselinux/libselinux_3.5-2ubuntu2.1.debian.tar.xz' libselinux_3.5-2ubuntu2.1.debian.tar.xz 38112
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libselinux/libselinux_3.5-2ubuntu2.1.dsc' libselinux_3.5-2ubuntu2.1.dsc 3098
+```
+
+### `dpkg` source package: `libsemanage=3.5-1build5`
+
+Binary Packages:
+
+- `libsemanage-common=3.5-1build5`
+- `libsemanage2:riscv64=3.5-1build5`
+
+Licenses: (parsed from: `/usr/share/doc/libsemanage-common/copyright`, `/usr/share/doc/libsemanage2/copyright`)
+
+- `GPL-2`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libsemanage=3.5-1build5
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libsemanage/libsemanage_3.5-1build5.dsc' libsemanage_3.5-1build5.dsc 3105
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libsemanage/libsemanage_3.5.orig.tar.gz' libsemanage_3.5.orig.tar.gz 185060
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libsemanage/libsemanage_3.5.orig.tar.gz.asc' libsemanage_3.5.orig.tar.gz.asc 981
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libsemanage/libsemanage_3.5-1build5.debian.tar.xz' libsemanage_3.5-1build5.debian.tar.xz 30188
+```
+
+### `dpkg` source package: `libsepol=3.5-2build1`
+
+Binary Packages:
+
+- `libsepol2:riscv64=3.5-2build1`
+
+Licenses: (parsed from: `/usr/share/doc/libsepol2/copyright`)
+
+- `GPL-2`
+- `GPL-2+`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+- `Zlib`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libsepol=3.5-2build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libsepol/libsepol_3.5-2build1.dsc' libsepol_3.5-2build1.dsc 2458
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libsepol/libsepol_3.5.orig.tar.gz' libsepol_3.5.orig.tar.gz 497522
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libsepol/libsepol_3.5.orig.tar.gz.asc' libsepol_3.5.orig.tar.gz.asc 981
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libsepol/libsepol_3.5-2build1.debian.tar.xz' libsepol_3.5-2build1.debian.tar.xz 27716
+```
+
+### `dpkg` source package: `libssh=0.10.6-2ubuntu0.4`
+
+Binary Packages:
+
+- `libssh-4:riscv64=0.10.6-2ubuntu0.4`
+
+Licenses: (parsed from: `/usr/share/doc/libssh-4/copyright`)
+
+- `BSD-2-clause`
+- `BSD-3-clause`
+- `LGPL-2.1`
+- `LGPL-2.1+~OpenSSL`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libssh=0.10.6-2ubuntu0.4
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libssh/libssh_0.10.6.orig.tar.xz' libssh_0.10.6.orig.tar.xz 561036
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libssh/libssh_0.10.6.orig.tar.xz.asc' libssh_0.10.6.orig.tar.xz.asc 833
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libssh/libssh_0.10.6-2ubuntu0.4.debian.tar.xz' libssh_0.10.6-2ubuntu0.4.debian.tar.xz 56400
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libs/libssh/libssh_0.10.6-2ubuntu0.4.dsc' libssh_0.10.6-2ubuntu0.4.dsc 2723
+```
+
+### `dpkg` source package: `libtasn1-6=4.19.0-3ubuntu0.24.04.2`
+
+Binary Packages:
+
+- `libtasn1-6:riscv64=4.19.0-3ubuntu0.24.04.2`
+
+Licenses: (parsed from: `/usr/share/doc/libtasn1-6/copyright`)
+
+- `GFDL-1.3`
+- `GPL-3`
+- `LGPL`
+- `LGPL-2.1`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libtasn1-6=4.19.0-3ubuntu0.24.04.2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libt/libtasn1-6/libtasn1-6_4.19.0.orig.tar.gz' libtasn1-6_4.19.0.orig.tar.gz 1786576
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libt/libtasn1-6/libtasn1-6_4.19.0.orig.tar.gz.asc' libtasn1-6_4.19.0.orig.tar.gz.asc 228
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libt/libtasn1-6/libtasn1-6_4.19.0-3ubuntu0.24.04.2.debian.tar.xz' libtasn1-6_4.19.0-3ubuntu0.24.04.2.debian.tar.xz 25112
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libt/libtasn1-6/libtasn1-6_4.19.0-3ubuntu0.24.04.2.dsc' libtasn1-6_4.19.0-3ubuntu0.24.04.2.dsc 2801
+```
+
+### `dpkg` source package: `libtool=2.4.7-7build1`
+
+Binary Packages:
+
+- `libltdl7:riscv64=2.4.7-7build1`
+
+Licenses: (parsed from: `/usr/share/doc/libltdl7/copyright`)
+
+- `GFDL-1.3`
+- `GFDL-NIV-1.3+`
+- `GPL-2`
+- `GPL-2+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libtool=2.4.7-7build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libt/libtool/libtool_2.4.7-7build1.dsc' libtool_2.4.7-7build1.dsc 2389
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libt/libtool/libtool_2.4.7.orig.tar.xz' libtool_2.4.7.orig.tar.xz 1026028
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libt/libtool/libtool_2.4.7-7build1.debian.tar.xz' libtool_2.4.7-7build1.debian.tar.xz 41052
+```
+
+### `dpkg` source package: `libunistring=1.1-2build1.1`
+
+Binary Packages:
+
+- `libunistring5:riscv64=1.1-2build1.1`
+
+Licenses: (parsed from: `/usr/share/doc/libunistring5/copyright`)
+
+- `FreeSoftware`
+- `GFDL-1.2`
+- `GFDL-NIV-1.2+`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-2+ with distribution exception`
+- `GPL-2+ with distribution exception, Expat`
+- `GPL-3`
+- `GPL-3+`
+- `LGPL-3`
+- `LGPL-3+`
+- `X11`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libunistring=1.1-2build1.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libu/libunistring/libunistring_1.1.orig.tar.xz' libunistring_1.1.orig.tar.xz 2397676
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libu/libunistring/libunistring_1.1.orig.tar.xz.asc' libunistring_1.1.orig.tar.xz.asc 833
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libu/libunistring/libunistring_1.1-2build1.1.debian.tar.xz' libunistring_1.1-2build1.1.debian.tar.xz 14188
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libu/libunistring/libunistring_1.1-2build1.1.dsc' libunistring_1.1-2build1.1.dsc 2292
+```
+
+### `dpkg` source package: `libxcrypt=1:4.4.36-4build1`
+
+Binary Packages:
+
+- `libcrypt1:riscv64=1:4.4.36-4build1`
+
+**WARNING:** unable to detect licenses! (package likely not compliant with DEP-5)  
+If source is available (seen below), check the contents of `debian/copyright` within it.
+
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libxcrypt=1:4.4.36-4build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libx/libxcrypt/libxcrypt_4.4.36-4build1.dsc' libxcrypt_4.4.36-4build1.dsc 2300
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libx/libxcrypt/libxcrypt_4.4.36.orig.tar.xz' libxcrypt_4.4.36.orig.tar.xz 392732
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libx/libxcrypt/libxcrypt_4.4.36-4build1.debian.tar.xz' libxcrypt_4.4.36-4build1.debian.tar.xz 8356
+```
+
+### `dpkg` source package: `libyaml=0.2.5-1build1`
+
+Binary Packages:
+
+- `libyaml-0-2:riscv64=0.2.5-1build1`
+
+Licenses: (parsed from: `/usr/share/doc/libyaml-0-2/copyright`)
+
+- `Expat`
+- `permissive`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libyaml=0.2.5-1build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/liby/libyaml/libyaml_0.2.5-1build1.dsc' libyaml_0.2.5-1build1.dsc 2203
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/liby/libyaml/libyaml_0.2.5.orig.tar.gz' libyaml_0.2.5.orig.tar.gz 85055
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/liby/libyaml/libyaml_0.2.5-1build1.debian.tar.xz' libyaml_0.2.5-1build1.debian.tar.xz 5496
+```
+
+### `dpkg` source package: `libzstd=1.5.5+dfsg2-2build1.1`
+
+Binary Packages:
+
+- `libzstd1:riscv64=1.5.5+dfsg2-2build1.1`
+
+Licenses: (parsed from: `/usr/share/doc/libzstd1/copyright`)
+
+- `BSD-3-clause`
+- `Expat`
+- `GPL-2`
+- `zlib`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris libzstd=1.5.5+dfsg2-2build1.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libz/libzstd/libzstd_1.5.5%2bdfsg2.orig.tar.xz' libzstd_1.5.5+dfsg2.orig.tar.xz 1784164
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libz/libzstd/libzstd_1.5.5%2bdfsg2-2build1.1.debian.tar.xz' libzstd_1.5.5+dfsg2-2build1.1.debian.tar.xz 21288
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/libz/libzstd/libzstd_1.5.5%2bdfsg2-2build1.1.dsc' libzstd_1.5.5+dfsg2-2build1.1.dsc 2485
+```
+
+### `dpkg` source package: `lua5.4=5.4.6-3build2`
+
+Binary Packages:
+
+- `lua5.4:riscv64=5.4.6-3build2`
+
+Licenses: (parsed from: `/usr/share/doc/lua5.4/copyright`)
+
+- `Expat`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris lua5.4=5.4.6-3build2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/l/lua5.4/lua5.4_5.4.6-3build2.dsc' lua5.4_5.4.6-3build2.dsc 2191
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/l/lua5.4/lua5.4_5.4.6.orig.tar.gz' lua5.4_5.4.6.orig.tar.gz 363329
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/l/lua5.4/lua5.4_5.4.6-3build2.debian.tar.xz' lua5.4_5.4.6-3build2.debian.tar.xz 13240
+```
+
+### `dpkg` source package: `luasocket=3.1.0-1`
+
+Binary Packages:
+
+- `lua-socket:riscv64=3.1.0-1`
+
+Licenses: (parsed from: `/usr/share/doc/lua-socket/copyright`)
+
+- `Expat`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris luasocket=3.1.0-1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/universe/l/luasocket/luasocket_3.1.0-1.dsc' luasocket_3.1.0-1.dsc 1498
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/universe/l/luasocket/luasocket_3.1.0.orig.tar.gz' luasocket_3.1.0.orig.tar.gz 336570
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/universe/l/luasocket/luasocket_3.1.0-1.debian.tar.xz' luasocket_3.1.0-1.debian.tar.xz 7092
+```
+
+### `dpkg` source package: `lz4=1.9.4-1build1.1`
+
+Binary Packages:
+
+- `liblz4-1:riscv64=1.9.4-1build1.1`
+
+Licenses: (parsed from: `/usr/share/doc/liblz4-1/copyright`)
+
+- `BSD-2-clause`
+- `GPL-2`
+- `GPL-2+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris lz4=1.9.4-1build1.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/l/lz4/lz4_1.9.4.orig.tar.gz' lz4_1.9.4.orig.tar.gz 354063
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/l/lz4/lz4_1.9.4-1build1.1.debian.tar.xz' lz4_1.9.4-1build1.1.debian.tar.xz 8356
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/l/lz4/lz4_1.9.4-1build1.1.dsc' lz4_1.9.4-1build1.1.dsc 2061
+```
+
+### `dpkg` source package: `machine-guest-tools=0.18.0test-1`
+
+Binary Packages:
+
+- `machine-guest-tools:riscv64=0.18.0test-1`
+
+**WARNING:** unable to detect licenses! (package likely not compliant with DEP-5)  
+If source is available (seen below), check the contents of `debian/copyright` within it.
+
+
+**WARNING:** no archive source (package was installed from a local `.deb`, not a repository).
+
+
+### `dpkg` source package: `mawk=1.3.4.20240123-1build1`
+
+Binary Packages:
+
+- `mawk:riscv64=1.3.4.20240123-1build1`
+
+Licenses: (parsed from: `/usr/share/doc/mawk/copyright`)
+
+- `CC-BY-3.0`
+- `GPL-2`
+- `GPL-2.0-only`
+- `X11`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris mawk=1.3.4.20240123-1build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/m/mawk/mawk_1.3.4.20240123-1build1.dsc' mawk_1.3.4.20240123-1build1.dsc 2312
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/m/mawk/mawk_1.3.4.20240123.orig.tar.gz' mawk_1.3.4.20240123.orig.tar.gz 413943
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/m/mawk/mawk_1.3.4.20240123.orig.tar.gz.asc' mawk_1.3.4.20240123.orig.tar.gz.asc 729
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/m/mawk/mawk_1.3.4.20240123-1build1.debian.tar.xz' mawk_1.3.4.20240123-1build1.debian.tar.xz 15704
+```
+
+### `dpkg` source package: `ncurses=6.4+20240113-1ubuntu2`
+
+Binary Packages:
+
+- `libncursesw6:riscv64=6.4+20240113-1ubuntu2`
+- `libtinfo6:riscv64=6.4+20240113-1ubuntu2`
+- `ncurses-base=6.4+20240113-1ubuntu2`
+- `ncurses-bin:riscv64=6.4+20240113-1ubuntu2`
+
+Licenses: (parsed from: `/usr/share/doc/libncursesw6/copyright`, `/usr/share/doc/libtinfo6/copyright`, `/usr/share/doc/ncurses-base/copyright`, `/usr/share/doc/ncurses-bin/copyright`)
+
+- `BSD-3-clause`
+- `MIT/X11`
+- `X11`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris ncurses=6.4+20240113-1ubuntu2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/ncurses/ncurses_6.4%2b20240113-1ubuntu2.dsc' ncurses_6.4+20240113-1ubuntu2.dsc 3963
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/ncurses/ncurses_6.4%2b20240113.orig.tar.gz' ncurses_6.4+20240113.orig.tar.gz 3688489
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/ncurses/ncurses_6.4%2b20240113.orig.tar.gz.asc' ncurses_6.4+20240113.orig.tar.gz.asc 729
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/ncurses/ncurses_6.4%2b20240113-1ubuntu2.debian.tar.xz' ncurses_6.4+20240113-1ubuntu2.debian.tar.xz 49372
+```
+
+### `dpkg` source package: `nettle=3.9.1-2.2build1.1`
+
+Binary Packages:
+
+- `libhogweed6t64:riscv64=3.9.1-2.2build1.1`
+- `libnettle8t64:riscv64=3.9.1-2.2build1.1`
+
+Licenses: (parsed from: `/usr/share/doc/libhogweed6t64/copyright`, `/usr/share/doc/libnettle8t64/copyright`)
+
+- `Expat`
+- `GAP`
+- `GPL`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3+ with Autoconf exception`
+- `LGPL`
+- `LGPL-2`
+- `LGPL-2+`
+- `LGPL-3+`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris nettle=3.9.1-2.2build1.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/nettle/nettle_3.9.1.orig.tar.gz' nettle_3.9.1.orig.tar.gz 2396741
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/nettle/nettle_3.9.1.orig.tar.gz.asc' nettle_3.9.1.orig.tar.gz.asc 573
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/nettle/nettle_3.9.1-2.2build1.1.debian.tar.xz' nettle_3.9.1-2.2build1.1.debian.tar.xz 24848
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/nettle/nettle_3.9.1-2.2build1.1.dsc' nettle_3.9.1-2.2build1.1.dsc 2325
+```
+
+### `dpkg` source package: `nghttp2=1.59.0-1ubuntu0.3`
+
+Binary Packages:
+
+- `libnghttp2-14:riscv64=1.59.0-1ubuntu0.3`
+
+Licenses: (parsed from: `/usr/share/doc/libnghttp2-14/copyright`)
+
+- `BSD-2-clause`
+- `Expat`
+- `GPL-3`
+- `GPL-3+ with autoconf exception`
+- `MIT`
+- `all-permissive`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris nghttp2=1.59.0-1ubuntu0.3
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/nghttp2/nghttp2_1.59.0.orig.tar.gz' nghttp2_1.59.0.orig.tar.gz 1055492
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/nghttp2/nghttp2_1.59.0-1ubuntu0.3.debian.tar.xz' nghttp2_1.59.0-1ubuntu0.3.debian.tar.xz 16364
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/nghttp2/nghttp2_1.59.0-1ubuntu0.3.dsc' nghttp2_1.59.0-1ubuntu0.3.dsc 2669
+```
+
+### `dpkg` source package: `npth=1.6-3.1build1`
+
+Binary Packages:
+
+- `libnpth0t64:riscv64=1.6-3.1build1`
+
+Licenses: (parsed from: `/usr/share/doc/libnpth0t64/copyright`)
+
+- `LGPL-2.1`
+- `LGPL-2.1+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris npth=1.6-3.1build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/npth/npth_1.6-3.1build1.dsc' npth_1.6-3.1build1.dsc 2107
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/npth/npth_1.6.orig.tar.bz2' npth_1.6.orig.tar.bz2 300486
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/n/npth/npth_1.6-3.1build1.debian.tar.xz' npth_1.6-3.1build1.debian.tar.xz 11036
+```
+
+### `dpkg` source package: `openldap=2.6.10+dfsg-0ubuntu0.24.04.1`
+
+Binary Packages:
+
+- `libldap2:riscv64=2.6.10+dfsg-0ubuntu0.24.04.1`
+
+Licenses: (parsed from: `/usr/share/doc/libldap2/copyright`)
+
+- `BSD-3-clause`
+- `BSD-3-clause-California`
+- `BSD-3-clause-variant`
+- `BSD-4-clause-California`
+- `Beerware`
+- `Expat`
+- `Expat-ISC`
+- `Expat-UNM`
+- `F5`
+- `FSF-unlimited`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-2+ with Autoconf exception`
+- `GPL-2+ with Libtool exception`
+- `GPL-3`
+- `GPL-3+`
+- `GPL-3+ with Autoconf exception`
+- `GPL-3+ with Libtool exception`
+- `JCG`
+- `MIT-XC`
+- `NeoSoft-permissive`
+- `OpenLDAP-2.8`
+- `UMich`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris openldap=2.6.10+dfsg-0ubuntu0.24.04.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/o/openldap/openldap_2.6.10%2bdfsg.orig.tar.xz' openldap_2.6.10+dfsg.orig.tar.xz 3754560
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/o/openldap/openldap_2.6.10%2bdfsg-0ubuntu0.24.04.1.debian.tar.xz' openldap_2.6.10+dfsg-0ubuntu0.24.04.1.debian.tar.xz 191132
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/o/openldap/openldap_2.6.10%2bdfsg-0ubuntu0.24.04.1.dsc' openldap_2.6.10+dfsg-0ubuntu0.24.04.1.dsc 3653
+```
+
+### `dpkg` source package: `openssl=3.0.13-0ubuntu3.11`
+
+Binary Packages:
+
+- `libssl3t64:riscv64=3.0.13-0ubuntu3.11`
+
+Licenses: (parsed from: `/usr/share/doc/libssl3t64/copyright`)
+
+- `Apache-2.0`
+- `Artistic`
+- `GPL-1`
+- `GPL-1+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris openssl=3.0.13-0ubuntu3.11
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/o/openssl/openssl_3.0.13.orig.tar.gz' openssl_3.0.13.orig.tar.gz 15294843
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/o/openssl/openssl_3.0.13-0ubuntu3.11.debian.tar.xz' openssl_3.0.13-0ubuntu3.11.debian.tar.xz 195932
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/o/openssl/openssl_3.0.13-0ubuntu3.11.dsc' openssl_3.0.13-0ubuntu3.11.dsc 2516
+```
+
+### `dpkg` source package: `p11-kit=0.25.3-4ubuntu2.1`
+
+Binary Packages:
+
+- `libp11-kit0:riscv64=0.25.3-4ubuntu2.1`
+
+Licenses: (parsed from: `/usr/share/doc/libp11-kit0/copyright`)
+
+- `Apache-2.0`
+- `BSD-3-clause`
+- `FSFAP`
+- `FSFULLR`
+- `GPL-2+ with Autoconf-data exception`
+- `GPL-3+ with Autoconf-data exception`
+- `ISC`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+- `X11`
+- `customFSFUL`
+- `customFSFULLRWD`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris p11-kit=0.25.3-4ubuntu2.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/p11-kit/p11-kit_0.25.3.orig.tar.xz' p11-kit_0.25.3.orig.tar.xz 991528
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/p11-kit/p11-kit_0.25.3-4ubuntu2.1.debian.tar.xz' p11-kit_0.25.3-4ubuntu2.1.debian.tar.xz 26028
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/p11-kit/p11-kit_0.25.3-4ubuntu2.1.dsc' p11-kit_0.25.3-4ubuntu2.1.dsc 2405
+```
+
+### `dpkg` source package: `pam=1.5.3-5ubuntu5.5`
+
+Binary Packages:
+
+- `libpam-modules:riscv64=1.5.3-5ubuntu5.5`
+- `libpam-modules-bin:riscv64=1.5.3-5ubuntu5.5`
+- `libpam-runtime=1.5.3-5ubuntu5.5`
+- `libpam0g:riscv64=1.5.3-5ubuntu5.5`
+
+Licenses: (parsed from: `/usr/share/doc/libpam-modules/copyright`, `/usr/share/doc/libpam-modules-bin/copyright`, `/usr/share/doc/libpam-runtime/copyright`, `/usr/share/doc/libpam0g/copyright`)
+
+- `BSD-3-clause`
+- `BSD-tcp_wrappers`
+- `Beerware`
+- `GPL`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3`
+- `GPL-3+ with Bison exception`
+- `LGPL-2`
+- `LGPL-2+`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris pam=1.5.3-5ubuntu5.5
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/pam/pam_1.5.3.orig.tar.xz' pam_1.5.3.orig.tar.xz 1020076
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/pam/pam_1.5.3-5ubuntu5.5.debian.tar.xz' pam_1.5.3-5ubuntu5.5.debian.tar.xz 204688
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/pam/pam_1.5.3-5ubuntu5.5.dsc' pam_1.5.3-5ubuntu5.5.dsc 2727
+```
+
+### `dpkg` source package: `pcre2=10.42-4ubuntu2.1`
+
+Binary Packages:
+
+- `libpcre2-8-0:riscv64=10.42-4ubuntu2.1`
+
+Licenses: (parsed from: `/usr/share/doc/libpcre2-8-0/copyright`)
+
+- `BSD-2-clause`
+- `BSD-3-clause`
+- `BSD-3-clause-Cambridge with BINARY LIBRARY-LIKE PACKAGES exception`
+- `X11`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris pcre2=10.42-4ubuntu2.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/pcre2/pcre2_10.42.orig.tar.gz' pcre2_10.42.orig.tar.gz 2397194
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/pcre2/pcre2_10.42-4ubuntu2.1.diff.gz' pcre2_10.42-4ubuntu2.1.diff.gz 8431
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/pcre2/pcre2_10.42-4ubuntu2.1.dsc' pcre2_10.42-4ubuntu2.1.dsc 2277
+```
+
+### `dpkg` source package: `perl=5.38.2-3.2ubuntu0.2`
+
+Binary Packages:
+
+- `perl-base:riscv64=5.38.2-3.2ubuntu0.2`
+
+Licenses: (parsed from: `/usr/share/doc/perl-base/copyright`)
+
+- `Artistic`
+- `Artistic,`
+- `Artistic-2`
+- `Artistic-dist`
+- `BSD-3-clause`
+- `BSD-3-clause-GENERIC`
+- `BSD-3-clause-with-weird-numbering`
+- `BSD-4-clause-POWERDOG`
+- `BZIP`
+- `CC0-1.0`
+- `DONT-CHANGE-THE-GPL`
+- `Expat`
+- `FSFAP`
+- `GPL-1`
+- `GPL-1+`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3+-WITH-BISON-EXCEPTION`
+- `LGPL-2.1`
+- `REGCOMP`
+- `REGCOMP,`
+- `SDBM-PUBLIC-DOMAIN`
+- `TEXT-TABS`
+- `Unicode`
+- `ZLIB`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris perl=5.38.2-3.2ubuntu0.2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/perl/perl_5.38.2-3.2ubuntu0.2.dsc' perl_5.38.2-3.2ubuntu0.2.dsc 3036
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/perl/perl_5.38.2.orig-regen-configure.tar.xz' perl_5.38.2.orig-regen-configure.tar.xz 418808
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/perl/perl_5.38.2.orig.tar.xz' perl_5.38.2.orig.tar.xz 13679524
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/perl/perl_5.38.2-3.2ubuntu0.2.debian.tar.xz' perl_5.38.2-3.2ubuntu0.2.debian.tar.xz 171736
+```
+
+### `dpkg` source package: `procps=2:4.0.4-4ubuntu3.2`
+
+Binary Packages:
+
+- `libproc2-0:riscv64=2:4.0.4-4ubuntu3.2`
+- `procps:riscv64=2:4.0.4-4ubuntu3.2`
+
+Licenses: (parsed from: `/usr/share/doc/libproc2-0/copyright`, `/usr/share/doc/procps/copyright`)
+
+- `GPL-2`
+- `GPL-2.0+`
+- `LGPL-2`
+- `LGPL-2.0+`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris procps=2:4.0.4-4ubuntu3.2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/procps/procps_4.0.4.orig.tar.xz' procps_4.0.4.orig.tar.xz 1401540
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/procps/procps_4.0.4-4ubuntu3.2.debian.tar.xz' procps_4.0.4-4ubuntu3.2.debian.tar.xz 38784
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/procps/procps_4.0.4-4ubuntu3.2.dsc' procps_4.0.4-4ubuntu3.2.dsc 2251
+```
+
+### `dpkg` source package: `python3-defaults=3.12.3-0ubuntu2.1`
+
+Binary Packages:
+
+- `python3-minimal:riscv64=3.12.3-0ubuntu2.1`
+
+**WARNING:** unable to detect licenses! (package likely not compliant with DEP-5)  
+If source is available (seen below), check the contents of `debian/copyright` within it.
+
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris python3-defaults=3.12.3-0ubuntu2.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/python3-defaults/python3-defaults_3.12.3-0ubuntu2.1.tar.gz' python3-defaults_3.12.3-0ubuntu2.1.tar.gz 147765
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/python3-defaults/python3-defaults_3.12.3-0ubuntu2.1.dsc' python3-defaults_3.12.3-0ubuntu2.1.dsc 3116
+```
+
+### `dpkg` source package: `python3.12=3.12.3-1ubuntu0.13`
+
+Binary Packages:
+
+- `libpython3.12-minimal:riscv64=3.12.3-1ubuntu0.13`
+- `python3.12-minimal:riscv64=3.12.3-1ubuntu0.13`
+
+Licenses: (parsed from: `/usr/share/doc/libpython3.12-minimal/copyright`, `/usr/share/doc/python3.12-minimal/copyright`)
+
+- `* Permission to use this software in any way is granted without`
+- `By obtaining, using, and/or copying this software and/or its`
+- `GPL-2`
+- `Permission  is  hereby granted,  free  of charge,  to  any person`
+- `Permission is hereby granted, free of charge, to any person obtaining`
+- `Permission to use, copy, modify,`
+- `Redistribution`
+- `This software is provided 'as-is', without any express`
+- `This software is provided as-is, without express`
+- `binary forms, with`
+- `distribute this software`
+- `distribute this software and`
+- `distribute this software for any`
+- `implied`
+- `its`
+- `use in source`
+- `without`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris python3.12=3.12.3-1ubuntu0.13
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/python3.12/python3.12_3.12.3.orig.tar.xz' python3.12_3.12.3.orig.tar.xz 20625068
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/python3.12/python3.12_3.12.3-1ubuntu0.13.debian.tar.xz' python3.12_3.12.3-1ubuntu0.13.debian.tar.xz 271684
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/p/python3.12/python3.12_3.12.3-1ubuntu0.13.dsc' python3.12_3.12.3-1ubuntu0.13.dsc 3879
+```
+
+### `dpkg` source package: `readline=8.2-4build1`
+
+Binary Packages:
+
+- `libreadline8t64:riscv64=8.2-4build1`
+- `readline-common=8.2-4build1`
+
+Licenses: (parsed from: `/usr/share/doc/libreadline8t64/copyright`, `/usr/share/doc/readline-common/copyright`)
+
+- `GFDL`
+- `GFDL-NIV-1.3+`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3`
+- `GPL-3+`
+- `ISC-no-attribution`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris readline=8.2-4build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/r/readline/readline_8.2-4build1.dsc' readline_8.2-4build1.dsc 2926
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/r/readline/readline_8.2.orig.tar.gz' readline_8.2.orig.tar.gz 3043952
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/r/readline/readline_8.2-4build1.debian.tar.xz' readline_8.2-4build1.debian.tar.xz 33816
+```
+
+### `dpkg` source package: `rtmpdump=2.4+20151223.gitfa8646d.1-2build7`
+
+Binary Packages:
+
+- `librtmp1:riscv64=2.4+20151223.gitfa8646d.1-2build7`
+
+Licenses: (parsed from: `/usr/share/doc/librtmp1/copyright`)
+
+- `GPL-2`
+- `LGPL-2.1`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris rtmpdump=2.4+20151223.gitfa8646d.1-2build7
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/r/rtmpdump/rtmpdump_2.4%2b20151223.gitfa8646d.1-2build7.dsc' rtmpdump_2.4+20151223.gitfa8646d.1-2build7.dsc 2439
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/r/rtmpdump/rtmpdump_2.4%2b20151223.gitfa8646d.1.orig.tar.gz' rtmpdump_2.4+20151223.gitfa8646d.1.orig.tar.gz 142213
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/r/rtmpdump/rtmpdump_2.4%2b20151223.gitfa8646d.1-2build7.debian.tar.xz' rtmpdump_2.4+20151223.gitfa8646d.1-2build7.debian.tar.xz 8464
+```
+
+### `dpkg` source package: `sed=4.9-2build1`
+
+Binary Packages:
+
+- `sed:riscv64=4.9-2build1`
+
+Licenses: (parsed from: `/usr/share/doc/sed/copyright`)
+
+- `BSD-4-clause-UC`
+- `BSL-1`
+- `GFDL-1.3`
+- `GFDL-NIV-1.3+`
+- `GPL-3`
+- `GPL-3+`
+- `ISC`
+- `X11`
+- `pcre`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris sed=4.9-2build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/sed/sed_4.9-2build1.dsc' sed_4.9-2build1.dsc 1992
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/sed/sed_4.9.orig.tar.xz' sed_4.9.orig.tar.xz 1397092
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/sed/sed_4.9-2build1.debian.tar.xz' sed_4.9-2build1.debian.tar.xz 62896
+```
+
+### `dpkg` source package: `sensible-utils=0.0.22`
+
+Binary Packages:
+
+- `sensible-utils=0.0.22`
+
+Licenses: (parsed from: `/usr/share/doc/sensible-utils/copyright`)
+
+- `All-permissive`
+- `BSD-2-clause`
+- `GPL-2`
+- `GPL-2+`
+- `configure`
+- `installsh`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris sensible-utils=0.0.22
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/sensible-utils/sensible-utils_0.0.22.dsc' sensible-utils_0.0.22.dsc 1737
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/sensible-utils/sensible-utils_0.0.22.tar.xz' sensible-utils_0.0.22.tar.xz 74412
+```
+
+### `dpkg` source package: `shadow=1:4.13+dfsg1-4ubuntu3.2`
+
+Binary Packages:
+
+- `login:riscv64=1:4.13+dfsg1-4ubuntu3.2`
+- `passwd:riscv64=1:4.13+dfsg1-4ubuntu3.2`
+
+Licenses: (parsed from: `/usr/share/doc/login/copyright`, `/usr/share/doc/passwd/copyright`)
+
+- `BSD-3-clause`
+- `GPL-1`
+- `GPL-2`
+- `GPL-2+`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris shadow=1:4.13+dfsg1-4ubuntu3.2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/shadow/shadow_4.13%2bdfsg1.orig.tar.xz' shadow_4.13+dfsg1.orig.tar.xz 1811752
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/shadow/shadow_4.13%2bdfsg1-4ubuntu3.2.debian.tar.xz' shadow_4.13+dfsg1-4ubuntu3.2.debian.tar.xz 96392
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/shadow/shadow_4.13%2bdfsg1-4ubuntu3.2.dsc' shadow_4.13+dfsg1-4ubuntu3.2.dsc 2400
+```
+
+### `dpkg` source package: `systemd=255.4-1ubuntu8.15`
+
+Binary Packages:
+
+- `libsystemd0:riscv64=255.4-1ubuntu8.15`
+- `libudev1:riscv64=255.4-1ubuntu8.15`
+
+Licenses: (parsed from: `/usr/share/doc/libsystemd0/copyright`, `/usr/share/doc/libudev1/copyright`)
+
+- `CC0-1.0`
+- `Expat`
+- `GPL-2`
+- `GPL-2 with Linux-syscall-note exception`
+- `GPL-2+`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris systemd=255.4-1ubuntu8.15
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/systemd/systemd_255.4-1ubuntu8.15.dsc' systemd_255.4-1ubuntu8.15.dsc 7324
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/systemd/systemd_255.4.orig.tar.gz' systemd_255.4.orig.tar.gz 14952427
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/systemd/systemd_255.4-1ubuntu8.15.debian.tar.xz' systemd_255.4-1ubuntu8.15.debian.tar.xz 264648
+```
+
+### `dpkg` source package: `sysvinit=3.08-6ubuntu3`
+
+Binary Packages:
+
+- `sysvinit-utils:riscv64=3.08-6ubuntu3`
+
+Licenses: (parsed from: `/usr/share/doc/sysvinit-utils/copyright`)
+
+- `GPL-2`
+- `GPL-2.0`
+- `GPL-2.0+`
+- `GPL-3`
+- `GPL-3.0`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris sysvinit=3.08-6ubuntu3
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/sysvinit/sysvinit_3.08-6ubuntu3.dsc' sysvinit_3.08-6ubuntu3.dsc 2495
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/sysvinit/sysvinit_3.08.orig.tar.gz' sysvinit_3.08.orig.tar.gz 513674
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/s/sysvinit/sysvinit_3.08-6ubuntu3.debian.tar.xz' sysvinit_3.08-6ubuntu3.debian.tar.xz 140128
+```
+
+### `dpkg` source package: `tar=1.35+dfsg-3build1`
+
+Binary Packages:
+
+- `tar:riscv64=1.35+dfsg-3build1`
+
+Licenses: (parsed from: `/usr/share/doc/tar/copyright`)
+
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3`
+- `GPL-3+`
+- `GPL-3+ with Bison exception`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+- `LGPL-3`
+- `LGPL-3+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris tar=1.35+dfsg-3build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tar/tar_1.35%2bdfsg-3build1.dsc' tar_1.35+dfsg-3build1.dsc 2141
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tar/tar_1.35%2bdfsg.orig.tar.xz' tar_1.35+dfsg.orig.tar.xz 2111608
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tar/tar_1.35%2bdfsg-3build1.debian.tar.xz' tar_1.35+dfsg-3build1.debian.tar.xz 20948
+```
+
+### `dpkg` source package: `tcl8.6=8.6.14+dfsg-1build1`
+
+Binary Packages:
+
+- `libtcl8.6:riscv64=8.6.14+dfsg-1build1`
+- `tcl8.6:riscv64=8.6.14+dfsg-1build1`
+
+**WARNING:** unable to detect licenses! (package likely not compliant with DEP-5)  
+If source is available (seen below), check the contents of `debian/copyright` within it.
+
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris tcl8.6=8.6.14+dfsg-1build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tcl8.6/tcl8.6_8.6.14%2bdfsg-1build1.dsc' tcl8.6_8.6.14+dfsg-1build1.dsc 2260
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tcl8.6/tcl8.6_8.6.14%2bdfsg.orig.tar.gz' tcl8.6_8.6.14+dfsg.orig.tar.gz 7091313
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tcl8.6/tcl8.6_8.6.14%2bdfsg-1build1.debian.tar.xz' tcl8.6_8.6.14+dfsg-1build1.debian.tar.xz 14484
+```
+
+### `dpkg` source package: `tcltk-defaults=8.6.14build1`
+
+Binary Packages:
+
+- `tcl:riscv64=8.6.14build1`
+
+Licenses: (parsed from: `/usr/share/doc/tcl/copyright`)
+
+- `GPL`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris tcltk-defaults=8.6.14build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tcltk-defaults/tcltk-defaults_8.6.14build1.dsc' tcltk-defaults_8.6.14build1.dsc 2151
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tcltk-defaults/tcltk-defaults_8.6.14build1.tar.xz' tcltk-defaults_8.6.14build1.tar.xz 14252
+```
+
+### `dpkg` source package: `tzdata=2026a-0ubuntu0.24.04.1`
+
+Binary Packages:
+
+- `tzdata=2026a-0ubuntu0.24.04.1`
+
+Licenses: (parsed from: `/usr/share/doc/tzdata/copyright`)
+
+- `ICU`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris tzdata=2026a-0ubuntu0.24.04.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tzdata/tzdata_2026a.orig.tar.gz' tzdata_2026a.orig.tar.gz 471812
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tzdata/tzdata_2026a.orig.tar.gz.asc' tzdata_2026a.orig.tar.gz.asc 833
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tzdata/tzdata_2026a-0ubuntu0.24.04.1.debian.tar.xz' tzdata_2026a-0ubuntu0.24.04.1.debian.tar.xz 188416
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/t/tzdata/tzdata_2026a-0ubuntu0.24.04.1.dsc' tzdata_2026a-0ubuntu0.24.04.1.dsc 2728
+```
+
+### `dpkg` source package: `ubuntu-keyring=2023.11.28.1`
+
+Binary Packages:
+
+- `ubuntu-keyring=2023.11.28.1`
+
+Licenses: (parsed from: `/usr/share/doc/ubuntu-keyring/copyright`)
+
+- `GPL`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris ubuntu-keyring=2023.11.28.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/u/ubuntu-keyring/ubuntu-keyring_2023.11.28.1.dsc' ubuntu-keyring_2023.11.28.1.dsc 1872
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/u/ubuntu-keyring/ubuntu-keyring_2023.11.28.1.tar.xz' ubuntu-keyring_2023.11.28.1.tar.xz 20236
+```
+
+### `dpkg` source package: `unminimize=0.2.1`
+
+Binary Packages:
+
+- `unminimize:riscv64=0.2.1`
+
+Licenses: (parsed from: `/usr/share/doc/unminimize/copyright`)
+
+- `GPL-2`
+- `GPL-2.0+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris unminimize=0.2.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/u/unminimize/unminimize_0.2.1.tar.xz' unminimize_0.2.1.tar.xz 9400
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/u/unminimize/unminimize_0.2.1.dsc' unminimize_0.2.1.dsc 1554
+```
+
+### `dpkg` source package: `util-linux=2.39.3-9ubuntu6.5`
+
+Binary Packages:
+
+- `bsdutils:riscv64=1:2.39.3-9ubuntu6.5`
+- `libblkid1:riscv64=2.39.3-9ubuntu6.5`
+- `libmount1:riscv64=2.39.3-9ubuntu6.5`
+- `libsmartcols1:riscv64=2.39.3-9ubuntu6.5`
+- `libuuid1:riscv64=2.39.3-9ubuntu6.5`
+- `mount:riscv64=2.39.3-9ubuntu6.5`
+- `util-linux:riscv64=2.39.3-9ubuntu6.5`
+
+Licenses: (parsed from: `/usr/share/doc/bsdutils/copyright`, `/usr/share/doc/libblkid1/copyright`, `/usr/share/doc/libmount1/copyright`, `/usr/share/doc/libsmartcols1/copyright`, `/usr/share/doc/libuuid1/copyright`, `/usr/share/doc/mount/copyright`, `/usr/share/doc/util-linux/copyright`)
+
+- `BSD-3-clause`
+- `BSD-4-clause`
+- `BSLA`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3`
+- `GPL-3+`
+- `LGPL`
+- `LGPL-2`
+- `LGPL-2+`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+- `LGPL-3`
+- `LGPL-3+`
+- `MIT`
+- `public-domain`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris util-linux=2.39.3-9ubuntu6.5
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/u/util-linux/util-linux_2.39.3.orig.tar.xz' util-linux_2.39.3.orig.tar.xz 8526168
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/u/util-linux/util-linux_2.39.3-9ubuntu6.5.debian.tar.xz' util-linux_2.39.3-9ubuntu6.5.debian.tar.xz 148016
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/u/util-linux/util-linux_2.39.3-9ubuntu6.5.dsc' util-linux_2.39.3-9ubuntu6.5.dsc 4726
+```
+
+### `dpkg` source package: `xxhash=0.8.2-2build1`
+
+Binary Packages:
+
+- `libxxhash0:riscv64=0.8.2-2build1`
+
+Licenses: (parsed from: `/usr/share/doc/libxxhash0/copyright`)
+
+- `BSD-2-clause`
+- `GPL-2`
+- `GPL-2+`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris xxhash=0.8.2-2build1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/x/xxhash/xxhash_0.8.2-2build1.dsc' xxhash_0.8.2-2build1.dsc 2076
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/x/xxhash/xxhash_0.8.2.orig.tar.gz' xxhash_0.8.2.orig.tar.gz 1141188
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/x/xxhash/xxhash_0.8.2-2build1.debian.tar.xz' xxhash_0.8.2-2build1.debian.tar.xz 5048
+```
+
+### `dpkg` source package: `xz-utils=5.6.1+really5.4.5-1ubuntu0.2`
+
+Binary Packages:
+
+- `liblzma5:riscv64=5.6.1+really5.4.5-1ubuntu0.2`
+
+Licenses: (parsed from: `/usr/share/doc/liblzma5/copyright`)
+
+- `Autoconf`
+- `GPL-2`
+- `GPL-2+`
+- `GPL-3`
+- `LGPL-2`
+- `LGPL-2.1`
+- `LGPL-2.1+`
+- `PD`
+- `PD-debian`
+- `config-h`
+- `noderivs`
+- `none`
+- `permissive-fsf`
+- `permissive-nowarranty`
+- `probably-PD`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris xz-utils=5.6.1+really5.4.5-1ubuntu0.2
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/x/xz-utils/xz-utils_5.6.1%2breally5.4.5-1ubuntu0.2.dsc' xz-utils_5.6.1+really5.4.5-1ubuntu0.2.dsc 2639
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/x/xz-utils/xz-utils_5.6.1%2breally5.4.5.orig.tar.xz' xz-utils_5.6.1+really5.4.5.orig.tar.xz 1680520
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/x/xz-utils/xz-utils_5.6.1%2breally5.4.5-1ubuntu0.2.debian.tar.xz' xz-utils_5.6.1+really5.4.5-1ubuntu0.2.debian.tar.xz 30776
+```
+
+### `dpkg` source package: `zlib=1:1.3.dfsg-3.1ubuntu2.1`
+
+Binary Packages:
+
+- `zlib1g:riscv64=1:1.3.dfsg-3.1ubuntu2.1`
+
+Licenses: (parsed from: `/usr/share/doc/zlib1g/copyright`)
+
+- `Zlib`
+
+Source:
+
+```console
+$ apt-get -o APT::Architecture=riscv64 -o APT::Architectures=riscv64 --snapshot=20260421T000000Z source -qq --print-uris zlib=1:1.3.dfsg-3.1ubuntu2.1
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/z/zlib/zlib_1.3.dfsg.orig.tar.xz' zlib_1.3.dfsg.orig.tar.xz 1128572
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/z/zlib/zlib_1.3.dfsg-3.1ubuntu2.1.debian.tar.xz' zlib_1.3.dfsg-3.1ubuntu2.1.debian.tar.xz 61028
+'https://snapshot.ubuntu.com/ubuntu/20260421T000000Z/pool/main/z/zlib/zlib_1.3.dfsg-3.1ubuntu2.1.dsc' zlib_1.3.dfsg-3.1ubuntu2.1.dsc 3116
+```
diff --git a/doc/recipes/run-calculator-with-new-drives.lua b/doc/recipes/run-calculator-with-new-drives.lua
new file mode 100644
index 000000000..4d317647c
--- /dev/null
+++ b/doc/recipes/run-calculator-with-new-drives.lua
@@ -0,0 +1,25 @@
+-- Load the Cartesi module (arg[1] = input image filename, arg[2] = output image filename)
+local cartesi = require("cartesi")
+
+-- Instantiate machine from the "calculator-template" template
+local machine = cartesi.machine("calculator-template")
+
+-- Replace the memory range labeled "input", backing it with the file named by arg[1]
+machine:replace_memory_range({
+    label = "input",
+    backing_store = { data_filename = assert(arg[1], "missing input image filename") },
+})
+
+-- Replace the memory range labeled "output", backing it with the file named by arg[2]
+machine:replace_memory_range({
+    label = "output",
+    backing_store = {
+        data_filename = assert(arg[2], "missing output image filename"),
+        shared = true, -- NOTE(review): presumably lets machine writes reach the file itself; confirm
+    },
+})
+
+-- Run machine until it halts or yields manually
+repeat
+    local break_reason = machine:run(math.maxinteger)
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
diff --git a/doc/recipes/run-calculator-with-proof.lua b/doc/recipes/run-calculator-with-proof.lua
new file mode 100644
index 000000000..7205cb78c
--- /dev/null
+++ b/doc/recipes/run-calculator-with-proof.lua
@@ -0,0 +1,32 @@
+-- Load the Cartesi module and the helper submodules used below
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+local hash_tree = require("cartesi.hash-tree")
+
+-- Instantiate machine from the config-calculator configuration module
+local config = require("config-calculator")
+local machine = cartesi.machine(config)
+
+-- Write the command-line arguments, joined by spaces and newline-terminated, at the start of the input NVRAM
+local input_nvram = assert(util.find_drive(config, "nvram", "input"))
+machine:write_memory(input_nvram.start, table.concat(arg, " ") .. "\n")
+
+-- Run machine until it halts or yields manually
+repeat
+    local break_reason = machine:run(math.maxinteger)
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+
+-- Obtain the root hash, then a proof for the output NVRAM range (start, log2_size)
+local output_state_hash = machine:get_root_hash()
+local output_nvram = assert(util.find_drive(config, "nvram", "output"))
+local output_proof = machine:get_proof(output_nvram.start, output_nvram.log2_size)
+
+-- Proof must be a whole-machine proof rooted at the current machine state
+assert(output_proof.log2_root_size == cartesi.HASH_TREE_LOG2_ROOT_SIZE, "proof depth mismatch")
+assert(output_proof.root_hash == output_state_hash, "proof root mismatch")
+
+-- Verify proof; NOTE(review): the result is not checked here, presumably verify_slice raises on failure (confirm)
+hash_tree.verify_slice(output_proof)
+print("\nOutput NVRAM proof accepted!\n")
+
+print((string.unpack("z", machine:read_memory(output_nvram.start, output_nvram.length)))) -- zero-terminated string
diff --git a/doc/recipes/run-calculator.lua b/doc/recipes/run-calculator.lua
new file mode 100644
index 000000000..928b0ec1e
--- /dev/null
+++ b/doc/recipes/run-calculator.lua
@@ -0,0 +1,20 @@
+-- Load the Cartesi module and its util submodule
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+
+-- Instantiate machine from the config-calculator configuration module
+local calculator_config = require("config-calculator")
+local machine = cartesi.machine(calculator_config)
+
+-- Write the command-line arguments, joined by spaces and newline-terminated, at the start of the input NVRAM
+local input_nvram = assert(util.find_drive(calculator_config, "nvram", "input"))
+machine:write_memory(input_nvram.start, table.concat(arg, " ") .. "\n")
+
+-- Run machine until it halts or yields manually
+repeat
+    local break_reason = machine:run(math.maxinteger)
+until break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+
+-- Read the output NVRAM contents and print them up to the first zero byte
+local output_nvram = assert(util.find_drive(calculator_config, "nvram", "output"))
+print((string.unpack("z", machine:read_memory(output_nvram.start, output_nvram.length))))
diff --git a/doc/recipes/run-config-in-chunks-with-progress.lua b/doc/recipes/run-config-in-chunks-with-progress.lua
new file mode 100644
index 000000000..4b9889659
--- /dev/null
+++ b/doc/recipes/run-config-in-chunks-with-progress.lua
@@ -0,0 +1,35 @@
+-- Bring the Cartesi Machine bindings into scope
+local cartesi = require("cartesi")
+
+-- printf-style helper that writes to stderr
+local function stderr(fmt, ...)
+    local text = string.format(fmt, ...)
+    io.stderr:write(text)
+end
+
+-- Build the machine from the configuration module named by the first argument
+-- (the extra parentheses keep only require's first result)
+local machine = cartesi.machine((require(arg[1])))
+
+local CHUNK = 1000000 -- 1 million cycles
+local max_mcycle = CHUNK
+-- Run in time slices until the machine halts or yields manual
+local reason
+repeat
+    -- Resume execution with max_mcycle as the target cycle
+    reason = machine:run(max_mcycle)
+    if reason == cartesi.BREAK_REASON_YIELDED_AUTOMATICALLY then
+        -- An automatic yield is a progress report only when the HTIF reason says so
+        if machine:read_reg("htif_tohost_reason") == cartesi.HTIF_YIELD_AUTOMATIC_REASON_PROGRESS then
+            local permil = machine:read_reg("htif_tohost_data")
+            -- Show it as a percentage; the carriage return keeps the feedback on one line
+            stderr("Progress: %6.2f\r", permil / 10)
+        end
+    elseif reason == cartesi.BREAK_REASON_REACHED_TARGET_MCYCLE then
+        -- The time slice was used up: extend the target by another CHUNK
+        -- (other tasks could be performed here)
+        max_mcycle = max_mcycle + CHUNK
+    end
+until reason == cartesi.BREAK_REASON_HALTED or reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+-- Machine is now halted or yielded manual
+stderr("\nCycles: %u\n", machine:read_reg("mcycle"))
diff --git a/doc/recipes/run-config-in-chunks.lua b/doc/recipes/run-config-in-chunks.lua
new file mode 100644
index 000000000..509000f21
--- /dev/null
+++ b/doc/recipes/run-config-in-chunks.lua
@@ -0,0 +1,23 @@
+-- Bring the Cartesi Machine bindings into scope
+local cartesi = require("cartesi")
+
+-- printf-style helper that writes to stderr
+local function stderr(fmt, ...)
+    local text = string.format(fmt, ...)
+    io.stderr:write(text)
+end
+
+-- Build the machine from the configuration module named by the first argument
+-- (the extra parentheses keep only require's first result)
+local machine = cartesi.machine((require(arg[1])))
+
+local CHUNK = 1000000 -- 1 million cycles
+-- Count how many time slices it takes until the machine halts or yields manual
+local chunks, reason = 0, nil
+repeat
+    -- Each slice targets CHUNK cycles past the current mcycle; other tasks could run in between
+    local target = machine:read_reg("mcycle") + CHUNK
+    reason = machine:run(target)
+    chunks = chunks + 1
+until reason == cartesi.BREAK_REASON_HALTED or reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+stderr("%u chunks\n", chunks) -- report the number of slices executed
diff --git a/doc/recipes/run-config-with-hashes.lua b/doc/recipes/run-config-with-hashes.lua
new file mode 100644
index 000000000..2d225e690
--- /dev/null
+++ b/doc/recipes/run-config-with-hashes.lua
@@ -0,0 +1,38 @@
+-- Bring the Cartesi Machine bindings into scope
+local cartesi = require("cartesi")
+
+-- printf-style helper that writes to stderr
+local function stderr(fmt, ...)
+    local text = string.format(fmt, ...)
+    io.stderr:write(text)
+end
+
+-- Renders a binary hash as lowercase hexadecimal, two digits per byte
+local function hexhash(hash)
+    local digits = {}
+    for i = 1, #hash do
+        digits[i] = string.format("%02x", string.byte(hash, i))
+    end
+    return table.concat(digits)
+end
+
+-- Build the machine from the configuration module named by the first argument
+-- (the extra parentheses keep only require's first result)
+local machine = cartesi.machine((require(arg[1])))
+
+-- Reports "<mcycle>: <root hash in hex>" for the machine's current state
+local function report_root_hash()
+    stderr("%u: %s\n", machine:read_reg("mcycle"), hexhash(machine:get_root_hash()))
+end
+report_root_hash() -- initial cycle count and root hash
+
+-- Keep resuming the machine; only a halt or a manual yield ends the loop
+local reason
+repeat
+    reason = machine:run(math.maxinteger)
+until reason == cartesi.BREAK_REASON_HALTED or reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+
+-- Say which of the two end conditions was hit, then the cycle count
+stderr(reason == cartesi.BREAK_REASON_HALTED and "\nHalted\n" or "\nYielded manual\n")
+stderr("Cycles: %u\n", machine:read_reg("mcycle"))
+report_root_hash() -- final cycle count and root hash
diff --git a/doc/recipes/run-config.lua b/doc/recipes/run-config.lua
new file mode 100644
index 000000000..e65eb8ba2
--- /dev/null
+++ b/doc/recipes/run-config.lua
@@ -0,0 +1,11 @@
+-- Bring the Cartesi Machine bindings into scope
+local cartesi = require("cartesi")
+
+-- Build the machine from the configuration module named by the first argument
+-- (the extra parentheses keep only require's first result)
+local machine = cartesi.machine((require(arg[1])))
+
+-- Keep resuming the machine; only a halt or a manual yield ends the loop
+local reason
+repeat reason = machine:run(math.maxinteger)
+until reason == cartesi.BREAK_REASON_HALTED or reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
diff --git a/doc/recipes/run-remote-config.lua b/doc/recipes/run-remote-config.lua
new file mode 100644
index 000000000..914b8817e
--- /dev/null
+++ b/doc/recipes/run-remote-config.lua
@@ -0,0 +1,34 @@
+-- Load the JSON-RPC submodule for remote Cartesi Machines
+local cartesi_jsonrpc = require("cartesi.jsonrpc")
+
+-- Writes formatted text to stderr
+local function stderr(fmt, ...)
+    io.stderr:write(string.format(fmt, ...))
+end
+
+-- Check both arguments, then connect to the remote server (shut it down automatically on exit)
+local remote_address = assert(arg[1], "missing remote address")
+local config_name = assert(arg[2], "missing configuration module name")
+stderr("Connecting to remote cartesi machine at '%s'\n", remote_address)
+local cartesi_jsonrpc_machine <close> =
+    assert(cartesi_jsonrpc.connect_server(remote_address)):set_cleanup_call(cartesi_jsonrpc.SHUTDOWN)
+
+-- Print server version (and test connection)
+local v = assert(cartesi_jsonrpc_machine:get_server_version())
+stderr("Connected: remote version is %d.%d.%d\n", v.major, v.minor, v.patch)
+
+-- Instantiate remote machine from configuration (parentheses keep only require's first result)
+local machine = cartesi_jsonrpc_machine((require(config_name)))
+
+-- Run machine until it halts (iflags_H set) or yields manual (iflags_Y set)
+while machine:read_reg("iflags_H") == 0 and machine:read_reg("iflags_Y") == 0 do
+    machine:run(math.maxinteger)
+end
+
+-- Print machine status and cycle count
+if machine:read_reg("iflags_H") ~= 0 then
+    stderr("\nHalted\n")
+else
+    stderr("\nYielded manual\n")
+end
+stderr("Cycles: %u\n", machine:read_reg("mcycle"))
diff --git a/doc/recipes/run-rolling-calculator-output-proofs.lua b/doc/recipes/run-rolling-calculator-output-proofs.lua
new file mode 100644
index 000000000..c7e257063
--- /dev/null
+++ b/doc/recipes/run-rolling-calculator-output-proofs.lua
@@ -0,0 +1,162 @@
+-- Load the Cartesi module, its JSON-RPC submodule, the EVM ABI helpers, the utilities, and the hash-tree helpers
+local cartesi = require("cartesi")
+local cartesi_jsonrpc = require("cartesi.jsonrpc")
+local evmu = require("cartesi.evmu")
+local util = require("cartesi.util")
+local hash_tree = require("cartesi.hash-tree")
+
+local EVM_ADVANCE = "EvmAdvance(uint256 chain_id, address app_contract, address msg_sender, "
+    .. "uint256 block_number, uint256 block_timestamp, uint256 prev_randao, uint256 index, bytes payload)"
+local NOTICE = "Notice(bytes payload)"
+local ZERO_ADDRESS = "0x0000000000000000000000000000000000000000"
+
+local function stderr(fmt, ...) -- printf-style helper that writes to stderr
+    local text = string.format(fmt, ...)
+    io.stderr:write(text)
+end
+
+-- Wraps a raw expression (plus the trailing newline bc needs) in an EvmAdvance request payload
+local function encode_advance(expr, index)
+    local uint = evmu.bint.new
+    local request = {
+        chain_id = uint(0),
+        app_contract = ZERO_ADDRESS,
+        msg_sender = ZERO_ADDRESS,
+        block_number = uint(0),
+        block_timestamp = uint(os.time()), -- current time, so the encoding varies between runs
+        prev_randao = uint(0),
+        index = uint(index),
+        payload = evmu.raw(expr .. "\n"),
+    }
+    return evmu.encode_calldata(EVM_ADVANCE, request)
+end
+
+-- Prints s in consecutive pieces of at most w characters, one piece per line
+local function fold(s, w)
+    for first = 1, #s, w do
+        print(string.sub(s, first, first + w - 1))
+    end
+end
+
+local function print_decoded_notice(data) -- prints a Notice's raw payload, folded at 68 columns
+    local notice = evmu.decode_calldata(NOTICE, data, "raw")
+    fold(notice.payload, 68)
+end
+
+-- Writes the proof to the file called `name` as a Lua chunk of the form "return <dumped table>"
+local function save_proof(proof, name)
+    local out <close> = assert(io.open(name, "w")) -- to-be-closed: released when the function exits
+    out:write("return ")
+    util.dump_table(proof, out)
+    out:write("\n")
+    stderr("saved %s\n", name) -- announced while the file is still open
+end
+
+-- Connect to remote Cartesi Machine server (and shut it down on exit)
+local remote_address = assert(arg[1], "missing remote address") -- first command-line argument
+stderr("Connecting to remote cartesi machine at '%s'\n", remote_address)
+local cartesi_jsonrpc_machine <close> = -- to-be-closed variable carrying the SHUTDOWN cleanup call
+    assert(cartesi_jsonrpc.connect_server(remote_address)):set_cleanup_call(cartesi_jsonrpc.SHUTDOWN)
+
+-- Print server version (and test connection)
+local v = assert(cartesi_jsonrpc_machine:get_server_version())
+stderr("Connected: remote version is %d.%d.%d\n", v.major, v.minor, v.patch)
+
+-- Load remote machine from the rolling-calculator template
+local machine = cartesi_jsonrpc_machine("rolling-calculator-template")
+
+-- Snapshot via fork: the backup server keeps the pre-input state
+local backup -- forked server taken by snapshot(), or nil when no snapshot is pending
+local function snapshot()
+    backup = machine:fork_server()
+end
+local function commit() -- keep the current state: the snapshot, if any, is shut down and forgotten
+    if backup then
+        backup:shutdown_server()
+    end
+    backup = nil
+end
+local function rollback() -- return to the snapshot; fails if none is pending
+    assert(backup, "no snapshot to rollback to")
+    local address = machine:get_server_address() -- remembered for the rebind below
+    machine:shutdown_server()
+    machine:swap(backup) -- NOTE(review): presumably makes `machine` refer to the backup server; confirm
+    machine:rebind_server(address)
+    backup = nil
+end
+
+-- Seed frontier builds the end-of-epoch proofs, a running copy checks each input's root
+local seed_frontier = hash_tree.frontier(cartesi.CMIO_LOG2_MAX_OUTPUT_COUNT)
+local running_frontier = hash_tree.frontier_copy(seed_frontier)
+local output_hashes = {} -- keccak256 leaf of every accepted output, in order
+local output_inputs = {} -- the input index each accepted output came from
+local pending_outputs = {} -- outputs of the current input, buffered until its verdict is known
+
+-- On accept, fold the input's outputs into the tree and save its tx-buffer root-hash proof
+local function flush_accepted(input_index, root_hash) -- root_hash: the data received with the accept yield
+    for _, output in ipairs(pending_outputs) do
+        local leaf = cartesi.keccak256(output)
+        output_hashes[#output_hashes + 1] = leaf
+        output_inputs[#output_inputs + 1] = input_index -- kept parallel to output_hashes
+        hash_tree.frontier_push_back(running_frontier, leaf)
+    end
+    pending_outputs = {} -- start an empty buffer for the next input
+    assert(#root_hash == cartesi.HASH_SIZE, "expected output hashes root hash in tx buffer")
+    assert(hash_tree.frontier_get_root_hash(running_frontier) == root_hash, "output hashes root hash mismatch")
+    local proof = machine:get_proof(cartesi.AR_CMIO_TX_BUFFER_START, cartesi.HASH_TREE_LOG2_WORD_SIZE)
+    assert(proof.root_hash == machine:get_root_hash(), "proof root mismatch") -- rooted at the current state
+    assert(proof.target_hash == cartesi.keccak256(root_hash), "tx buffer does not hold the output hashes root hash")
+    hash_tree.verify_slice(proof)
+    save_proof(proof, string.format("input-%d-output-hashes-root-hash-proof.lua", input_index))
+end
+
+-- Run the machine until it halts or stdin closes
+local i = 0 -- index of the most recent input sent (0 until the first one)
+repeat
+    local break_reason = machine:run(math.maxinteger)
+    if break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY then
+        local _, yield_reason, data = machine:receive_cmio_request()
+        if yield_reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED then
+            local input_accepted = backup ~= nil -- no snapshot is pending at startup or after a rollback
+            commit()
+            if input_accepted then -- close the accepted input out before feeding the next one
+                flush_accepted(i, data)
+            end
+            stderr("type expression\n")
+            local expr = io.read()
+            if not expr then
+                break -- stdin closed: stop feeding inputs
+            end
+            stderr("%s\n", expr) -- echo the input so non-tty transcripts make sense
+            i = i + 1
+            snapshot() -- fork before sending the input, so a rejection can be rolled back
+            machine:send_cmio_response(
+                machine:get_root_hash(),
+                cartesi.HTIF_YIELD_REASON_ADVANCE_STATE,
+                encode_advance(expr, i)
+            )
+        elseif i > 0 and yield_reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED then
+            stderr("input rejected\n")
+            pending_outputs = {} -- discard the rejected input's outputs; the tree is left untouched
+            rollback()
+        else
+            stderr("machine initialization failed\n")
+            break
+        end
+    elseif break_reason == cartesi.BREAK_REASON_YIELDED_AUTOMATICALLY then
+        local _, yield_reason, data = machine:receive_cmio_request()
+        if yield_reason == cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT then
+            pending_outputs[#pending_outputs + 1] = data -- buffer until the input's verdict is known
+            stderr("result is\n")
+            print_decoded_notice(data)
+        end
+    end
+until break_reason == cartesi.BREAK_REASON_HALTED
+commit() -- shut down any snapshot still pending when the loop ended
+
+-- Derive one proof per accepted output from the seed frontier, then verify and save each against the final root
+for k, proof in ipairs(hash_tree.frontier_next_proofs(seed_frontier, output_hashes)) do
+    hash_tree.verify_slice(proof)
+    local name = string.format("output-%d-input-%d-proof.lua", proof.target_address, output_inputs[k])
+    save_proof(proof, name)
+end
diff --git a/doc/recipes/run-rolling-calculator.lua b/doc/recipes/run-rolling-calculator.lua
new file mode 100644
index 000000000..7a2b5abf5
--- /dev/null
+++ b/doc/recipes/run-rolling-calculator.lua
@@ -0,0 +1,113 @@
+-- Load the Cartesi module, its JSON-RPC submodule, and the EVM ABI helpers
+local cartesi = require("cartesi")
+local cartesi_jsonrpc = require("cartesi.jsonrpc")
+local evmu = require("cartesi.evmu")
+
+local EVM_ADVANCE = "EvmAdvance(uint256 chain_id, address app_contract, address msg_sender, "
+    .. "uint256 block_number, uint256 block_timestamp, uint256 prev_randao, uint256 index, bytes payload)"
+local NOTICE = "Notice(bytes payload)"
+local ZERO_ADDRESS = "0x0000000000000000000000000000000000000000"
+
+local function stderr(fmt, ...) -- printf-style helper that writes to stderr
+    local text = string.format(fmt, ...)
+    io.stderr:write(text)
+end
+
+-- Wraps a raw expression (plus the trailing newline bc needs) in an EvmAdvance request payload
+local function encode_advance(expr, index)
+    local uint = evmu.bint.new
+    local request = {
+        chain_id = uint(0),
+        app_contract = ZERO_ADDRESS,
+        msg_sender = ZERO_ADDRESS,
+        block_number = uint(0),
+        block_timestamp = uint(os.time()), -- current time, so the encoding varies between runs
+        prev_randao = uint(0),
+        index = uint(index),
+        payload = evmu.raw(expr .. "\n"),
+    }
+    return evmu.encode_calldata(EVM_ADVANCE, request)
+end
+
+-- Prints s in consecutive pieces of at most w characters, one piece per line
+local function fold(s, w)
+    for first = 1, #s, w do
+        print(string.sub(s, first, first + w - 1))
+    end
+end
+
+local function print_decoded_notice(data) -- prints a Notice's raw payload, folded at 68 columns
+    local notice = evmu.decode_calldata(NOTICE, data, "raw")
+    fold(notice.payload, 68)
+end
+
+-- Connect to remote Cartesi Machine server (and shut it down on exit)
+local remote_address = assert(arg[1], "missing remote address") -- first command-line argument
+stderr("Connecting to remote cartesi machine at '%s'\n", remote_address)
+local cartesi_jsonrpc_machine <close> = -- to-be-closed variable carrying the SHUTDOWN cleanup call
+    assert(cartesi_jsonrpc.connect_server(remote_address)):set_cleanup_call(cartesi_jsonrpc.SHUTDOWN)
+
+-- Print server version (and test connection)
+local v = assert(cartesi_jsonrpc_machine:get_server_version())
+stderr("Connected: remote version is %d.%d.%d\n", v.major, v.minor, v.patch)
+
+-- Load remote machine from the rolling-calculator template
+local machine = cartesi_jsonrpc_machine("rolling-calculator-template")
+
+-- Snapshot via fork: the backup server keeps the pre-input state
+local backup -- forked server taken by snapshot(), or nil when no snapshot is pending
+local function snapshot()
+    backup = machine:fork_server()
+end
+local function commit() -- keep the current state: the snapshot, if any, is shut down and forgotten
+    if backup then
+        backup:shutdown_server()
+    end
+    backup = nil
+end
+local function rollback() -- return to the snapshot; fails if none is pending
+    assert(backup, "no snapshot to rollback to")
+    local address = machine:get_server_address() -- remembered for the rebind below
+    machine:shutdown_server()
+    machine:swap(backup) -- NOTE(review): presumably makes `machine` refer to the backup server; confirm
+    machine:rebind_server(address)
+    backup = nil
+end
+
+-- Run the machine until it halts or stdin closes
+local i = 0 -- index of the most recent input sent (0 until the first one)
+repeat
+    local break_reason = machine:run(math.maxinteger)
+    if break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY then
+        local _, yield_reason = machine:receive_cmio_request()
+        if yield_reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED then
+            commit() -- drop the pending snapshot, if any: the state reached here is kept
+            stderr("type expression\n")
+            local expr = io.read()
+            if not expr then
+                break -- stdin closed: stop feeding inputs
+            end
+            stderr("%s\n", expr) -- echo the input so non-tty transcripts make sense
+            i = i + 1
+            snapshot() -- fork before sending the input, so a rejection can be rolled back
+            machine:send_cmio_response(
+                machine:get_root_hash(),
+                cartesi.HTIF_YIELD_REASON_ADVANCE_STATE,
+                encode_advance(expr, i)
+            )
+        elseif i > 0 and yield_reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED then
+            stderr("input rejected\n")
+            rollback() -- restore the pre-input state
+        else -- any other manual yield, including a rejection before any input was sent
+            stderr("machine initialization failed\n")
+            break
+        end
+    elseif break_reason == cartesi.BREAK_REASON_YIELDED_AUTOMATICALLY then
+        local _, yield_reason, data = machine:receive_cmio_request()
+        if yield_reason == cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT then
+            stderr("result is\n")
+            print_decoded_notice(data)
+        end
+    end
+until break_reason == cartesi.BREAK_REASON_HALTED
+commit() -- shut down any snapshot still pending when the loop ended
diff --git a/doc/recipes/slice-calculator-output.lua b/doc/recipes/slice-calculator-output.lua
new file mode 100644
index 000000000..4d80d0071
--- /dev/null
+++ b/doc/recipes/slice-calculator-output.lua
@@ -0,0 +1,41 @@
+-- Pull in the Cartesi Machine bindings, the drive-lookup helper, and the hash-tree helpers
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+local hash_tree = require("cartesi.hash-tree")
+
+-- The expression to evaluate is the first command-line argument
+local input_expr = assert(arg[1], "missing input expression")
+
+-- Part 1: compute the result and the final state hash by actually running the machine
+
+-- Load machine from template, with its console output sent to the "to_null" destination
+local quiet = { console = { output_destination = "to_null" } }
+local machine = cartesi.machine("calculator-template", quiet)
+local config = machine:get_initial_config()
+
+-- Place the newline-terminated expression at the start of the input NVRAM
+machine:write_memory(assert(util.find_drive(config, "nvram", "input")).start, input_expr .. "\n")
+
+-- Keep resuming the machine; only a halt or a manual yield ends the loop
+local reason
+repeat
+    reason = machine:run(math.maxinteger)
+until reason == cartesi.BREAK_REASON_HALTED or reason == cartesi.BREAK_REASON_YIELDED_MANUALLY
+
+-- Read the zero-terminated result from the output NVRAM and record the final root hash
+local output_nvram = assert(util.find_drive(config, "nvram", "output"))
+local result = string.unpack("z", machine:read_memory(output_nvram.start, output_nvram.length))
+local halted_state_hash = machine:get_root_hash()
+
+-- Part 2: verify the result against the output proof
+
+-- Load output proof (must be a whole-machine proof)
+local output_proof = require("output-proof")
+assert(output_proof.log2_root_size == cartesi.HASH_TREE_LOG2_ROOT_SIZE, "proof depth mismatch")
+
+-- Rebuild the output NVRAM's root hash from the result string alone, then check that
+-- splicing it into the proof reproduces the agreed machine hash
+local output_hash = hash_tree.get_root_hash(result, output_nvram.log2_size)
+hash_tree.verify_splice(output_proof, output_hash, halted_state_hash)
+print("Extraction by proof works!")
+print(result)
diff --git a/doc/recipes/splice-calculator-with-new-drive.lua b/doc/recipes/splice-calculator-with-new-drive.lua
new file mode 100644
index 000000000..8093378e5
--- /dev/null
+++ b/doc/recipes/splice-calculator-with-new-drive.lua
@@ -0,0 +1,34 @@
+-- Pull in the Cartesi Machine bindings, the drive-lookup helper, and the hash-tree helpers
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+local hash_tree = require("cartesi.hash-tree")
+
+-- The expression to install is the first command-line argument, stored newline-terminated
+local input_expr = assert(arg[1], "missing input expression")
+local input_data = input_expr .. "\n"
+
+-- Part 1: obtain the instantiated template hash by actually writing the input
+
+-- Load machine from template
+local machine = cartesi.machine("calculator-template")
+
+-- Look up the input NVRAM by its label
+local input_nvram = assert(util.find_drive(machine:get_initial_config(), "nvram", "input"))
+
+-- Write the input data at the start of the input NVRAM...
+machine:write_memory(input_nvram.start, input_data)
+-- ...and take the root hash of the modified machine
+local instantiated_template_hash = machine:get_root_hash()
+
+-- Part 2: verify that hash using the input proof
+
+-- Load input proof (must be a whole-machine proof)
+local template_input_proof = require("pristine-input-proof")
+assert(template_input_proof.log2_root_size == cartesi.HASH_TREE_LOG2_ROOT_SIZE, "proof depth mismatch")
+
+-- Root hash of the new input data, computed for the input NVRAM's log2 size
+local input_hash = hash_tree.get_root_hash(input_data, input_nvram.log2_size)
+
+-- Splicing the new input hash into the proof must reproduce the instantiated template hash
+hash_tree.verify_splice(template_input_proof, input_hash, instantiated_template_hash)
+print("Instantiation by proof works!")
diff --git a/doc/recipes/store-cat-foo-bar.lua b/doc/recipes/store-cat-foo-bar.lua
new file mode 100644
index 000000000..0805897af
--- /dev/null
+++ b/doc/recipes/store-cat-foo-bar.lua
@@ -0,0 +1,9 @@
+-- Bring the Cartesi Machine bindings into scope
+local cartesi = require("cartesi")
+
+-- Build the machine described by the "config-cat-foo-bar" configuration module
+-- (the extra parentheses keep only require's first result)
+local machine = cartesi.machine((require("config-cat-foo-bar")))
+
+-- Store the machine's persistent state to the "cat-foo-bar" directory
+machine:store("cat-foo-bar")
diff --git a/doc/recipes/third-party/repo-info/Dockerfile.local-dpkg b/doc/recipes/third-party/repo-info/Dockerfile.local-dpkg
new file mode 100644
index 000000000..96dbc2c4c
--- /dev/null
+++ b/doc/recipes/third-party/repo-info/Dockerfile.local-dpkg
@@ -0,0 +1,18 @@
+# Modified from the original Dockerfile.local-dpkg of the third-party repo-info project (see LICENSE in this directory)
+ARG UBUNTU_TAG=24.04
+ARG UBUNTU_DIGEST=sha256:c4a8d5503dfb2a3eb8ab5f807da5bc69a85730fb49b5cfca2330194ebcc41c7b
+FROM ubuntu:${UBUNTU_TAG}@${UBUNTU_DIGEST}
+
+RUN set -eux; \
+	apt-get update; \
+	apt-get install -y --no-install-recommends \
+		ca-certificates \
+		e2fsprogs \
+		gawk \
+		wget \
+	; \
+	rm -rf /var/lib/apt/lists/*
+
+COPY gather-dpkg.sh /usr/local/bin/
+
+CMD ["gather-dpkg.sh"]
diff --git a/doc/recipes/third-party/repo-info/LICENSE b/doc/recipes/third-party/repo-info/LICENSE
new file mode 100644
index 000000000..27448585a
--- /dev/null
+++ b/doc/recipes/third-party/repo-info/LICENSE
@@ -0,0 +1,191 @@
+
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   Copyright 2014 Docker, Inc.
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
diff --git a/doc/recipes/third-party/repo-info/gather-dpkg.sh b/doc/recipes/third-party/repo-info/gather-dpkg.sh
new file mode 100755
index 000000000..ff3c8b02c
--- /dev/null
+++ b/doc/recipes/third-party/repo-info/gather-dpkg.sh
@@ -0,0 +1,231 @@
+#!/bin/bash
+set -e
+
+IFS=$'\n'
+rawPackages=( $(dpkg-query --show --showformat='${db:Status-Abbrev} ${source:Package}=${source:Version} ${binary:Package}=${Version}\n' 2>/dev/null) )
+unset IFS
+
+declare -A packages=()
+for rawPackage in "${rawPackages[@]}"; do
+	rawPackage=( $rawPackage )
+	stat="${rawPackage[0]}"
+	case "$stat" in
+		i?|h?)
+			# "install" or "hold"
+			;;
+		*)
+			# skip "unknown", "remove", "purge"
+			continue
+			;;
+	esac
+	src="${rawPackage[1]}"
+	bin="${rawPackage[2]}"
+	[ -z "${packages[$src]}" ] || packages[$src]+=' '
+	packages[$src]+="$bin"
+done
+
+if [ "${#packages[@]}" -eq 0 ]; then
+	# not Debian-based
+	exit 1
+fi
+
+if [ -z "${DPKG_ARCH:-}" ]; then
+	echo >&2 "error: DPKG_ARCH is not set"
+	exit 1
+fi
+apt_arch_opt=(-o "APT::Architecture=$DPKG_ARCH" -o "APT::Architectures=$DPKG_ARCH")
+
+# resolve package lists against a fixed archive snapshot so the
+# output does not drift as the live archive moves on
+apt_snapshot_opt=()
+if [ -n "${APT_SNAPSHOT:-}" ]; then
+	apt_snapshot_opt=(--snapshot="$APT_SNAPSHOT")
+fi
+
+if [ -e /etc/apt/sources.list ] || [ -d /etc/apt/sources.list.d ]; then
+	# make sure we have "deb-src" entries for "apt-get source"
+	# (deb822 files must not have their lines duplicated; a stanza with
+	# two Types fields makes "apt-get update --snapshot" abort)
+	find /etc/apt/sources.list* \
+		-type f -name '*.sources' \
+		-exec sed -i 's/^Types: deb$/Types: deb deb-src/' '{}' +
+	find /etc/apt/sources.list* \
+		-type f ! -name '*.sources' \
+		-exec sed -i 'p; s/^deb /deb-src /' '{}' +
+
+	# retry a few times if "apt-get update" fails
+	tries=5
+	while ! apt-get "${apt_arch_opt[@]}" update -qq; do
+		(( --tries )) || :
+		if [ "$tries" -le 0 ]; then
+			echo >&2 'error: failed to "apt-get update" after multiple attempts'
+			exit 1
+		fi
+	done
+
+	# switch the package lists to the pinned snapshot; this must come
+	# after a regular update, or apt aborts on deb822 sources that have
+	# multiple suites (assertion failure in debmetaindex.cc)
+	if [ "${#apt_snapshot_opt[@]}" -gt 0 ]; then
+		apt-get "${apt_arch_opt[@]}" "${apt_snapshot_opt[@]}" update -qq
+	fi
+fi
+
+IFS=$'\n'
+sortedSources=( $(echo "${!packages[*]}" | sort) )
+unset IFS
+
+echo
+echo '## `dpkg` (`.deb`-based packages)'
+
+# prints "$2$1$3$1...$N"; the separator is matched literally, even if it holds glob characters
+join() {
+	local sep="$1"; shift
+	local out; printf -v out "${sep//%/%%}%s" "$@"
+	echo "${out#"$sep"}"
+}
+
+for src in "${sortedSources[@]}"; do
+	echo
+	echo '### `dpkg` source package: `'"$src"'`'
+	echo
+	echo 'Binary Packages:'
+	echo
+	for bin in ${packages[$src]}; do
+		echo '- `'"$bin"'`'
+	done
+
+	# parse /usr/share/doc/BIN/copyright
+	licenses=()
+	licenseFiles=()
+	for bin in ${packages[$src]}; do
+		# https://www.debian.org/doc/packaging-manuals/copyright-format/1.0/
+		# http://dep.debian.net/deps/dep5/
+		binPkg="${bin%%=*}"
+		binPkgOnly="${binPkg%%:*}"
+		f=
+		for try in \
+			"/usr/share/doc/$bin/copyright" \
+			"/usr/share/doc/$binPkg/copyright" \
+			"/usr/share/doc/$binPkgOnly/copyright" \
+		; do
+			if [ -f "$try" ]; then
+				f="$try"
+				break
+			fi
+		done
+		if [ -z "$f" ]; then
+			echo >&2
+			echo >&2 "**WARNING:** '/usr/share/doc/$binPkgOnly/copyright' is missing!"
+			echo >&2
+			continue
+		fi
+		IFS=$'\n'
+		licenses+=( $(gawk -F ':[ \t]+' '$1 == "License" && NF > 1 { gsub(/^License:[ \t]+/, ""); print }' "$f") )
+		licenses+=( $(grep -oE '/usr/share/common-licenses/[0-9a-zA-Z_.+-]+' "$f" | cut -d/ -f5-) )
+		unset IFS
+		licenseFiles+=( "$f" )
+	done
+	if [ "${#licenses[@]}" -gt 0 ]; then
+		IFS=$'\n'
+		licenses=( $(
+			echo "${licenses[*]}" \
+				| sed -r \
+					-e 's/ (and|or) /\n/g' \
+					-e 's/[.,]+$//' \
+				| sort -u
+		) )
+		unset IFS
+
+		echo
+		echo 'Licenses: (parsed from: `'"$(join '`, `' "${licenseFiles[@]}")"'`)'
+		echo
+		for lic in "${licenses[@]}"; do
+			echo '- `'"$lic"'`'
+		done
+	else
+		echo
+		echo '**WARNING:** unable to detect licenses! (package likely not compliant with DEP-5)  '
+		echo 'If source is available (seen below), check the contents of `debian/copyright` within it.'
+		echo
+	fi
+
+	sourcesUrl="https://sources.debian.net/src/${src//=//}/"
+	snapshotUrl="http://snapshot.debian.org/package/${src//=//}/"
+
+	# A binary that came from a repository must have a resolvable source. A
+	# binary installed from a local .deb (e.g. machine-guest-tools) has no
+	# archive source, so a missing source is expected only in that case. Tell
+	# the two apart by asking apt whether any of this source's binaries is
+	# available from a repository at all.
+	fromRepo=
+	for bin in ${packages[$src]}; do
+		binPkg="${bin%%=*}"
+		binPkgOnly="${binPkg%%:*}"
+		if [ -n "$(apt-cache "${apt_arch_opt[@]}" madison "$binPkgOnly" 2>/dev/null)" ]; then
+			fromRepo=1
+			break
+		fi
+	done
+
+	aptSourceArgs=( apt-get "${apt_arch_opt[@]}" "${apt_snapshot_opt[@]}" source -qq --print-uris "$src" )
+	aptSource=
+	if [ -n "$fromRepo" ]; then
+		# Repository package: the source must resolve. Retry to ride out
+		# transient archive hiccups, then fail hard rather than emit a report
+		# that silently differs from the committed one. A persistent failure
+		# means the pinned snapshot's source index has not converged for this
+		# version; move the snapshot pin back to a converged date.
+		tries=5
+		while ! aptSource="$("${aptSourceArgs[@]}" 2>/dev/null)" || [ -z "$aptSource" ]; do
+			(( --tries )) || :
+			if [ "$tries" -le 0 ]; then
+				echo >&2 "error: no source for repository package '$src' (snapshot index not converged or archive unreachable)"
+				exit 1
+			fi
+		done
+	fi
+
+	# Normalize the captured source URIs so the report stays byte-stable.
+	# apt prints whichever location currently serves each file. While a
+	# version is still in the pool that is the live mirror with a SHA256
+	# digest, and once it has been superseded it is the pinned snapshot
+	# host with a SHA512 digest. Neither the host nor the digest is needed
+	# to satisfy the source-distribution obligation, and the two digests
+	# cannot be reconciled because they use different algorithms. Rewrite
+	# every URL to the durable snapshot host and drop the digest field so
+	# the output changes only when the committed rootfs or the snapshot pin
+	# does.
+	if [ -n "$aptSource" ]; then
+		sedArgs=( -E -e 's/ [A-Za-z0-9]+:[0-9a-fA-F]+$//' )
+		if [ -n "${APT_SNAPSHOT:-}" ]; then
+			sedArgs+=( -e "s#'[^']*/pool/#'https://snapshot.ubuntu.com/ubuntu/${APT_SNAPSHOT}/pool/#" )
+		fi
+		aptSource="$(printf '%s\n' "$aptSource" | sed "${sedArgs[@]}")"
+	fi
+
+	if [ -n "$aptSource" ]; then
+		echo
+		echo 'Source:'
+		echo
+		echo '```console'
+		echo '$' "${aptSourceArgs[@]}"
+		echo "$aptSource"
+		echo '```'
+		case "$aptSource" in
+			*.debian.org/*)
+				# _probably_ Debian -- let's link to sources.debian.net too
+				echo
+				echo 'Other potentially useful URLs:'
+				echo
+				echo '- '"$sourcesUrl"' (for browsing the source)'
+				echo '- '"$sourcesUrl"'debian/copyright/ (for direct copyright/license information)'
+				echo '- '"$snapshotUrl"' (for access to the source package after it no longer exists in the archive)'
+				;;
+		esac
+	else
+		echo
+		echo '**WARNING:** no archive source (package was installed from a local `.deb`, not a repository).'
+		echo
+	fi
+done
diff --git a/doc/recipes/third-party/repo-info/scan-local.sh b/doc/recipes/third-party/repo-info/scan-local.sh
new file mode 100755
index 000000000..feb85d527
--- /dev/null
+++ b/doc/recipes/third-party/repo-info/scan-local.sh
@@ -0,0 +1,60 @@
+#!/bin/bash
+# Modified from the original
+set -e
+
+trap 'echo >&2 Ctrl+C captured, exiting; exit 1' SIGINT
+
+image="$1"; shift
+platform="$1"; shift
+arch="${platform##*/}"
+
+docker buildx build --load --pull -t repo-info:local-dpkg -f Dockerfile.local-dpkg . 1>&2
+
+name="repo-info-local-$$-$RANDOM"
+trap "docker rm -vf '$name-data' > /dev/null || :" EXIT
+
+docker create \
+    --platform $platform \
+	--name "$name-data" \
+	-v /etc \
+	-v /lib/apk \
+	-v /usr/lib/rpm \
+	-v /usr/share/apk \
+	-v /usr/share/doc \
+	-v /var/lib \
+	"$image" \
+	bogus > /dev/null
+
+echo '# `'"$image"'`'
+
+size="$(
+	docker inspect -f '{{ .Size }}' "$image" 2>/dev/null | awk '{
+		oneKb = 1000;
+		oneMb = 1000 * oneKb;
+		oneGb = 1000 * oneMb;
+		if ($1 >= oneGb) {
+			printf "~ %.2f Gb", $1 / oneGb
+		} else if ($1 >= oneMb) {
+			printf "~ %.2f Mb", $1 / oneMb
+		} else if ($1 >= oneKb) {
+			printf "~ %.2f Kb", $1 / oneKb
+		} else {
+			printf "%d bytes", $1
+		}
+	}'
+)"
+
+docker inspect -f '
+## Docker Metadata
+
+- Image ID: `{{ .Id }}`
+- Created: `{{ .Created }}`
+- Virtual Size: '"$size"'
+  (total size of all layers on-disk)
+- Arch: `{{ .Os }}`/`{{ .Architecture }}`
+{{ if .Config.Entrypoint }}- Entrypoint: `{{ json .Config.Entrypoint }}`
+{{ end }}{{ if .Config.Cmd }}- Command: `{{ json .Config.Cmd }}`
+{{ end }}- Environment:{{ range .Config.Env }}{{ "\n" }}  - `{{ . }}`{{ end }}{{ if .Config.Labels }}
+- Labels:{{ range $k, $v := .Config.Labels }}{{ "\n" }}  - `{{ $k }}={{ $v }}`{{ end }}{{ end }}' "$image" 2>/dev/null || :
+
+docker run --rm --volumes-from "$name-data" -v /etc/ssl -e DPKG_ARCH="$arch" -e APT_SNAPSHOT repo-info:local-dpkg
diff --git a/doc/recipes/trunc8.sh b/doc/recipes/trunc8.sh
new file mode 100755
index 000000000..88ee66124
--- /dev/null
+++ b/doc/recipes/trunc8.sh
@@ -0,0 +1,2 @@
+#!/bin/bash
+head -c 8 # pass through only the first 8 bytes of stdin
diff --git a/doc/recipes/verification-game.lua b/doc/recipes/verification-game.lua
new file mode 100644
index 000000000..539a42b28
--- /dev/null
+++ b/doc/recipes/verification-game.lua
@@ -0,0 +1,612 @@
+-- A self-contained model of the Cartesi verification game.
+--
+-- A referee, standing in for the blockchain, mediates a dispute between two players, told
+-- apart only by connection order. Each controls its own Cartesi machine and claims a final
+-- state hash for the same computation. One is honest, the other cheats past a chosen point by
+-- switching to a machine that ran a different expression.
+--
+-- All game logic lives in the referee, which never trusts a player. The players are thin and
+-- identical, differing only in the machine they hold, the honest one bare and the dishonest
+-- one a composite that reports a fake machine past the cheat point. Each runs Lua code the
+-- referee sends against its machine and replies. The fork trick lets it answer bisection
+-- queries without re-running from scratch.
+--
+-- Roles, selected by the first argument.
+--   verification-game.lua referee   <address> <expr>
+--   verification-game.lua honest    <address> <expr>
+--   verification-game.lua dishonest <address> <expr> <cheat-mcycle> <cheat-uarch-cycle> <cheat-expr>
+
+local cartesi = require("cartesi")
+local cartesi_jsonrpc = require("cartesi.jsonrpc")
+local util = require("cartesi.util")
+local socket = require("socket")
+local hash_tree = require("cartesi.hash-tree")
+local dishonest = require("dishonest")
+
+local TEMPLATE = "calculator-template"
+
+--------------------------------------------------------------------------------
+-- Small utilities
+--------------------------------------------------------------------------------
+
+-- With VERIFICATION_GAME_TRACE set, every wire message is dumped to stderr, unbuffered so it
+-- survives a redirect. The referee runs with it on, the players with it off, so an empty
+-- player transcript also confirms a clean run.
+io.stderr:setvbuf("no")
+local tracing = os.getenv("VERIFICATION_GAME_TRACE") ~= nil
+local function trace_wire(player, direction, line)
+    if not tracing then return end
+    local who = player.index or "?"
+    io.stderr:write(("%s player %s: %s\n"):format(direction, who, line))
+end
+
+-- The referee narrates the game, kept apart from the wire trace on stderr so the run reads as a
+-- story whether or not tracing is on. A hash is shown by its first four bytes.
+local function short_hash(hash)
+    return string.format("0x%s...", string.sub(util.hexhash(hash), 1, 8))
+end
+
+-- The narration is split into phases, each written to its own file so the rendered walkthrough can
+-- print a short phase whole and reduce a long bisection to its first and last few lines. phase()
+-- opens the file the following eventf() lines go to, closing the previous one. Before the first
+-- phase() the narration goes to stdout. Once a phase file is open eventf() echoes to stdout as
+-- well, so a live run still shows the story even though its lines are being filed away.
+local narration = io.stdout
+local function phase(filename)
+    local previous = narration
+    -- Never close stdout, only a phase file opened by an earlier call.
+    if previous ~= io.stdout then previous:close() end
+    narration = assert(io.open(filename, "w"))
+end
+
+local function eventf(fmt, ...)
+    local text = fmt:format(...) .. "\n"
+    narration:write(text)
+    -- Echo to stdout as well while a phase file is capturing the narration.
+    if narration == io.stdout then return end
+    io.stdout:write(text)
+end
+
+--------------------------------------------------------------------------------
+-- Wire protocol
+--
+-- Each message is one line, the compact JSON of a Lua value by cartesi.tojson plus a newline.
+-- Binary values do not survive plain JSON, so each reply carries a schema, named by the
+-- referee, that tags its binary and compound fields. tojson then encodes hashes as Base64 and
+-- embeds proofs and access logs as nested objects, and fromjson decodes them back. The schema
+-- dictionary below, referencing the built-in Proof and AccessLog, is passed to both.
+--------------------------------------------------------------------------------
+
+local SCHEMA_DICT = {
+    -- A value at a proof's target and the proof itself, used for the winner's output drive.
+    StateValueProof = {
+        target_value = "Base64",
+        proof = "Proof",
+    },
+    -- The claimed final state hash a player posts at the start.
+    FinalHashCommitment = "Base64",
+    -- A single bisection round's reply, the root hash at the mid cycle.
+    BisectionCommitment = "Base64",
+    -- The disputed step's access log. Step or reset is decided by the cycle the referee names,
+    -- not carried in the message.
+    LogCommitment = "AccessLog",
+}
+
+-- Serializes `value` to compact JSON under `schema` and writes it as one newline-terminated line.
+-- Hands back the socket's own result (truthy on success, nil plus an error once closed) so the caller decides if a failed send is fatal.
+local function send(player, value, schema)
+    local payload = cartesi.tojson(value, -1, schema, SCHEMA_DICT)
+    trace_wire(player, "to", payload)
+    return player.connection:send(payload .. "\n")
+end
+
+-- Reads and decodes one full line from a player, blocking until it is in and resuming from any
+-- partial parked on the player. Lines the player still owes as drops (replies to superseded
+-- requests) are discarded. On the awaited reply the player's in-flight request is cleared.
+local function receive(player, schema)
+    local conn = player.connection
+    conn:settimeout(nil)
+    local line
+    repeat
+        line = assert(conn:receive("*l", player.partial))
+        trace_wire(player, "from", line)
+        player.partial = nil
+        local owed = player.stale_requests_pending
+        if owed > 0 then player.stale_requests_pending = owed - 1 end
+    until owed <= 0
+    player.last_request_code, player.last_request_schema = nil, nil
+    return cartesi.fromjson(line, schema, SCHEMA_DICT)
+end
+
+-- Reads a line from whichever connection completes one first, never blocking on a single one.
+-- players.index_of links a ready connection to its player, whose partial collects bytes until a line
+-- completes. A line owed as a drop is discarded, else the request is cleared and player and reply
+-- returned. A closed connection leaves conns by identity, not player.index; with none left, raises.
+local function receive_any(players, conns, schema)
+    for _, conn in ipairs(conns) do conn:settimeout(0) end
+    while true do
+        assert(#conns > 0, "every player connection closed before a reply arrived")
+        for _, conn in ipairs(socket.select(conns, nil)) do
+            local player = players[players.index_of[conn]]
+            local line, status, partial = conn:receive("*l", player.partial)
+            if line then
+                trace_wire(player, "from", line)
+                if player.stale_requests_pending > 0 then
+                    player.stale_requests_pending, player.partial = player.stale_requests_pending - 1, nil
+                else
+                    player.last_request_code, player.last_request_schema, player.partial = nil, nil, nil
+                    return player, cartesi.fromjson(line, schema, SCHEMA_DICT)
+                end
+            elseif status == "closed" then
+                player.dead = true
+                for i = #conns, 1, -1 do
+                    if conns[i] == conn then table.remove(conns, i) end
+                end
+            else
+                assert(status == "timeout", status)
+                player.partial = partial
+            end
+        end
+    end
+end
+
+--------------------------------------------------------------------------------
+-- Players
+--
+-- The two players run identical code, differing only in the machine they hold, the honest one
+-- a bare machine and the dishonest one a composite that reports a fake machine past the cheat
+-- point.
+--------------------------------------------------------------------------------
+
+-- Instantiates the calculator template on its own freshly spawned server, with `expr` written
+-- into the input NVRAM.
+local function new_remote_machine(expr)
+    local remote = assert(cartesi_jsonrpc.spawn_server("127.0.0.1:0"))
+    remote:set_cleanup_call(cartesi_jsonrpc.SHUTDOWN)
+    local instance = remote(TEMPLATE)
+    local config = instance:get_initial_config()
+    local input_drive = assert(util.find_drive(config, "nvram", "input"))
+    -- bc reads line by line, so the expression gets a trailing newline; the rest of the NVRAM stays zero.
+    instance:write_memory(input_drive.start, expr .. "\n")
+    return instance
+end
+
+--------------------------------------------------------------------------------
+-- Fork trick
+--
+-- A player holds the agreed lower bound in `agreed_lo_machine` and, while bisecting, a
+-- `tentative_mid_machine` forked from it and advanced to the mid cycle. It never runs backward,
+-- since the referee never bisects below the agreed machine. Each round the referee names the
+-- branch taken at the previous round, so the player promotes the tentative machine on "agree",
+-- discards it on "disagree", and does nothing on "start".
+--------------------------------------------------------------------------------
+
+-- Applies the branch the referee reported for the previous round. "agree" promotes the tentative
+-- machine to the agreed one, "disagree" discards it, "start" has none. A round past the halt is a
+-- fixed point answered without forking, leaving no tentative machine, but that only happens above
+-- the halt where rounds disagree, so "agree" never finds the slot empty. Either way it is cleared.
+local function take_branch(player, branch)
+    local stale, tentative = player.agreed_lo_machine, player.tentative_mid_machine
+    if branch == "agree" then
+        stale:shutdown_server()
+        player.agreed_lo_machine = tentative
+    elseif branch == "disagree" and tentative then
+        tentative:shutdown_server()
+    end
+    player.tentative_mid_machine = nil
+end
+
+-- The operations the referee invokes on a player by name, each taking the player first so a
+-- colon call like player:prove_output() supplies it. They return plain Lua values that the
+-- referee's named schema turns into wire JSON and back. new_player below stores them as player
+-- fields, and the referee's trusted snippets run with the player as their environment, reaching
+-- these by name.
+
+-- The claimed final state. Forks the agreed machine, runs it to halt, and reports its root
+-- hash. At halt it also captures the output into player.output_result (the result string plus
+-- the output drive's subtree proof) so prove_output() answers later without a rerun, and records
+-- the final hash and halting mcycle so rounds past the halt are answered from this fixed point.
+-- It runs at commitment time, when the agreed machine is still the clean mcycle-0 machine.
+local function commit_final_hash(player)
+    local fork = assert(player.agreed_lo_machine:fork_server())
+    local drive = assert(util.find_drive(fork:get_initial_config(), "nvram", "output"))
+    fork:run(math.maxinteger)
+    local raw = fork:read_memory(drive.start, drive.length)
+    local proof = fork:get_proof(drive.start, drive.log2_size)
+    -- "z" keeps the bytes before the first NUL; the parentheses drop unpack's trailing position.
+    player.output_result = { target_value = (string.unpack("z", raw)), proof = proof }
+    player.final_hash = fork:get_root_hash()
+    player.halt_mcycle = fork:read_reg("mcycle")
+    fork:shutdown_server()
+    return player.final_hash
+end
+
+-- One bisection round. After taking the previous branch, the player forks the agreed machine,
+-- advances the fork to the target (an mcycle or uarch_cycle per level), and returns its root
+-- hash. An mcycle round at or past the halting mcycle (compared as unsigned 64-bit, like the
+-- referee's bounds) is a fixed point answered with the cached final hash, no fork at all.
+local function commit_bisection(player, branch, level, target)
+    take_branch(player, branch)
+    if level == "mcycle" and not math.ult(target, player.halt_mcycle) then
+        return player.final_hash
+    end
+    player.tentative_mid_machine = assert(player.agreed_lo_machine:fork_server())
+    if level == "mcycle" then
+        player.tentative_mid_machine:run(target)
+    else
+        player.tentative_mid_machine:run_uarch(target)
+    end
+    return player.tentative_mid_machine:get_root_hash()
+end
+
+-- The terminal round, once bisection has isolated the disputed step. The last branch leaves the
+-- agreed machine at that step, so the player logs the transition out of it. The transition out of
+-- UARCH_CYCLE_MAX-1 is the reset, every other an ordinary step, decided by the cycle the referee
+-- names rather than the machine's own uarch_cycle, which at the reset boundary sits at the halt.
+local function commit_log(player, branch, cycle)
+    take_branch(player, branch)
+    local last_cycle = cartesi.UARCH_CYCLE_MAX - 1
+    if cycle ~= last_cycle then
+        return player.agreed_lo_machine:log_step_uarch()
+    end
+    return player.agreed_lo_machine:log_reset_uarch()
+end
+
+-- Replies with the output cached by commit_final_hash: the result bytes plus the output drive's
+-- subtree proof. Only those bytes travel; the referee pads the rest when it hashes. This is a
+-- player's last act, so it flags itself done and its serve loop exits right after the reply.
+-- send_result_delay is demo ordering, not protocol: it lets the loser's invalid result land first.
+local function prove_output(player)
+    local delay, result = player.send_result_delay, player.output_result
+    socket.sleep(delay)
+    player.done = true
+    return result
+end
+
+-- Connects to the referee and serves its requests, loading each code snippet, running it in the
+-- player's scope, and sending the value back. The last request is always for the result, whose
+-- handler marks the player done, so the loop exits after that reply. Then it shuts down every
+-- machine and fork it still holds.
+local function run(player)
+    local address = assert(arg[2], "missing referee address")
+    local host, port = string.match(address, "^(.-):(%d+)$")
+    player.connection = assert(socket.connect(host, tonumber(port)))
+    while true do
+        local message = receive(player)
+        -- The referee is trusted: its snippet is loaded with the player table as its environment, so
+        -- it reaches the player and its operations by name. It also names the schema for the reply.
+        local snippet = assert(load(message.code, "=referee", "t", player))
+        assert(send(player, snippet(), message.schema))
+        if player.done then break end
+    end
+    player.connection:close()
+    local leftover = player.tentative_mid_machine
+    if leftover then leftover:shutdown_server() end
+    player.agreed_lo_machine:shutdown_server()
+end
+
+-- A player bundles the agreed machine it was handed (bare or the composite), which anchors the
+-- bisection at the lower bound, the tentative machine it forks while bisecting, and the operations
+-- above as fields the referee invokes by name. It also carries a reference to itself under
+-- `player`, since it is the environment the referee's snippets run in.
+local function new_player(machine, send_result_delay)
+    -- tentative_mid_machine starts absent; commit_bisection sets it when a round forks.
+    local self = {
+        agreed_lo_machine = machine,
+        stale_requests_pending = 0,
+        send_result_delay = send_result_delay or 0,
+        commit_final_hash = commit_final_hash,
+        commit_bisection = commit_bisection,
+        commit_log = commit_log,
+        prove_output = prove_output,
+        run = run,
+    }
+    self.player = self
+    return self
+end
+
+--------------------------------------------------------------------------------
+-- Referee
+--------------------------------------------------------------------------------
+
+-- The one place the referee issues a request, used by every wait_for_*. Each player records the
+-- request it is handling, cleared once the reply is read. If it is already handling this exact
+-- request, its in-flight reply answers it and nothing is sent. If it is handling a superseded
+-- one, the new request is sent and the stale reply counted to be dropped. A player handling
+-- nothing is simply asked. A player that has posted its result has exited and closed, so the send
+-- fails; it is marked dead and skipped from then on.
+local function request(player, schema, code)
+    local in_flight_code, in_flight_schema = player.last_request_code, player.last_request_schema
+    local duplicate = in_flight_code == code and in_flight_schema == schema
+    if player.dead or duplicate then
+        return
+    end
+    -- A different request is still unanswered: its reply, when it comes, must be dropped.
+    if in_flight_code ~= nil then
+        player.stale_requests_pending = player.stale_requests_pending + 1
+    end
+    if send(player, { code = code, schema = schema }) then
+        player.last_request_code, player.last_request_schema = code, schema
+    else
+        player.dead = true
+    end
+end
+
+-- Fills the snippet template with its arguments, asks the one player to run it, and blocks
+-- until that player's reply arrives; the reply is encoded and decoded under the named schema.
+local function wait_for_one(player, schema, code, ...)
+    request(player, schema, code:format(...))
+    return receive(player, schema)
+end
+
+-- Broadcasts the request to every player, then collects every reply in completion order through
+-- receive_any, so the players compute in parallel and a slow one never holds up a ready one.
+-- Returns the replies keyed by player index.
+local function wait_for_all(players, schema, code, ...)
+    local snippet, conns, replies = string.format(code, ...), {}, {}
+    for _, player in ipairs(players) do
+        request(player, schema, snippet)
+        table.insert(conns, player.connection)
+    end
+    local outstanding = #conns
+    while outstanding > 0 do
+        local responder, reply = receive_any(players, conns, schema)
+        replies[responder.index], outstanding = reply, outstanding - 1
+    end
+    return replies
+end
+
+-- Broadcasts the request and returns the first reply to arrive, leaving the rest. It shares the
+-- request discipline above and does not judge the reply, the caller does. A player that died
+-- (exited after posting its result) is skipped, so its closed connection is never polled.
+local function wait_for_any(players, schema, code, ...)
+    local snippet, live = string.format(code, ...), {}
+    for _, player in ipairs(players) do
+        -- request() may itself find the player gone, so `dead` is tested only afterwards.
+        request(player, schema, snippet)
+        if not player.dead then
+            table.insert(live, player.connection)
+        end
+    end
+    local reply = select(2, receive_any(players, live, schema))
+    return reply
+end
+
+-- Asks both players for their opening commitment and returns the two, keyed by index.
+local function wait_for_final_hash(players)
+    return wait_for_all(players, "FinalHashCommitment", "return player:commit_final_hash()")
+end
+
+-- Broadcasts one bisection round at `target` on `level`, carrying the branch taken at the
+-- previous round, and returns both players' root hashes there, keyed by player index.
+local function wait_for_bisection(players, branch, level, target)
+    return wait_for_all(
+        players,
+        "BisectionCommitment",
+        "return player:commit_bisection(%q, %q, %d)",
+        branch,
+        level,
+        target
+    )
+end
+
+-- Sends a player the terminal round, naming the agreed uarch cycle so the player logs the
+-- matching transition (a reset out of UARCH_CYCLE_MAX-1, a step otherwise), and waits for the
+-- disputed step's access log.
+local function wait_for_log(player, branch, cycle)
+    return wait_for_one(player, "LogCommitment", "return player:commit_log(%q, %d)", branch, cycle)
+end
+
+-- Asks both players for the result and returns the first output proof to arrive.
+local function wait_for_output(players)
+    return wait_for_any(players, "StateValueProof", "return player:prove_output()")
+end
+
+-- Checks an output submission against a verified final hash. The proof must be whole-machine, the
+-- bytes must hash to the proof's target, the target must sit at the output drive address, and the
+-- proof must roll up to the final hash. Returns whether it holds.
+-- docs:begin verify_output
+local function verify_output(dapp_contract, output, final_hash)
+    local proof, drive = output.proof, dapp_contract.output
+    return proof.root_hash == final_hash
+        and proof.log2_root_size == cartesi.HASH_TREE_LOG2_ROOT_SIZE
+        and proof.target_address == drive.start and proof.log2_target_size == drive.log2_size
+        and hash_tree.get_root_hash(output.target_value, drive.log2_size) == proof.target_hash
+        and pcall(hash_tree.verify_slice, proof)
+end
+-- docs:end verify_output
+
+-- Bisects one level over [0, hi], updating `state` in place. Each round it sends the running
+-- branch and writes back the agreed lower-end hash, player 1's after-hash, the branch, and the
+-- converged lower bound `lo`. Bounds are compared and halved as unsigned 64-bit (math.ult and
+-- >>), so the mcycle level can use the full MCYCLE_MAX ceiling (-1 as a signed Lua integer),
+-- and the small uarch bounds reduce to ordinary arithmetic. Each round is narrated into the
+-- level's own phase file, so the rendered walkthrough can show just its ends.
+-- docs:begin bisect_level
+local function bisect_level(players, level, hi, state)
+    phase("bisect_" .. level)
+    local lo, round = 0, 0
+    -- math.ult and the logical shift treat the bounds as unsigned 64-bit integers.
+    while math.ult(1, hi - lo) do
+        round = round + 1
+        local mid = lo + ((hi - lo) >> 1)
+        local hashes = wait_for_bisection(players, state.branch, level, mid)
+        local agreed = hashes[1] == hashes[2]
+        if agreed then lo, state.last_agreed_hash = mid, hashes[1] end
+        if not agreed then hi, state.hash_after = mid, hashes[1] end
+        state.branch = agreed and "agree" or "disagree"
+        eventf("%s bisection round %d, interval of disagreement is [0x%x, 0x%x]", level, round, lo, hi)
+    end
+    state.lo = lo
+end
+-- docs:end bisect_level
+
+-- Verifies the disputed step's access log on its own, the way a Cartesi contract would on the
+-- blockchain, without ever instantiating a machine. The only transition out of UARCH_CYCLE_MAX-1 is
+-- the terminal reset, every other an ordinary step, so the agreed cycle alone selects
+-- verify_reset_uarch or verify_step_uarch. It passes when the log proves the agreed before-hash
+-- advances to the committed after-hash; pcall turns a rejected log into a false return, not an error.
+-- docs:begin verify_state_transition
+local function verify_state_transition(uarch_cycle, state_hash_before, log, state_hash_after)
+    local verifier, banner
+    if uarch_cycle == cartesi.UARCH_CYCLE_MAX - 1 then
+        verifier, banner = cartesi.machine.verify_reset_uarch, "Verifying uarch reset log!"
+    else
+        verifier, banner = cartesi.machine.verify_step_uarch, "Verifying uarch step log!"
+    end
+    eventf(banner)
+    local pass = pcall(verifier, cartesi.machine, state_hash_before, log, state_hash_after)
+    eventf("Log is %s!", pass and "valid" or "invalid")
+    return pass
+end
+-- docs:end verify_state_transition
+
+-- Drives the interactive dispute and returns the winner. It shrinks the interval of
+-- disagreement, first an mcycle range to the disputed instruction, then a uarch_cycle range to
+-- the disputed step, tracking the agreed lower-end hash and player 1's after-hash in `state`. At
+-- the disputed step it hands player 1's log to verify_state_transition, which checks it standalone
+-- against the agreed before-hash and the committed after-hash. If it proves, player 1 won,
+-- otherwise player 2 is the honest one.
+--
+-- Both levels bisect the emulator's full ceiling. Past its halt a machine is a fixed point, so a
+-- hash asked there just repeats its final hash, and the disagreement still lands on the diverging
+-- cycle wherever each halts.
+--
+-- The converged uarch cycle says whether the disputed transition is a step or the terminal reset,
+-- since the only transition out of UARCH_CYCLE_MAX-1 is the reset. The referee names it to player 1,
+-- which logs the matching transition. Player 2 is not asked, only player 1 is verified.
+-- docs:begin adjudicate_dispute
+local function adjudicate_dispute(players, initial_hash)
+    -- Before any round, the agreed hash is the initial one and the contested one is player 1's claim.
+    local state = { last_agreed_hash = initial_hash, hash_after = players[1].final_hash, branch = "start" }
+
+    -- Two bisections share `state`: first down to one mcycle, then down to one uarch cycle.
+    bisect_level(players, "mcycle", cartesi.MCYCLE_MAX, state)
+    bisect_level(players, "uarch_cycle", cartesi.UARCH_CYCLE_MAX, state)
+
+    -- state.lo is now the converged uarch cycle; only player 1 is asked to back its claim with a log.
+    phase("verdict")
+    local log = wait_for_log(players[1], state.branch, state.lo)
+    eventf("Player 1 posted log")
+
+    -- A log proving last_agreed_hash -> hash_after vindicates player 1; failing that, player 2 wins.
+    local proven = verify_state_transition(state.lo, state.last_agreed_hash, log, state.hash_after)
+    local winner = proven and players[1] or players[2]
+    eventf("Player %d wins! Final state hash is %s.", winner.index, short_hash(winner.final_hash))
+    return winner
+end
+-- docs:end adjudicate_dispute
+
+-- Waits for both players to connect, collects their commitments, and announces them. It binds the
+-- listen address, accepts the two players in turn, numbering them by connection order, and asks both
+-- for their final state hash at once so the run-to-halt commitments overlap. The hash needs no
+-- checking here, since a wrong hash can win neither the dispute nor the output phase.
+local function wait_for_commitments()
+    local address = assert(arg[2], "missing listen address")
+    local host, port = address:match("^(.-):(%d+)$") -- both nil unless the address is host:port
+    local listener = assert(socket.bind(assert(host, "listen address must be host:port"), tonumber(port)))
+    -- The connection-to-index map lets receive_any link each ready connection back to its player.
+    local players = { index_of = {} }
+    for index = 1, 2 do -- players are numbered by the order in which they connect
+        local connection = assert(listener:accept())
+        players[index] = { index = index, connection = connection, stale_requests_pending = 0 }
+        players.index_of[connection] = index
+    end
+    phase("commitments")
+    local commitments = wait_for_final_hash(players) -- indexed by player number
+    for index, player in ipairs(players) do
+        player.final_hash = commitments[index]
+        eventf("Player %d posted final state hash %s.", index, short_hash(player.final_hash))
+    end
+    return players
+end
+
+-- Models application deployment, returning the contract context the referee works against. Its
+-- constant, expression-independent parts are fixed here before any dispute, as they would be on
+-- chain at deploy time. It loads the calculator template once to read what the contract
+-- publishes, the input and output NVRAM descriptors and a proof of the pristine input drive,
+-- then discards it. The agreed initial hash is not here, since it depends on the expression.
+local function deploy()
+    local template = cartesi.machine(TEMPLATE)
+    local initial_config = template:get_initial_config()
+    -- Both NVRAM drives must be present in the template's configuration; a missing one aborts here.
+    local input = assert(util.find_drive(initial_config, "nvram", "input"))
+    local output = assert(util.find_drive(initial_config, "nvram", "output"))
+    -- Proof of the input drive as the template holds it, addressed by the drive's start and log2 size.
+    local input_proof = template:get_proof(input.start, input.log2_size)
+    return { input = input, output = output, input_proof = input_proof }
+end
+
+-- Waits for the result, the value that hashes into the winner's committed final state. It takes the
+-- first posted proof that verifies, since the loser's output cannot match, and keeps asking until
+-- one arrives. The honest player holds its reply back so the loser's invalid result is rejected first.
+-- docs:begin wait_for_result
+local function wait_for_result(dapp_contract, players, final_hash)
+    phase("output")
+    -- Keep requesting outputs until one verifies against final_hash; every attempt is narrated.
+    local accepted
+    repeat
+        local output = wait_for_output(players)
+        accepted = verify_output(dapp_contract, output, final_hash)
+        local report = accepted and "Result posted:\n%sAccepted!" or "Result posted:\n%sRejected!"
+        eventf(report, output.target_value)
+    until accepted
+end
+-- docs:end wait_for_result
+
+-- Runs the whole game in three steps. It collects both players' committed final hashes, settles any
+-- dispute over them to name the honest winner, then posts the result that verifies against the
+-- winner's hash. Equal commitments mean no dispute, so either player's hash is the true one.
+-- docs:begin run_referee
+local function run_referee(referee, dapp_contract)
+    local players = wait_for_commitments()
+    local first, second = players[1], players[2]
+    -- Equal commitments leave nothing to dispute, so player 1 stands in as the winner.
+    local agreed = first.final_hash == second.final_hash
+    local winner = agreed and first or adjudicate_dispute(players, referee.initial_hash)
+
+    -- Either way, the result must verify against the winner's committed final hash.
+    wait_for_result(dapp_contract, players, winner.final_hash)
+end
+-- docs:end run_referee
+
+-- Builds a referee for a public expression against a deployed dapp contract. The agreed initial
+-- hash depends on the expression, so it is computed here and kept on the referee. Rolling the
+-- hash of the input NVRAM holding the expression up the pristine input proof gives the root hash
+-- of the template instantiated with it, with hash_tree.get_root_hash padding the rest to match the honest
+-- player's NVRAM. Honest play starts from exactly this state, never a player-declared one.
+local function new_referee(dapp_contract, expr)
+    -- Root hash of the input drive's range once it holds the newline-terminated expression.
+    local input_hash = hash_tree.get_root_hash(expr .. "\n", dapp_contract.input.log2_size)
+    -- Rolling that hash up the pristine input proof yields the machine's agreed initial root hash.
+    local initial_hash = hash_tree.roll_hash_up_tree(dapp_contract.input_proof, input_hash)
+    return { initial_hash = initial_hash, run = run_referee }
+end
+
+--------------------------------------------------------------------------------
+-- Role dispatch
+--------------------------------------------------------------------------------
+
+local role = assert(arg[1], "missing role (referee, honest, or dishonest)") -- arg[1] picks the party to play
+
+if role == "referee" then -- arg[2] (listen address) is read by wait_for_commitments; arg[3] is used here
+    local dapp_contract = deploy()
+    local referee = new_referee(dapp_contract, assert(arg[3], "missing public expression"))
+    referee:run(dapp_contract) -- method call: run_referee receives the referee as its first argument
+elseif role == "honest" then
+    -- The one-second delay is the demo-ordering device from prove_output: it holds the honest
+    -- result back so the dishonest player's invalid result is rejected first in the referee's log.
+    local player = new_player(new_remote_machine(assert(arg[3], "missing expression")), 1)
+    player:run()
+elseif role == "dishonest" then -- arg[3..6]: expression, cheat mcycle, cheat uarch cycle, cheat expression
+    local player = new_player(
+        dishonest.new_composite_machine(
+            new_remote_machine(assert(arg[3], "missing expression")),
+            assert(tonumber(arg[4]), "missing cheat mcycle"),
+            assert(tonumber(arg[5]), "missing cheat uarch cycle"),
+            new_remote_machine(assert(arg[6], "missing cheat expression"))
+        )
+    )
+    player:run()
+else
+    error("unknown role: " .. role)
+end
diff --git a/doc/recipes/verify-output-proof.lua b/doc/recipes/verify-output-proof.lua
new file mode 100644
index 000000000..d953e17a1
--- /dev/null
+++ b/doc/recipes/verify-output-proof.lua
@@ -0,0 +1,30 @@
+local cartesi = require("cartesi")
+local util = require("cartesi.util")
+local hash_tree = require("cartesi.hash-tree")
+
+-- Read a proof saved as a text-only Lua chunk; the empty environment denies the chunk any globals
+local function read_proof(name)
+    return assert(loadfile(name, "t", {}))()
+end
+
+-- Arguments, in order: machine state hash file, the two proof files, and the output file to verify
+local machine_hash = util.read_file(assert(arg[1], "missing machine state hash"))
+local output_hashes_root_hash_proof = read_proof(assert(arg[2], "missing output hashes root hash proof"))
+local output_proof = read_proof(assert(arg[3], "missing output proof"))
+local output = util.read_file(assert(arg[4], "missing output"))
+
+-- The output hashes root hash proof must be rooted at the agreed machine state hash
+assert(output_hashes_root_hash_proof.root_hash == machine_hash, "proof not rooted at the machine state hash")
+hash_tree.verify_slice(output_hashes_root_hash_proof) -- NOTE(review): result unused; presumably raises on failure
+
+-- The first proof's target must be the keccak256 of the output proof's root (the tx-buffer word's value)
+assert(
+    cartesi.keccak256(output_proof.root_hash) == output_hashes_root_hash_proof.target_hash,
+    "tx buffer holds another value"
+)
+hash_tree.verify_slice(output_proof) -- NOTE(review): result unused; presumably raises on failure
+
+-- The output proof's target must be the hash of the output itself
+assert(cartesi.keccak256(output) == output_proof.target_hash, "output does not match the proof")
+
+print(string.format("output %d verified against the machine state hash", output_proof.target_address))
diff --git a/doc/recipes/verify-uarch-step.lua b/doc/recipes/verify-uarch-step.lua
new file mode 100644
index 000000000..7d212ae39
--- /dev/null
+++ b/doc/recipes/verify-uarch-step.lua
@@ -0,0 +1,28 @@
+-- Load the Cartesi modules
+local cartesi = require("cartesi")
+
+-- Instantiate machine from the configuration module named by the first argument
+local config = require(assert(arg[1], "missing machine config module"))
+local machine = cartesi.machine(config)
+
+-- Advance to the requested mcycle and uarch_cycle
+local mcycle = assert(tonumber(arg[2]), "missing mcycle")
+local ucycle = assert(tonumber(arg[3]), "missing uarch_cycle")
+machine:run(mcycle)
+machine:run_uarch(ucycle)
+
+-- Obtain state hash before step, access log, and state hash after step
+local hash_before = machine:get_root_hash()
+local log = machine:log_step_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS)
+local hash_after = machine:get_root_hash()
+
+-- Optionally run the chunk given in arg[4], which sees only string, cartesi, and log, to tamper with the log
+if arg[4] then
+    local env = { string = string, cartesi = cartesi, log = log }
+    local f = assert(load(arg[4], arg[4], "t", env))
+    f()
+end
+
+-- Verify the uarch step access log (NOTE(review): presumably raises when the log is rejected)
+machine:verify_step_uarch(hash_before, log, hash_after)
+io.stderr:write("State transition accepted!\n")
diff --git a/doc/replace.lua b/doc/replace.lua
new file mode 100644
index 000000000..2ce966d55
--- /dev/null
+++ b/doc/replace.lua
@@ -0,0 +1,1194 @@
+-- Pandoc Lua filter for the inline-script docs build system.
+--
+-- PURPOSE
+--
+-- Turns README.md.template into README.md. Code blocks annotated with key=
+-- are written to cache/<key>/, executed by `make`, and their outputs spliced
+-- back into the rendered document. The driving Makefile lives in
+-- recipes/Makefile; it calls this filter twice with `make` in between.
+--
+-- LIFECYCLE (three phases; the filter itself runs in phases 1 and 3)
+--
+--   1. Dry-run: pass -M write-user-dependencies=<target> to pandoc and use
+--      pandoc's normal -o <path> for the output. The filter walks the
+--      template, writes each block body to cache/<key>/body.<ext>
+--      (idempotently), writes cache/<key>/spec when contents-form vars=
+--      entries exist, builds a self-contained makefile fragment with <target>
+--      on the LHS of the prereqs line, and replaces the document body with a
+--      single RawBlock containing that text. With -t plain, pandoc emits the
+--      RawBlock verbatim, so <path> ends up holding the makefile fragment.
+--      Cached outputs are not read in this pass and replace=K/both and similar
+--      return "".
+--
+--   2. The Makefile includes the .d file. <target>'s prereq line lists every
+--      cache file the document needs. Each rule says "to produce
+--      cache/<key>/both, depend on the runner, cache/<key>/body.<ext>, and
+--      each dep's output file, then exec the runner". Running `make` executes
+--      every needed body in topological order, populating the cache.
+--
+--   3. Real run: same filter, same template, -M write-user-dependencies absent.
+--      Every cache/<key>/<sub> the document needs now exists on disk. The
+--      filter reads those files and splices their contents in place of the
+--      annotated blocks. Pandoc's output is the final rendered document.
+--
+-- TWO-PASS WALK (each invocation)
+--
+--   Pass 1 (collect): pandoc.walk_block records every key= block body, parsed
+--   deps, and parsed vars into `pending` without resolving anything.
+--   Detects duplicate keys.
+--
+--   Pass 2 (render): walk in document order. When a replace=K/... is seen,
+--   ensure_defined(K) lazily defines K -- recursing depth-first through K's
+--   depends= and vars= chains -- before reading its output. This is what
+--   makes replace= and depends= order-independent within the document.
+--
+-- REQUIRED ENVIRONMENT
+--
+--   REPLACE_CACHE_DIR  Absolute path to the cache directory (errors if unset).
+--   RECIPES_DIR        Base directory that include=<path> is resolved against (errors if unset).
+--   REPLACE_DIR        Derived from PANDOC_SCRIPT_FILE; runners and vars.lua live alongside this filter file.
+--
+-- CACHE LAYOUT
+--
+--   cache/<key>/body.<ext>     Source written at dry-run time (idempotent).
+--   cache/<key>/spec           VAR=path lines for contents-form vars= entries
+--                              (written at dry-run time, idempotent).
+--   cache/<key>/outputs        Declared artifact filenames, one per line
+--                              (written at dry-run time, idempotent; empty
+--                              when outputs= is absent). Read by the runner
+--                              after the body exits to verify each artifact
+--                              exists.
+--   cache/<key>/body.run.<ext> Body with contents-form $VAR expanded (runner-produced).
+--   cache/<key>/stdout         Captured standard output (runner-produced).
+--   cache/<key>/stderr         Captured standard error (runner-produced).
+--   cache/<key>/both           stdout and stderr interleaved (runner-produced;
+--                              primary make target -- the others are siblings).
+--                              For include= keys this file is written at filter
+--                              time and holds the published body; no other
+--                              cache/<key>/ files are produced.
+--   cache/<key>/<artifact>     Any declared outputs= artifact. The runner cd's
+--                              into cache/<key>/ before running the body, so
+--                              artifacts written to cwd land there automatically.
+--
+-- CACHE INVALIDATION
+--
+--   Make drives invalidation via mtimes. body.<ext> and spec are written
+--   idempotently (skipped when content is unchanged) to avoid spurious rebuilds.
+--   The runner (run-bash.sh / run-lua.sh) and vars.lua are listed as make
+--   prereqs for every rule that uses them, so editing those files triggers
+--   a rebuild of all affected blocks.
+--
+-- LANGUAGES
+--
+--   LANG_INFO maps a Pandoc class name to {ext, runner-path}:
+--     .bash  ->  body.sh,  run-bash.sh   (default)
+--     .lua   ->  body.lua, run-lua.sh
+--   pick_lang uses runner= when set, else the first Pandoc class, else
+--   DEFAULT_LANG (bash). The class always controls syntax highlighting.
+--   To add a language: add an entry to LANG_INFO and place run-<lang>.sh
+--   alongside this filter.
+--
+-- ATTRIBUTES (CodeBlock / Code / Span)
+--
+--   key=K               Defines block K. Body is its source.
+--                       K must match [a-zA-Z_][a-zA-Z0-9_]*; duplicates error.
+--                       $REPLACE_KEY is replaced with K before writing body.
+--
+--   depends=A,B,...     Only on key= blocks. Each token is either bare K or
+--                       K/SUB. Bare K adds a make prereq on cache/<K>/both;
+--                       K/SUB pins cache/<K>/SUB (stream or declared artifact).
+--                       Reserved for ordering-only cases. Use vars= when $K
+--                       is in the body. For chains of blocks that share a
+--                       runtime resource (e.g., a TCP port), prefer
+--                       sequential= so the chain is built automatically in
+--                       document order.
+--
+--   sequential=TAG      Only on key= blocks. TAG is a single identifier.
+--                       Every block with the same TAG is auto-chained in
+--                       document order: each non-first member gains an
+--                       implicit depends=<previous-member>, a make prereq on
+--                       cache/<previous-member>/both. Composes additively
+--                       with explicit depends= and vars=. Use for ordering-
+--                       only resources (a bound port, a fixed file path)
+--                       where listing the chain by hand would be brittle.
+--                       Not allowed on include= keys (those have no
+--                       executable body to serialize).
+--
+--   vars=VAR->REF,...  Path injection and contents substitution. REF forms:
+--                         VAR->K          contents-form: $VAR -> bytes of cache/<K>/both
+--                                         (same default as replace=K)
+--                         VAR->K/SUB      contents-form: $VAR -> bytes of cache/<K>/SUB
+--                         VAR->K/SUB/path path-form: $VAR -> REPLACE_CACHE_DIR/K/SUB
+--                         K               path-form: $K -> K/path (shortcut)
+--                       Path-form entries are substituted in body.<ext> at dry-run
+--                       time. Contents-form entries are written to cache/<K>/spec
+--                       and expanded by vars.lua at runner time (producing
+--                       body.run.<ext>). Both forms also add make prereqs.
+--
+--   runner=<name>       Optional, key= blocks only. Overrides the runner (and body
+--                       file extension) that replace.lua would otherwise infer from
+--                       the block's Pandoc class. <name> must match a key in
+--                       LANG_INFO; if it does not, the block is display-only (no
+--                       body file written, no runner invocation). Consuming the
+--                       captured output (replace=K/stdout etc.) of a display-only
+--                       block is an error. Has no effect on include= keys (which
+--                       never execute and produce only cache/<K>/both).
+--                       Not allowed on inline Code or Span.
+--
+--   outputs=a,b,c       Only on key= blocks. Declares artifact filenames the body
+--                       writes to its cwd (= cache/<key>/). Reserved names
+--                       (stdout, stderr, both, source, null) are rejected.
+--                       The runner verifies each artifact exists after the body
+--                       exits and fails if it does not.
+--
+--   include=<path>      Only on key= blocks. The block's body becomes the contents
+--                       of $RECIPES_DIR/<path> (null setup regions removed,
+--                       docs:begin/docs:end markers kept). Block body must be empty
+--                       when include= is set. outputs=, depends=, and vars= are not
+--                       allowed on include= keys. The filter writes the body, with
+--                       markers stripped, to cache/<K>/both at filter time; the make
+--                       rule touches that file when the included file changes so
+--                       consumers invalidate. The body is also the key's source, so
+--                       replace=K/source/<region> selects a named region of the
+--                       included file. No stdout, stderr, or body.<ext> are produced
+--                       (an include= block does not execute -- it just publishes its
+--                       body). replace= defaults to "both" on include= blocks; only
+--                       replace=both and replace=null are accepted.
+--                       Region-selecting form: include=<file>/<region>. The
+--                       whole value is tried as a file path first. If that
+--                       fails, the value is split on the last '/' into <file>
+--                       and <region>: only the lines within the named
+--                       docs:begin/docs:end region of <file> become the body
+--                       (markers stripped).
+--
+--   enabled=yes|no      Optional. Controls whether this block is active.
+--                       When absent, the value of the -M default-replace=
+--                       pandoc variable applies (true/yes/1 -> enabled;
+--                       false/no/0 or missing -> disabled). When disabled,
+--                       the block's entire body is rendered verbatim as a
+--                       plain code block (no execution, no region trimming,
+--                       no docs:begin/end processing). Cross-block
+--                       replace= sites that reference a disabled key
+--                       render as empty. ensure_defined errors if an
+--                       enabled block depends on a disabled one.
+--
+--   code=yes|no         Optional, inline Span only. Default yes wraps the
+--                       substituted value in an inline Code element (matches
+--                       backtick styling). Set code=no to emit plain text,
+--                       useful inside HTML markup like <sup>...</sup> where
+--                       monospace styling looks wrong.
+--
+--   replace=<value>     Required on every annotated block except include= blocks,
+--                       where it defaults to "both". See taxonomy below.
+--
+-- REPLACE= TAXONOMY
+--
+--   null                Drop the block from output. Body still runs when key=
+--                       is present. Idiom: hidden setup block.
+--
+--   source              Render this key's body. Requires key=.
+--   source/<region>     Render only the named docs:begin/end region. Requires key=.
+--                       "null" is reserved and cannot be used as a region name.
+--
+--   stdout|stderr|both  Render this key's captured stream. Requires key=.
+--
+--   <artifact>          Render this key's declared artifact. Requires key=;
+--                       artifact name must appear in outputs=.
+--
+--   K                   Cross-block: render K's "both" output (default thing).
+--   K/path              Cross-block: absolute path of cache/<K>/ directory.
+--   K/<thing>           Cross-block: render K's thing.
+--                       thing is stdout|stderr|both|source[/<region>]|<artifact>.
+--                       When K was defined with include=, only the bare K, K/both,
+--                       K/path, K/both/path, K/source, and K/source/<region> forms
+--                       are accepted (K/source selects from the included file's
+--                       regions; the other streams and artifacts do not exist).
+--   K/<thing>/path      Cross-block: absolute path of cache/<K>/<thing>.
+--                       Forces lazy definition of K via ensure_defined.
+--
+--   Inline Code:        Only cross-block forms (K or K/<thing>) are allowed.
+--   Inline Span:        Only cross-block forms. The Span's inline content is
+--                       appended as a literal suffix to the rendered output
+--                       (idiom: insert punctuation after a substituted value).
+--                       Wrapped in inline Code by default; pass code=no to
+--                       emit plain text instead.
+--
+-- DOCS:BEGIN/END SEMANTICS
+--
+--   Marker syntax:  <comment-leader> docs:begin <name>
+--                   <comment-leader> docs:end   <name>
+--   Comment leaders: #, --, // (with optional surrounding whitespace).
+--   <name> may be empty (unnamed default region).
+--
+--   Special name "null":
+--     docs:begin null / docs:end null lines and everything between them are
+--     stripped from the rendered source but still execute. Use this to hide
+--     imports or setup boilerplate. Multiple non-overlapping null regions are
+--     allowed; nesting is not permitted. The marker lines themselves are
+--     also stripped from the executed body, so a null region may be inserted
+--     in the middle of a bash backslash-continued multi-line command without
+--     bash gluing the leading "#" onto the previous "\<NL>" continuation.
+--
+--   Named region:
+--     replace=source/<name> renders only the content between the matching
+--     docs:begin <name> / docs:end <name> pair. Markers are stripped.
+--
+-- OUTPUT POST-PROCESSING
+--
+--   read_output strips ANSI escape sequences and the trailing newline before
+--   substitution. Bodies relying on exact byte-level capture should not use
+--   replace= to consume their output.
+--
+-- GLOBALS PSEUDO-KEY
+--
+--   Pandoc() writes every pandoc metadata variable whose name starts with a
+--   letter or underscore (hyphens are also allowed after the first character)
+--   to REPLACE_CACHE_DIR/globals/<name>. Pass the value on the pandoc command
+--   line with -M NAME=VALUE. Use vars=VAR->globals/NAME (contents-form) to
+--   inject the value into a block body or a replace=source display, or
+--   replace=globals/NAME to render the value as the block's content
+--   (replace=globals/NAME/path yields the absolute path of the file).
+--
+-- DEFAULT-REPLACE METADATA
+--
+--   Pass -M default-replace=true (or false) on the pandoc command line.
+--   replace.lua reads doc.meta["default-replace"] in Pandoc() and uses it
+--   as the default for blocks without an explicit enabled= attribute.
+--   true/yes/1 -> enabled; false/no/0 (or absent) -> disabled.
+--
+-- MAKE-FRAGMENT SHAPE (dry-run)
+--
+--   Grouped target: cache/<key>/both, cache/<key>/stdout, cache/<key>/stderr,
+--     and each declared artifact, emitted as one GNU Make grouped target
+--     (`&:`, requires GNU Make >= 4.3; template.d is only -included inside the
+--     docs container). One runner invocation co-produces all of them, so the
+--     grouped form lets make invalidate every consumer whenever a prereq
+--     changes. The older `sibling: primary` empty-recipe form could leave an
+--     indirect consumer (e.g. one reading another block's reordered stdout)
+--     stale on a timestamp tie across the two-pass rebuild.
+--     prereqs: runner, body.<ext>, outputs, [vars.lua, spec] (iff contents-form
+--              vars= exists), depends= prereqs, vars= file prereqs
+--
+--   include= keys take a simpler shape: a single rule whose only prereq is
+--   the included file, with recipe `touch cache/<key>/both`. The content is
+--   written by the filter; the touch only propagates mtime so consumers
+--   invalidate when the included file changes.
+--
+-- PANDOC RENDERING QUIRK
+--
+--   force_fenced upgrades classless CodeBlocks to class "text" so Pandoc
+--   emits a fenced (not 4-space-indented) GFM code block.
+--
+-- INVARIANTS / GOTCHAS
+--
+--   - Duplicate key= definitions error during pass 1.
+--   - Dependency cycles error during ensure_defined.
+--   - outputs= artifacts not written by the body cause the runner to fail.
+--   - vars= path-form rewrites happen at dry-run time (before execution).
+--     Contents-form $VAR stays literal in body.<ext>; vars.lua expands it
+--     at runner time. Editing vars.lua or the spec file triggers a rebuild.
+--   - $VAR substitution requires a non-word boundary after VAR so $foo does
+--     not consume the start of $foobar; longest var wins for disambiguation.
+--   - include= keys publish cache/<K>/both (the marker-stripped body) and keep the
+--     marker-bearing body as the key's source. The filter writes both at filter time
+--     via write_idempotent; the make rule has the included file as its sole prereq
+--     and touches the primary, forcing consumers to invalidate when the source
+--     changes (pass 3 rewrites the body during the README.md build). Cross-block
+--     references to an include= key may use K, K/both, K/path, K/both/path, K/source,
+--     or K/source/<region>; a source ref depends on cache/<K>/both so it invalidates
+--     with the included file. /stdout, /stderr, and artifact subs are rejected.
+
+local deps_target -- NOTE(review): presumably set in Pandoc() from -M write-user-dependencies=; confirm
+local default_enabled = true -- overridden in Pandoc() from -M default-replace=
+local REPLACE_CACHE_DIR = os.getenv("REPLACE_CACHE_DIR") or error("REPLACE_CACHE_DIR not set")
+local RECIPES_DIR = os.getenv("RECIPES_DIR") or error("RECIPES_DIR not set") -- base directory for include= paths
+
+-- Locate the directory containing this filter file; runners live alongside it ("." if the path has no slash).
+local REPLACE_DIR = PANDOC_SCRIPT_FILE:match("(.+)/[^/]+$") or "."
+local vars = require("vars")
+
+-- Maps a language name to its body-file extension and the runner script that executes it.
+local LANG_INFO = {
+    bash = { ext = "sh", runner = REPLACE_DIR .. "/run-bash.sh" },
+    lua = { ext = "lua", runner = REPLACE_DIR .. "/run-lua.sh" },
+}
+local DEFAULT_LANG = "bash"
+
+-- Names with a built-in meaning in replace=, which the header says outputs= must reject as artifact names.
+local RESERVED = { stdout = true, stderr = true, both = true, source = true, null = true }
+
+-- State accumulated as the document is walked.
+local pending = {} -- key -> { attr, body, classes, deps, vars }  (pass 1: raw collection)
+local defining = {} -- key -> true  (cycle detection during ensure_defined)
+local defined = {} -- key -> true  (set after define_script completes)
+local outputs_t = {} -- key -> { artifact_name -> true }
+local sources = {} -- key -> resolved body (for replace=source)
+local rules = {} -- list of make rule strings (dry-run only)
+local consumed = {} -- "<key>/<file>" -> true (referenced cache files)
+local no_runner = {} -- key -> lang string (for keys whose runner= is not in LANG_INFO)
+local sequential = {} -- tag -> last-seen key with this sequential= tag (built during collect)
+
+-- Forward declarations: assigned further below, but referenced by define_script before that point.
+local emit_rule, emit_include_rule
+
+local function assertf(cond, fmt, ...)
+    -- assert() with a string.format-style message: the text is only built when the check fails.
+    -- Unlike assert(), nothing is returned when the check passes.
+    local _ = cond or error(string.format(fmt, ...))
+end
+
+local function check_identifier(s, label) -- raises via assertf unless s is an identifier; label leads the message
+    assertf(s:find("^[%a_][%w_]*$"), "%s: '%s' is not an identifier (must match [a-zA-Z_][a-zA-Z0-9_]*)", label, s)
+end
+
+local function strip_ansi(s) -- removes every ANSI CSI sequence (ESC [ params final-byte) and every CR
+    return (s:gsub("\27%[[0-?]*[ -/]*[@-~]", ""):gsub("\r", ""))
+end
+
+local function is_enabled(attr)
+    local flag = attr.enabled
+    if flag ~= nil then
+        return flag == "yes" or flag == "true" or flag == "1" -- any other explicit value disables
+    end
+    return default_enabled -- no enabled= attribute: fall back to the document-wide default
+end
+
+local function parse_list(s)
+    -- Tokens are maximal runs of characters that are neither commas nor whitespace.
+    local tokens = {}
+    -- A missing attribute (nil) is treated as empty text, which yields no tokens at all.
+    for token in (s or ""):gmatch("[^,%s]+") do
+        table.insert(tokens, token)
+    end
+    -- The result is always a newly created table, even for empty input.
+    return tokens
+end
+
+local function parse_depends(s)
+    local deps = {}
+    for _, token in ipairs(parse_list(s)) do
+        -- "K/SUB" splits at the first slash; a bare "K" has no slash, so sub stays nil.
+        local base, sub = token:match("^([%w_][%w_%-%.]*)/(.+)$")
+        base = base or token
+        -- The split pattern admits more than an identifier does, so the key is validated separately.
+        check_identifier(base, "depends=" .. token)
+        table.insert(deps, { base = base, sub = sub })
+    end
+    return deps
+end
+
+local function parse_sequential(s) -- returns the validated tag, or nil when sequential= is absent
+    if s then
+        local tag = s:match("^%s*(.-)%s*$") -- trim surrounding whitespace
+        assertf(#tag > 0, "sequential=%s: empty tag", s)
+        assertf(not tag:find("[,%s]"), "sequential=%s: only one tag per block (no commas or whitespace)", s)
+        check_identifier(tag, "sequential=" .. tag)
+        return tag
+    end
+    return nil
+end
+
+local function parse_vars(s) -- vars= value -> list of { var, base, sub, kind, raw }; nil yields {}
+    local r = {}
+    if not s then
+        return r
+    end
+    for tok in s:gmatch("[^,%s]+") do
+        local var, ref = tok:match("^([%w_]+)%->(.+)$") -- explicit VAR->REF form
+        local shortcut = var == nil -- bare token: it names both the variable and the key
+        if shortcut then
+            check_identifier(tok, "vars=" .. tok)
+            var, ref = tok, tok
+        end
+        assertf(ref:match("^[%w._%-/]+$"), "vars=%s->%s: invalid characters in ref", var, ref)
+        local base, sub, kind
+        -- Try K/SUB/path: kind "path" (define_script turns it into a path below the cache dir).
+        base, sub = ref:match("^([%w_][%w_%-%.]*)/(.+)/path$")
+        if base then
+            assertf(not sub:match("^source/"), "vars=%s->%s: K/source/REGION/path is not allowed", var, ref)
+            kind = "path"
+        else
+            -- Try K/SUB: kind "contents" (the variable stands for what SUB holds).
+            base, sub = ref:match("^([%w_][%w_%-%.]*)/(.+)$")
+            if base then
+                kind = "contents"
+            elseif shortcut then
+                base, sub = ref, nil -- vars=K alone: kind "dirpath", no sub
+                kind = "dirpath"
+            else
+                -- vars=VAR->K defaults to vars=VAR->K/both (contents-form).
+                base, sub = ref, "both"
+                kind = "contents"
+            end
+        end
+        check_identifier(base, "vars=" .. var .. "->" .. ref)
+        r[#r + 1] = { var = var, base = base, sub = sub, kind = kind, raw = ref }
+    end
+    return r
+end
+
+-- Substitute $VAR in body with abs_path for each { var =, abs_path = } pair.
+-- Longest var wins; a match also requires end of body or a character outside
+-- [%w._%-] after the var, so $foo does not consume the start of $foobar (or $foo.x).
+local function substitute(body, var_pairs)
+    local sorted_pairs = {} -- sorted copy; the caller's list keeps its order
+    for _, p in ipairs(var_pairs) do
+        sorted_pairs[#sorted_pairs + 1] = p
+    end
+    table.sort(sorted_pairs, function(a, b)
+        return #a.var > #b.var
+    end)
+    local out, i, n = {}, 1, #body
+    while i <= n do
+        local c = body:sub(i, i)
+        if c == "$" then
+            local matched = false
+            for _, p in ipairs(sorted_pairs) do
+                local len = #p.var
+                if body:sub(i + 1, i + len) == p.var then
+                    local nextc = body:sub(i + 1 + len, i + 1 + len) -- "" when the var ends the body
+                    if nextc == "" or not nextc:match("[%w._%-]") then
+                        out[#out + 1] = p.abs_path
+                        i = i + 1 + len
+                        matched = true
+                        break
+                    end
+                end
+            end
+            if not matched then
+                out[#out + 1] = "$" -- not one of ours: keep the "$" and move on
+                i = i + 1
+            end
+        else
+            out[#out + 1] = c
+            i = i + 1
+        end
+    end
+    return table.concat(out)
+end
+
+-- Process docs:begin null / docs:end null pairs. When keep_content is false
+-- (the rendered-source path), the markers and the lines between them are
+-- removed. When keep_content is true (the executed-body path), only the
+-- marker lines themselves are removed; the lines between them survive. The
+-- latter mode lets a null region sit in the middle of a bash backslash-
+-- continued command without bash collapsing "\<NL>" + "# docs:begin null"
+-- into a comment that severs the logical line.
+-- Multiple non-overlapping null regions are allowed. Nesting is not.
+local function process_null_regions(body, keep_content, label)
+    if not body:find("[#%-/]+%s*docs:begin%s+null") then
+        return body -- fast path: no begin marker anywhere, body is returned untouched
+    end
+    local scan = body:sub(-1) == "\n" and body or (body .. "\n") -- terminate the last line so gmatch sees it
+    local out = {}
+    local in_null = false
+    for line in scan:gmatch("([^\n]*)\n") do
+        if line:match("^%s*[#%-/]+%s*docs:begin%s+null%s*$") then
+            assertf(not in_null, "%s: nested docs:begin null", label)
+            in_null = true
+        elseif line:match("^%s*[#%-/]+%s*docs:end%s+null%s*$") then
+            assertf(in_null, "%s: docs:end null without matching docs:begin null", label)
+            in_null = false
+        elseif keep_content or not in_null then
+            out[#out + 1] = line
+        end
+    end
+    assertf(not in_null, "%s: unterminated docs:begin null", label)
+    local result = table.concat(out, "\n")
+    if body:sub(-1) == "\n" then
+        result = result .. "\n" -- restore the trailing newline the input had
+    end
+    return result
+end
+
+local function strip_null_regions(body, label) -- remove null markers together with the lines they enclose
+    return process_null_regions(body, false, label)
+end
+
+local function strip_null_markers(body, label) -- remove only the null marker lines; enclosed lines are kept
+    return process_null_regions(body, true, label)
+end
+
+-- Strip every marker line (comment leader followed by docs:<word>) from body.
+-- Used for include= keys so infrastructure markers do not appear in output.
+local function strip_all_markers(body)
+    local scan = body:sub(-1) == "\n" and body or (body .. "\n") -- terminate the last line so gmatch sees it
+    local out = {}
+    for line in scan:gmatch("([^\n]*)\n") do
+        if not line:match("^%s*[#%-/]+%s*docs:%a+") then
+            out[#out + 1] = line
+        end
+    end
+    local result = table.concat(out, "\n")
+    if body:sub(-1) == "\n" then
+        result = result .. "\n" -- restore the trailing newline the input had
+    end
+    return result
+end
+
+-- Extract a "docs:begin NAME" / "docs:end NAME" region from body.
+-- Comment leaders #, --, // (and variants) are stripped before the keyword.
+-- NAME may be empty (the unnamed default region). Markers are stripped.
+local function extract_region(body, name, label)
+    local target = name or ""
+    local markers = {}
+    -- Ensure the last line is terminated so a final docs:end at EOF is matched.
+    local scan = body:sub(-1) == "\n" and body or (body .. "\n")
+    scan:gsub("()[%s]*[#%-/]+[%s]*docs:(%a+)[ \t]*(.-)[ \t]*()\n", function(s, kw, rname, e)
+        markers[#markers + 1] = { s = s, kw = kw, name = rname, e = e } -- s: match start, e: the marker's newline
+    end)
+    local regions = {}
+    for _, m in ipairs(markers) do
+        regions[m.name] = regions[m.name] or {}
+        local r = regions[m.name]
+        if m.kw == "begin" then
+            assertf(not r.first, "%s: duplicate docs:begin '%s'", label, m.name)
+            r.first = m.e + 1 -- first byte after the begin marker's newline
+        elseif m.kw == "end" then
+            assertf(not r.last, "%s: duplicate docs:end '%s'", label, m.name)
+            r.last = m.s - 1 -- last byte before the end marker (and any whitespace leading up to it)
+        end
+    end
+    local r = regions[target]
+    assertf(r, "%s: no region '%s' found", label, target)
+    assertf(r.first, "%s: region '%s' has no docs:begin", label, target)
+    assertf(r.last, "%s: region '%s' has no docs:end", label, target)
+    -- NOTE(review): an empty region (end marker right after begin) gives last == first - 1 and fails here too.
+    assertf(r.first <= r.last, "%s: region '%s' docs:end before docs:begin", label, target)
+    return (scan:sub(r.first, r.last):gsub("\n$", ""))
+end
+
+local function read_file(path, label) -- whole contents of path; errors with label when it cannot be opened
+    local f = io.open(path, "r")
+    assertf(f, "%s: cannot open %s", label, path)
+    local txt = f:read("a")
+    f:close()
+    return txt
+end
+
+local function read_output(key, sub, label) -- contents of cache/<key>/<sub>, recorded as consumed
+    assertf(
+        not no_runner[key],
+        "%s: runner=%s is not in LANG_INFO; cannot consume cache/%s/%s",
+        label,
+        no_runner[key],
+        key,
+        sub
+    )
+    consumed[key .. "/" .. sub] = true
+    if deps_target then
+        return "" -- dependency-generation run: record the reference only, do not read the file
+    end
+    local path = REPLACE_CACHE_DIR .. "/" .. key .. "/" .. sub
+    return (strip_ansi(read_file(path, label)):gsub("\n$", "")) -- ANSI/CR stripped, one final newline dropped
+end
+
+local function pick_lang(attr, classes) -- precedence: runner= attribute, then first class, then DEFAULT_LANG
+    return attr.runner or classes and classes[1] or DEFAULT_LANG
+end
+
+local function write_idempotent(path, content) -- write content to path, leaving an identical file untouched
+    local f = io.open(path, "r")
+    if f then
+        local existing = f:read("a")
+        f:close()
+        if existing == content then
+            return -- already up to date: nothing is rewritten, so the file's mtime is preserved
+        end
+    end
+    os.execute("mkdir -p '" .. (path:match("(.*)/") or "."):gsub("'", "'\\''") .. "'") -- "." if no dir; "'" escaped
+    f = assert(io.open(path, "w"))
+    assert(f:write(content)) -- surface a failed write (e.g. disk full) instead of caching a truncated file
+    assert(f:close()) -- buffered data is flushed here, so close can fail as well
+end
+
+local function define_script(key, attr, body, classes, deps, vars_list, include_abs) -- returns the resolved body (nil for include= keys)
+    assertf(not defined[key], "key=%s: duplicate definition", key)
+    local out_list = parse_list(attr.outputs)
+    for _, n in ipairs(out_list) do
+        assertf(not RESERVED[n], "key=%s: outputs= cannot contain reserved name '%s'", key, n)
+    end
+    if include_abs then
+        assertf(#out_list == 0, "key=%s: outputs= not allowed on include= keys", key)
+        assertf(#deps == 0, "key=%s: depends= not allowed on include= keys", key)
+        assertf(#vars_list == 0, "key=%s: vars= not allowed on include= keys", key)
+        defined[key] = true
+        outputs_t[key] = {}
+        -- The body keeps its region markers so replace=K/source/<region> can pick them out, but the
+        -- published both stream is rendered verbatim, so strip the markers there.
+        sources[key] = body
+        write_idempotent(REPLACE_CACHE_DIR .. "/" .. key .. "/both", strip_all_markers(body))
+        if deps_target then
+            emit_include_rule(key, include_abs)
+        end
+        return -- include= keys have no runner, body file, spec or outputs list
+    end
+    for _, d in ipairs(deps) do
+        assertf(defined[d.base], "key=%s: depends=%s: '%s' not yet defined", key, d.base, d.base)
+    end
+    -- Build path_pairs from path-form vars entries (kind == "dirpath" or "path").
+    -- Contents-form entries stay literal in the body; the runner will expand them at run time.
+    local path_pairs = {}
+    for _, p in ipairs(vars_list) do
+        if p.kind == "dirpath" then
+            assertf(defined[p.base], "key=%s: vars=%s->%s: '%s' not yet defined", key, p.var, p.raw, p.base)
+            path_pairs[#path_pairs + 1] = { var = p.var, abs_path = REPLACE_CACHE_DIR .. "/" .. p.base }
+        elseif p.kind == "path" then
+            assertf(defined[p.base], "key=%s: vars=%s->%s: '%s' not yet defined", key, p.var, p.raw, p.base)
+            path_pairs[#path_pairs + 1] = { var = p.var, abs_path = REPLACE_CACHE_DIR .. "/" .. p.base .. "/" .. p.sub }
+        end
+    end
+    local resolved = substitute(body, path_pairs)
+    resolved = resolved:gsub("%$REPLACE_KEY%f[^%w_]", function() -- "_" is a name character: $REPLACE_KEY_X stays as-is
+        return key -- returned from a function so the key is inserted literally
+    end)
+    local lang = pick_lang(attr, classes)
+    local info = LANG_INFO[lang]
+    defined[key] = true
+    outputs_t[key] = {}
+    for _, n in ipairs(out_list) do
+        outputs_t[key][n] = true
+    end
+    sources[key] = resolved
+    if not info then
+        no_runner[key] = lang -- no runner for this language: keep the source only, write no cache files
+        return resolved
+    end
+    local exec_body = strip_null_markers(resolved, "key=" .. key)
+    write_idempotent(REPLACE_CACHE_DIR .. "/" .. key .. "/body." .. info.ext, exec_body)
+    -- Write spec file for contents-form vars entries so the runner can expand them.
+    local contents_entries = {}
+    for _, p in ipairs(vars_list) do
+        if p.kind == "contents" then
+            contents_entries[#contents_entries + 1] = p
+        end
+    end
+    if #contents_entries > 0 then
+        table.sort(contents_entries, function(a, b)
+            return a.var < b.var
+        end)
+        local lines = {}
+        for _, p in ipairs(contents_entries) do
+            lines[#lines + 1] = p.var .. "=" .. REPLACE_CACHE_DIR .. "/" .. p.base .. "/" .. p.sub -- one VAR=path per line
+        end
+        write_idempotent(REPLACE_CACHE_DIR .. "/" .. key .. "/spec", table.concat(lines, "\n") .. "\n")
+    end
+    -- Always write the outputs file (consumed by the runner to verify declared
+    -- artifacts exist after the body completes). Written even when empty so a
+    -- removed outputs= attribute clears any stale list.
+    local outputs_text = ""
+    if #out_list > 0 then
+        local sorted_out = {}
+        for _, n in ipairs(out_list) do
+            sorted_out[#sorted_out + 1] = n
+        end
+        table.sort(sorted_out)
+        outputs_text = table.concat(sorted_out, "\n") .. "\n"
+    end
+    write_idempotent(REPLACE_CACHE_DIR .. "/" .. key .. "/outputs", outputs_text)
+    if deps_target then
+        emit_rule(key, info, out_list, deps, vars_list, #contents_entries > 0)
+    end
+    return resolved
+end
+
+-- Emit a make rule. One runner invocation produces both, stdout, stderr, and
+-- any declared artifacts together, so they are emitted as a single GNU Make
+-- grouped target (`&:`, requires GNU Make >= 4.3, satisfied by the docs image;
+-- template.d is only -included inside the container). The grouped form tells
+-- make the recipe co-produces every output, so editing an intermediate block
+-- reliably invalidates its consumers. The previous `sibling: primary` form left
+-- consumers stale when timestamps tied across the two-pass rebuild.
+function emit_rule(key, info, out_list, deps, vars_list, has_contents)
+    local runner_path = info.runner
+    local body_path = "$(REPLACE_CACHE_DIR)/" .. key .. "/body." .. info.ext
+    local prereqs = { runner_path, body_path, "$(REPLACE_CACHE_DIR)/" .. key .. "/outputs" }
+    if has_contents then
+        prereqs[#prereqs + 1] = REPLACE_DIR .. "/vars.lua" -- contents-form vars: also depend on the expander
+        prereqs[#prereqs + 1] = "$(REPLACE_CACHE_DIR)/" .. key .. "/spec"
+    end
+    -- Collect prereqs from depends= and vars=, deduplicating by path.
+    local seen_prereqs = {}
+    local function add_prereq(path)
+        if not seen_prereqs[path] then
+            seen_prereqs[path] = true
+            prereqs[#prereqs + 1] = path
+        end
+    end
+    for _, d in ipairs(deps) do
+        add_prereq("$(REPLACE_CACHE_DIR)/" .. d.base .. "/" .. (d.sub or "both")) -- bare KEY means KEY/both
+    end
+    for _, p in ipairs(vars_list) do
+        if p.kind == "dirpath" then
+            add_prereq("$(REPLACE_CACHE_DIR)/" .. p.base .. "/both")
+        elseif p.kind == "path" or p.kind == "contents" then
+            add_prereq("$(REPLACE_CACHE_DIR)/" .. p.base .. "/" .. p.sub)
+        end
+    end
+    local targets = {
+        "$(REPLACE_CACHE_DIR)/" .. key .. "/both",
+        "$(REPLACE_CACHE_DIR)/" .. key .. "/stdout",
+        "$(REPLACE_CACHE_DIR)/" .. key .. "/stderr",
+    }
+    for _, n in ipairs(out_list) do
+        targets[#targets + 1] = "$(REPLACE_CACHE_DIR)/" .. key .. "/" .. n
+    end
+    local cmd = string.format( -- on failure: name the key, dump its captured both stream to stderr, exit 1
+        "\t@REPLACE_KEY=%s bash %s || (echo '==> FAILED: key=%s' >&2; cat $(REPLACE_CACHE_DIR)/%s/both >&2; exit 1)",
+        key,
+        runner_path,
+        key,
+        key
+    )
+    rules[#rules + 1] = table.concat(targets, " ") .. " &: " .. table.concat(prereqs, " ") .. "\n" .. cmd
+end
+
+-- Emit a make rule for an include= key. The included file is the rule's only
+-- prereq. The filter writes cache/<key>/both with the post-processed body at
+-- filter time (idempotently). The recipe touches the primary so an edit to
+-- the included file invalidates the primary target and cascades to
+-- consumers; pass 3 rewrites cache/<key>/both with the new content while
+-- rebuilding README.md.
+function emit_include_rule(key, include_abs)
+    local primary = "$(REPLACE_CACHE_DIR)/" .. key .. "/both"
+    rules[#rules + 1] = primary .. ": " .. include_abs .. "\n\t@touch " .. primary -- "<both>: <file>" + touch recipe
+end
+
+-- Lazily define key and all its transitive depends= in DFS order.
+local function ensure_defined(key)
+    if defined[key] then
+        return
+    end
+    assertf(not defining[key], "key=%s: dependency cycle", key) -- key is already on the current DFS path
+    local p = pending[key]
+    assertf(p, "key=%s: not defined", key)
+    defining[key] = true
+    for _, d in ipairs(p.deps) do
+        ensure_defined(d.base)
+    end
+    for _, s in ipairs(p.vars) do
+        if s.kind ~= "contents" then -- path-form vars must exist first; define_script asserts they are defined
+            ensure_defined(s.base)
+        end
+    end
+    define_script(key, p.attr, p.body, p.classes, p.deps, p.vars, p.include_abs)
+    defining[key] = nil
+end
+
+-- Pandoc gfm renders a classless CodeBlock as 4-space-indented; force fence.
+local function force_fenced(el)
+    local has_attrs = #el.attr.attributes > 0
+    if #el.classes == 0 and not has_attrs and el.identifier == "" then
+        el.classes = { "text" } -- only a completely bare block gets the placeholder class
+    end
+end
+
+-- Parse the replace= value into (kind, a, b).
+-- kind == "null"     -> drop the block
+-- kind == "source"   -> a = region string or nil
+-- kind == "stream"   -> a = "stdout"|"stderr"|"both" (own key only)
+-- kind == "artifact" -> a = artifact name (own key only; must be in outputs=)
+-- kind == "cross"    -> a = K, b = thing (stream/artifact/source[/region])
+local function parse_replace_target(val, self_key)
+    if val == "null" then
+        return "null"
+    end
+    if val == "source" then
+        return "source", nil
+    end
+    if val == "stdout" or val == "stderr" or val == "both" then
+        return "stream", val
+    end
+    if val:sub(1, 7) == "source/" then
+        local region = val:sub(8)
+        assertf(region ~= "null", "replace=source/null: 'null' is a reserved marker name, not a region")
+        return "source", region
+    end
+    if self_key and outputs_t[self_key] and outputs_t[self_key][val] then
+        return "artifact", val -- a declared output of the block's own key takes priority over a key name
+    end
+    local k, rest = val:match("^([%w._%-]+)/(.+)$")
+    if k then
+        return "cross", k, rest
+    end
+    if val:match("^[%w._%-]+$") then
+        return "cross", val, "both" -- bare K is shorthand for K/both
+    end
+    error("replace=" .. val .. ": unrecognized value")
+end
+
+local render_source -- forward declaration (render_source <-> cross_read mutual ref)
+
+local function cross_read(K, thing, vars_spec, label) -- resolve replace=K/<thing> to the text to render
+    ensure_defined(K)
+    assertf(defined[K], "%s: key '%s' not defined", label, K)
+    -- include= keys publish cache/<K>/both (the marker-stripped body) and expose their source for
+    -- region selection. Reject any thing other than these with a clear error.
+    if pending[K] and pending[K].include_abs then
+        local is_source = thing == "source" or thing:sub(1, 7) == "source/"
+        local v = thing == "both" or thing == "path" or thing == "both/path" or is_source
+        assertf(
+            v,
+            "%s: include= key '%s' only supports K, K/both, K/path, K/both/path, K/source[/<region>] (got K/%s)",
+            label,
+            K,
+            thing
+        )
+        -- source renders from the in-memory body, so depend on cache/<K>/both (which tracks the
+        -- included file) to invalidate consumers when it changes.
+        if is_source then
+            consumed[K .. "/both"] = true
+        end
+    end
+    if thing == "path" then
+        return REPLACE_CACHE_DIR .. "/" .. K -- K/path: the key's cache directory itself
+    end
+    local sub_path = thing:match("^(.+)/path$")
+    if sub_path then
+        assertf(
+            not no_runner[K],
+            "%s: runner=%s is not in LANG_INFO; cannot consume cache/%s/%s",
+            label,
+            no_runner[K],
+            K,
+            sub_path
+        )
+        return REPLACE_CACHE_DIR .. "/" .. K .. "/" .. sub_path -- K/<file>/path: path of one cache file
+    end
+    -- globals/NAME renders the value of `-M NAME=...`.
+    if K == "globals" then
+        check_identifier(thing:gsub("%-", "_"), label .. ": globals/" .. thing) -- "-" is accepted in NAME
+        return read_output(K, thing, label)
+    end
+    if thing == "source" then
+        assertf(sources[K], "%s: replace=source: source not stored for '%s'", label, K)
+        return render_source(sources[K], nil, vars_spec, label)
+    end
+    if thing:sub(1, 7) == "source/" then
+        local region = thing:sub(8)
+        assertf(sources[K], "%s: replace=source: source not stored for '%s'", label, K)
+        return render_source(sources[K], region, vars_spec, label)
+    end
+    if thing == "stdout" or thing == "stderr" or thing == "both" then
+        return read_output(K, thing, label)
+    end
+    assertf(outputs_t[K] and outputs_t[K][thing], "%s: key '%s' has no artifact '%s'", label, K, thing)
+    return read_output(K, thing, label) -- anything else must be an artifact declared in K's outputs=
+end
+
+render_source = function(text, region, vars_spec, label) -- source text as shown to readers
+    text = strip_null_regions(text, label)
+    if region or text:find("[#%-/]+%s*docs:begin") then
+        text = extract_region(text, region, label) -- region == nil selects the unnamed region
+    end
+    local pairs_list = {}
+    for _, p in ipairs(vars_spec or {}) do
+        if p.kind == "contents" then -- only contents-form vars are expanded here
+            ensure_defined(p.base)
+            local val
+            if p.sub == "source" then
+                val = render_source(sources[p.base], nil, nil, label .. ": vars=" .. p.var)
+            elseif p.sub:sub(1, 7) == "source/" then
+                local r = p.sub:sub(8)
+                val = render_source(sources[p.base], r, nil, label .. ": vars=" .. p.var)
+            else
+                val = read_output(p.base, p.sub, label .. ": vars=" .. p.var .. "->" .. p.raw)
+            end
+            pairs_list[#pairs_list + 1] = { var = p.var, value = val }
+        end
+    end
+    return vars.apply(text, pairs_list)
+end
+
+-- The filter uses two passes. Pass 1 (collect) uses pandoc.walk_block to
+-- record every key= block body without resolving anything. Pass 2
+-- (walk_blocks) renders in document order, lazily defining each key on
+-- demand via DFS through depends=. Both replace= and depends= are therefore
+-- order-independent.
+
+local function process_codeblock(el) -- pass 2 handler: returns el, a rewritten el, or {} to drop the block
+    local attr = el.attr.attributes
+    local key, replace = attr.key, attr.replace
+    local has_include = attr.include ~= nil
+    if not key and not replace then
+        return el -- neither key= nor replace=: the block is returned untouched
+    end
+
+    local enabled = is_enabled(attr)
+    if enabled then
+        if key then
+            ensure_defined(key)
+        end
+        -- include= blocks produce the included body as their output; default
+        -- to replace=both, and forbid forms that don't apply (no stdout/stderr/
+        -- artifact/source for include= keys).
+        if has_include and not replace then
+            replace = "both"
+        end
+        assertf(replace, "%s: replace= attribute required", key and "key=" .. key or "CodeBlock")
+        assertf(
+            not has_include or replace == "both" or replace == "null",
+            "key=%s: include= block only supports replace=both or replace=null (got replace=%s)",
+            key,
+            replace
+        )
+    end
+
+    local vars_spec = parse_vars(attr.vars) -- read before the attribute is cleared below
+    attr.key = nil
+    attr.ref = nil
+    attr.depends = nil
+    attr.sequential = nil
+    attr.outputs = nil
+    attr.replace = nil
+    attr.block = nil
+    attr.vars = nil
+    attr.enabled = nil
+    attr.include = nil
+    attr.runner = nil
+
+    if not enabled then
+        force_fenced(el) -- disabled: keep the original body, minus the attributes cleared above
+        return el
+    end
+
+    if replace == "null" then
+        return {}
+    end
+
+    local label = key and "key=" .. key or "replace=" .. replace
+    local kind, a, b = parse_replace_target(replace, key)
+
+    if kind == "null" then
+        return {}
+    end
+    if kind == "source" then
+        assertf(key, "%s: replace=source requires key=", label)
+        el.text = render_source(sources[key], a, vars_spec, label)
+        force_fenced(el)
+        return el
+    end
+    if kind == "stream" or kind == "artifact" then
+        assertf(key, "%s: replace=%s requires key=", label, a)
+        el.text = read_output(key, a, label)
+        force_fenced(el)
+        return el
+    end
+    if kind == "cross" then
+        el.text = cross_read(a, b, vars_spec, label)
+        force_fenced(el)
+        return el
+    end
+    error(label .. ": unknown replace= value")
+end
+
+local function process_code(el) -- inline Code handler: only cross-block replace= is supported
+    local attr = el.attr.attributes
+    local replace = attr.replace
+    if not replace then
+        return el
+    end
+    assertf(not attr.include, "inline Code: include= not supported (use key= CodeBlock)")
+    assertf(not attr.runner, "inline Code: runner= not supported (use key= CodeBlock)")
+    local enabled = is_enabled(attr) -- read before enabled= is cleared below
+    attr.replace = nil
+    attr.enabled = nil
+    attr.include = nil
+    if not enabled then
+        return el -- disabled: original text stays, filter attributes are already removed
+    end
+    local label = "inline Code replace=" .. replace
+    local kind, a, b = parse_replace_target(replace, nil)
+    if kind == "cross" then
+        el.text = cross_read(a, b, nil, label)
+        return el
+    end
+    error(label .. ": only cross-block replace= (K or K/<thing>) supported on inline Code")
+end
+
+local function process_span(el) -- inline Span handler: returns a Code (default) or Str holding the value
+    local attr = el.attr.attributes
+    local replace = attr.replace
+    if not replace then
+        return el
+    end
+    assertf(not attr.include, "inline Span: include= not supported (use key= CodeBlock)")
+    assertf(not attr.runner, "inline Span: runner= not supported (use key= CodeBlock)")
+    local enabled = is_enabled(attr)
+    local code = attr.code -- code=no/false/0 selects plain text instead of inline code
+    attr.replace = nil
+    attr.enabled = nil
+    attr.include = nil
+    attr.code = nil
+    if not enabled then
+        return el
+    end
+    local label = "inline Span replace=" .. replace
+    local kind, a, b = parse_replace_target(replace, nil)
+    if kind == "cross" then
+        local suffix = pandoc.utils.stringify(el.content) -- the span's own text is appended to the value
+        local text = cross_read(a, b, nil, label) .. suffix
+        if code == "no" or code == "false" or code == "0" then
+            return pandoc.Str(text)
+        end
+        return pandoc.Code(text)
+    end
+    error(label .. ": only cross-block replace= (K or K/<thing>) supported on inline Span")
+end
+
+local INLINE_FILTER = { Code = process_code, Span = process_span } -- passed to pandoc.walk_block by walk_block
+
+-- Walk a list of blocks in document order, processing CodeBlocks via
+-- process_codeblock and recursing into block containers (Div, BlockQuote,
+-- list items) so nested key=/replace= blocks are handled. Inline filters run
+-- on every visited block.
+local walk_blocks -- forward declaration: walk_block and walk_blocks call each other
+
+local function walk_block(b)
+    if b.tag == "CodeBlock" then
+        return process_codeblock(b)
+    end
+    if b.content and (b.tag == "Div" or b.tag == "BlockQuote") then
+        b.content = walk_blocks(b.content)
+        return pandoc.walk_block(b, INLINE_FILTER)
+    end
+    if (b.tag == "BulletList" or b.tag == "OrderedList") and b.content then
+        for i, item in ipairs(b.content) do
+            b.content[i] = walk_blocks(item) -- each list item is walked as its own block list
+        end
+        return pandoc.walk_block(b, INLINE_FILTER)
+    end
+    return pandoc.walk_block(b, INLINE_FILTER) -- any other block: only the inline filter is applied
+end
+
+walk_blocks = function(blocks) -- rebuild a block list from whatever walk_block returns for each entry
+    local result = {}
+    for _, block in ipairs(blocks) do
+        local produced = walk_block(block)
+        if type(produced) == "table" and not produced.tag then
+            for _, item in ipairs(produced) do -- tag-less table: a list to splice in (empty drops the block)
+                table.insert(result, item)
+            end
+        elseif produced then
+            table.insert(result, produced)
+        end
+    end
+    return result
+end
+
+local function sorted(t) -- keys of t, copied into a fresh array and put in table.sort order
+    local keys = {}
+    for name in pairs(t) do
+        table.insert(keys, name)
+    end
+    table.sort(keys)
+    return keys
+end
+
+local function build_makefile_text() -- text of the generated dependency makefile
+    -- First line: "<deps_target>:" followed by every consumed cache file, in sorted order.
+    local pieces = { deps_target .. ":" }
+    for _, ref in ipairs(sorted(consumed)) do
+        pieces[#pieces + 1] = " $(REPLACE_CACHE_DIR)/" .. ref
+    end
+    pieces[#pieces + 1] = "\n"
+    -- Then each collected rule, newline-terminated, in the order it was emitted.
+    for _, rule in ipairs(rules) do
+        pieces[#pieces + 1] = rule .. "\n"
+    end
+    return table.concat(pieces)
+end
+
+local function collect_codeblock(b) -- pass 1 handler: record an enabled key= block in pending[key]
+    local key = b.attr.attributes.key
+    if not key then
+        return
+    end
+    if not is_enabled(b.attr.attributes) then
+        return -- disabled blocks are never registered
+    end
+    check_identifier(key, "key=" .. key)
+    assertf(key ~= "globals", "key=globals: 'globals' is a reserved pseudo-key")
+    assertf(not pending[key], "key=%s: duplicate definition", key)
+    local include = b.attr.attributes.include
+    local body = b.text
+    local include_abs
+    if include then
+        assertf(body == "", "key=%s: include=%s: block body must be empty when include= is set", key, include)
+        -- Disambiguate FILE/<region> from a plain path: try the whole value as a
+        -- file path first. If that fails and the value contains a '/', split on
+        -- the last '/' and treat the RHS as a region name within the LHS file.
+        local file_path, region
+        local f = io.open(RECIPES_DIR .. "/" .. include, "r")
+        if f then
+            f:close()
+            file_path = include
+        else
+            local lhs, rhs = include:match("^(.+)/([^/]+)$")
+            assertf(lhs, "key=%s: include=%s: file not found", key, include)
+            file_path = lhs
+            region = rhs
+        end
+        include_abs = RECIPES_DIR .. "/" .. file_path
+        local file_content = read_file(include_abs, "key=" .. key .. " include=" .. include)
+        if region then
+            -- A single region becomes the body (markers already stripped by extract_region).
+            body = extract_region(file_content, region, "key=" .. key .. " include=" .. include)
+        else
+            -- Whole file: keep the infrastructure markers so replace=K/source/<region> can pick
+            -- named regions. They are stripped when cache/<K>/both is written (see define_script).
+            body = strip_null_regions(file_content, "key=" .. key .. " include=" .. include)
+        end
+    end
+    local seq = parse_sequential(b.attr.attributes.sequential)
+    assertf(not (include and seq), "key=%s: sequential= not allowed on include= keys", key)
+    local deps = parse_depends(b.attr.attributes.depends)
+    if seq then
+        local prev = sequential[seq]
+        if prev then
+            deps[#deps + 1] = { base = prev, sub = nil } -- implicit dependency on the previous key with this tag
+        end
+        sequential[seq] = key
+    end
+    pending[key] = {
+        attr = b.attr.attributes,
+        body = body,
+        classes = b.classes,
+        deps = deps,
+        vars = parse_vars(b.attr.attributes.vars),
+        include_abs = include_abs,
+    }
+end
+
+local function collect(blocks) -- pass 1: run collect_codeblock over every CodeBlock found in blocks
+    pandoc.walk_block(pandoc.Div(blocks), { CodeBlock = collect_codeblock }) -- the Div is only a wrapper to walk
+end
+
+function Pandoc(doc) -- filter entry point: read options, publish globals, then run both passes
+    local m = doc.meta["write-user-dependencies"]
+    deps_target = m and pandoc.utils.stringify(m) or nil
+    local dr = doc.meta["default-replace"]
+    if dr ~= nil then
+        local v = pandoc.utils.stringify(dr)
+        default_enabled = v == "true" or v == "yes" or v == "1"
+    end
+    local globals_dir = REPLACE_CACHE_DIR .. "/globals"
+    os.execute("mkdir -p '" .. globals_dir:gsub("'", "'\\''") .. "'") -- "'" escaped for the quoted shell word
+    for k, v in pairs(doc.meta) do
+        if k:match("^[%a_][%w_%-]*$") then
+            -- Reuse write_idempotent so an unchanged value leaves its file (and mtime) alone: consumed
+            -- cache/globals/<name> files are listed as prerequisites by build_makefile_text, and
+            -- rewriting them on every run needlessly marks their consumers as out of date.
+            local value = pandoc.utils.stringify(v)
+            write_idempotent(globals_dir .. "/" .. k, value)
+        end
+    end
+    defined["globals"] = true -- pseudo-key: always defined, no outputs, empty source
+    outputs_t["globals"] = {}
+    sources["globals"] = ""
+    collect(doc.blocks)
+    doc.blocks = walk_blocks(doc.blocks)
+    if deps_target then
+        doc.blocks = { pandoc.RawBlock("plain", build_makefile_text()) } -- dependency run: emit only the makefile text
+    end
+    return doc
+end
+
+return { { Pandoc = Pandoc } } -- a single filter whose only handler is the whole-document Pandoc function
diff --git a/doc/run-bash.sh b/doc/run-bash.sh
new file mode 100755
index 000000000..c658a63d3
--- /dev/null
+++ b/doc/run-bash.sh
@@ -0,0 +1,30 @@
+#!/bin/bash
+set -euo pipefail
+: "${REPLACE_KEY:?}" "${REPLACE_CACHE_DIR:?}"  # abort unless both are set and non-empty
+REPLACE_DIR="$(dirname "$(realpath "$0")")"  # directory containing this script
+cd "$REPLACE_CACHE_DIR/$REPLACE_KEY"  # every relative path below lives in this key's cache directory
+echo "$REPLACE_KEY"  # emitted before the redirect below, so it is not captured
+: > both  # truncate the combined capture; both tee processes append to it
+exec > >(tee stdout >> both) 2> >(tee stderr >> both)
+# Stamp the stream markers with an end-of-run mtime after tee has flushed, so the ordering edge a
+# downstream block hangs off (cache/<key>/both) always advances and stays newer than this block's
+# artifacts, even when the captured stream is empty. Without it an empty marker keeps its start-of-run
+# mtime and an incremental parallel build can order a consumer ahead of the artifacts it globs.
+trap 'exec >&- 2>&-; wait; touch both stdout stderr 2>/dev/null || true' EXIT
+if [ -f spec ]; then  # spec present: let vars.lua derive body.run.sh from body.sh first
+    lua5.4 "$REPLACE_DIR/vars.lua" body.sh body.run.sh
+    body=body.run.sh
+else
+    body=body.sh
+fi
+status=0
+bash -eo pipefail "$body" || status=$?  # "|| ..." records the exit code instead of tripping set -e
+if [ "$status" -ne 0 ]; then exit "$status"; fi
+while IFS= read -r artifact; do  # one declared output name per line
+    [ -z "$artifact" ] && continue
+    if [ ! -e "$artifact" ]; then
+        echo "missing declared output: $artifact" >&2
+        status=1  # keep scanning so every missing output is reported
+    fi
+done < outputs
+exit "$status"
diff --git a/doc/run-lua.sh b/doc/run-lua.sh
new file mode 100755
index 000000000..f6646d983
--- /dev/null
+++ b/doc/run-lua.sh
@@ -0,0 +1,43 @@
+#!/bin/bash
+# Run one Lua documentation block inside its cache directory.
+#
+# Required environment:
+#   REPLACE_CACHE_DIR  cache root; the block lives in $REPLACE_CACHE_DIR/$REPLACE_KEY
+#   REPLACE_KEY        name of this block's directory under the cache root
+#
+# Inside that directory the script runs body.lua (first expanded by vars.lua into
+# body.run.lua when a spec file is present), captures its output into the files
+# stdout, stderr and both, and then checks every path listed in outputs. It exits
+# with the body's status, or 1 when the body succeeded but a listed path is missing.
+set -euo pipefail
+: "${REPLACE_KEY:?}" "${REPLACE_CACHE_DIR:?}"
+REPLACE_DIR="$(dirname "$(realpath "$0")")"
+cd "$REPLACE_CACHE_DIR/$REPLACE_KEY"
+# Announce the block on the caller's stdout before the streams are redirected.
+echo "$REPLACE_KEY"
+: > both
+exec > >(tee stdout >> both) 2> >(tee stderr >> both)
+# Stamp the stream markers with an end-of-run mtime after tee has flushed, so the ordering edge a
+# downstream block hangs off (cache/<key>/both) always advances and stays newer than this block's
+# artifacts, even when the captured stream is empty. Without it an empty marker keeps its start-of-run
+# mtime and an incremental parallel build can order a consumer ahead of the artifacts it globs.
+trap 'exec >&- 2>&-; wait; touch both stdout stderr 2>/dev/null || true' EXIT
+if [ -f spec ]; then
+    lua5.4 "$REPLACE_DIR/vars.lua" body.lua body.run.lua
+    body=body.run.lua
+else
+    body=body.lua
+fi
+status=0
+lua5.4 "$body" || status=$?
+if [ "$status" -ne 0 ]; then exit "$status"; fi
+# Verify the declared outputs. The "|| [ -n ... ]" clause keeps a final line that
+# lacks a trailing newline, which read reports as end-of-file.
+while IFS= read -r artifact || [ -n "$artifact" ]; do
+    [ -z "$artifact" ] && continue
+    if [ ! -e "$artifact" ]; then
+        echo "missing declared output: $artifact" >&2
+        status=1
+    fi
+done < outputs
+exit "$status"
diff --git a/doc/vars.lua b/doc/vars.lua
new file mode 100644
index 000000000..489c23ec4
--- /dev/null
+++ b/doc/vars.lua
@@ -0,0 +1,66 @@
+-- Variable substitution for documentation code blocks.
+--
+-- Usable as a module or as a CLI: lua5.4 vars.lua <body-in> <body-out>
+-- The CLI reads ./spec (one <var>=<path> per line), loads each value from <path>,
+-- replaces every $<var> in <body-in>, and writes the result to <body-out>.
+local M = {}
+
+--- Replace each $name in body with the value registered for name.
+-- Substitution is a single pass over whole identifiers ([%w_]+): $foo is never
+-- expanded inside $foo_bar, names ending in "_" are matched, and text inserted
+-- for one variable is not rescanned for other variables. Identifiers without a
+-- registered value are left untouched.
+-- @param body string to expand
+-- @param pairs array of { var = <name>, value = <string> }; the first entry wins
+--        when a name is repeated
+-- @return the expanded string
+function M.apply(body, pairs)
+    local values = {}
+    for _, p in ipairs(pairs) do
+        if values[p.var] == nil then values[p.var] = p.value end
+    end
+    -- A table replacement inserts the value verbatim and keeps the original match
+    -- when the lookup yields nil; the parentheses drop gsub's match count.
+    return (body:gsub("%$([%w_]+)", values))
+end
+
+--- Read a captured value from path, cleaned up for substitution.
+-- Removes ANSI escape sequences of the form ESC [ <digits and ;> followed by m, G
+-- or K, removes carriage returns, and drops one trailing newline.
+-- @param path file to read
+-- @return the cleaned contents; raises an error if the file cannot be opened
+function M.read_value(path)
+    local f = assert(io.open(path, "r"), "vars: cannot open " .. path)
+    local s = f:read("a")
+    f:close()
+    s = s:gsub("\27%[[%d;]*[mGK]", ""):gsub("\r", "")
+    return (s:gsub("\n$", ""))
+end
+
+-- CLI entry point: expand body_in into body_out using the variables listed in ./spec.
+local function cli(body_in, body_out)
+    assert(body_out, "vars CLI: usage: vars.lua <body-in> <body-out>")
+    local pairs_list = {}
+    local sf = assert(io.open("spec", "r"), "vars CLI: ./spec not found")
+    for line in sf:lines() do
+        local var, path = line:match("^([%w_]+)=(.+)$")
+        assert(var, "vars CLI: bad spec line: " .. line)
+        pairs_list[#pairs_list + 1] = { var = var, value = M.read_value(path) }
+    end
+    sf:close()
+    local bf = assert(io.open(body_in, "r"))
+    local body = bf:read("a")
+    bf:close()
+    body = M.apply(body, pairs_list)
+    local of = assert(io.open(body_out, "w"))
+    of:write(body)
+    of:close()
+end
+
+-- Run the CLI only when the script being executed is vars.lua itself and at least
+-- one argument was given; otherwise just expose the module table.
+if arg and arg[0] and arg[0]:match("vars%.lua$") and arg[1] then
+    cli(arg[1], arg[2])
+end
+
+return M
diff --git a/risc0/Makefile b/risc0/Makefile
index 00ba67313..282264405 100644
--- a/risc0/Makefile
+++ b/risc0/Makefile
@@ -68,7 +68,7 @@ $(STEP_LOG):
 	$(CARTESI_MACHINE) \
 		--hash-tree=hash_function:sha256 \
 		--max-mcycle=0 \
-		--log-step=1,$@
+		--log-step=$@,count:1
 
 $(RECEIPT): $(STEP_LOG)
 	@echo "--- Proving step log ---"
diff --git a/risc0/cpp/Makefile b/risc0/cpp/Makefile
index 377a37aee..edac5f8c2 100644
--- a/risc0/cpp/Makefile
+++ b/risc0/cpp/Makefile
@@ -56,6 +56,7 @@ UBFLAGS := -fno-strict-aliasing -fno-strict-overflow -fno-delete-null-pointer-ch
 
 CFLAGS := -march=rv32im -mabi=ilp32 -Wl,--gc-sections $(OPTFLAGS) $(UBFLAGS) \
 	-DZKARCHITECTURE=1 \
+	-DNO_STD_VECTOR=1 \
 	$(DUMP_DEFS) \
 	-DAVOID_NATIVE_UINT128_T=1 \
 	-ffreestanding \
diff --git a/risc0/rust/cartesi-risc0/src/main.rs b/risc0/rust/cartesi-risc0/src/main.rs
index c13842309..1f26356a9 100644
--- a/risc0/rust/cartesi-risc0/src/main.rs
+++ b/risc0/rust/cartesi-risc0/src/main.rs
@@ -20,7 +20,7 @@ Command line interface for the Cartesi Machine RISC0 zkVM prover.
 Pipeline:
 
 1) Generate a step log from the Cartesi Machine.
-   cartesi-machine --max-mcycle=0 --log-step=1,/tmp/step.log
+   cartesi-machine --max-mcycle=0 --log-step=/tmp/step.log,count:1
 
 2) Prove the step log (produces a STARK receipt).
    cartesi-risc0-cli prove <hash_before> /tmp/step.log 1 <hash_after> /tmp/receipt.bin
diff --git a/src/address-range-constants.hpp b/src/address-range-constants.hpp
index 6c315532f..b412efb1f 100644
--- a/src/address-range-constants.hpp
+++ b/src/address-range-constants.hpp
@@ -55,8 +55,6 @@ enum AR_ranges : uint64_t {
     AR_CMIO_TX_BUFFER_START = EXPAND_UINT64_C(AR_CMIO_TX_BUFFER_START_DEF),         ///< Start of CMIO TX buffer range
     AR_CMIO_TX_BUFFER_LOG2_SIZE = EXPAND_UINT64_C(AR_CMIO_TX_BUFFER_LOG2_SIZE_DEF), ///< Log2 of CMIO TX buffer range
     AR_CMIO_TX_BUFFER_LENGTH = (UINT64_C(1) << AR_CMIO_TX_BUFFER_LOG2_SIZE_DEF),    ///< Length of CMIO TX buffer range
-    AR_DRIVE_START = EXPAND_UINT64_C(AR_DRIVE_START_DEF),   ///< Start address for flash drive ranges
-    AR_DRIVE_OFFSET = EXPAND_UINT64_C(AR_DRIVE_OFFSET_DEF), ///< Offset for extra flash drive ranges
 
     AR_FIRST_VIRTIO_START = EXPAND_UINT64_C(AR_FIRST_VIRTIO_START_DEF), ///< Start of first VIRTIO range
     AR_VIRTIO_LENGTH = EXPAND_UINT64_C(AR_VIRTIO_LENGTH_DEF),           ///< Length of each VIRTIO range
diff --git a/src/address-range-defines.h b/src/address-range-defines.h
index 03e4b5331..14fb40f20 100644
--- a/src/address-range-defines.h
+++ b/src/address-range-defines.h
@@ -46,8 +46,6 @@
 #define AR_CMIO_RX_BUFFER_LOG2_SIZE_DEF 21         ///< log<sub>2</sub> of CMIO RX buffer length in bytes
 #define AR_CMIO_TX_BUFFER_START_DEF 0x60800000     ///< CMIO TX buffer start address
 #define AR_CMIO_TX_BUFFER_LOG2_SIZE_DEF 21         ///< log<sub>2</sub> of CMIO TX buffer length in bytes
-#define AR_DRIVE_START_DEF 0x80000000000000        ///< Start PMA address for flash drives
-#define AR_DRIVE_OFFSET_DEF 0x10000000000000       ///< PMA offset for extra flash drives
 
 #define AR_RAM_START_DEF 0x80000000 ///< RAM start address
 
diff --git a/src/address-range-description.hpp b/src/address-range-description.hpp
index 7b50fc2e6..476033ac2 100644
--- a/src/address-range-description.hpp
+++ b/src/address-range-description.hpp
@@ -25,9 +25,17 @@ namespace cartesi {
 
 /// \brief Description of an address range used for introspection (i.e., get_address_ranges())
 struct address_range_description {
-    uint64_t start = 0;      ///< Start of memory range
-    uint64_t length = 0;     ///< Length of memory range
-    std::string description; ///< User-friendly description for memory range
+    uint64_t start = 0;               ///< Start of memory range
+    uint64_t length = 0;              ///< Length of memory range
+    std::string description;          ///< User-friendly description for memory range
+    bool is_memory = false;           ///< True if range is memory (false if device)
+    bool is_device = false;           ///< True if range is a device
+    bool is_readable = false;         ///< True if range is readable by the machine
+    bool is_writeable = false;        ///< True if range is writeable by the machine
+    bool is_executable = false;       ///< True if range is executable by the machine
+    bool is_read_idempotent = false;  ///< True if reads from range are idempotent
+    bool is_write_idempotent = false; ///< True if writes to range are idempotent
+    uint64_t driver_id = 0;           ///< Driver identifier for range
 };
 
 /// \brief List of address range descriptions used for introspection (i.e., get_address_ranges())
diff --git a/src/cartesi-machine.lua b/src/cartesi-machine.lua
index 02935a20e..5ebc08ddc 100755
--- a/src/cartesi-machine.lua
+++ b/src/cartesi-machine.lua
@@ -16,12 +16,20 @@
 -- with this program (see COPYING). If not, see <https://www.gnu.org/licenses/>.
 --
 
-local cartesi = require("cartesi")
-local util = require("cartesi.util")
+local bash = require("cartesi.bash")
+-- forward compiled package declarations so handle_bash_completion can run clean
+local cartesi, util, hash_tree
 
 local function stderr_unsilenceable(fmt, ...) io.stderr:write(string.format(fmt, ...)) end
 local stderr = stderr_unsilenceable
 
+local function errorf(fmt, ...) error(string.format(fmt, ...), 2) end
+-- Like assert, but the message is string.format(fmt, ...) and the error is blamed on the caller.
+local function assertf(value, fmt, ...)
+    if not value then error(string.format(fmt, ...), 2) end
+    return value, fmt, ...
+end
+
 local function adjust_images_path(path)
     if not path then return "" end
     return string.gsub(path, "/*$", "") .. "/"
@@ -45,6 +53,10 @@ where options are:
   --version-json
     display cartesi machine semantic version and exit.
 
+  --bash-completion
+    print a bash completion script for this program to stdout and exit.
+    Install with: source <(cartesi-machine --bash-completion)
+
   --assert-version=<major>.<minor>[.<patch>]
     exit with failure in case the cartesi machine emulator version mismatches
 
@@ -131,8 +143,14 @@ where options are:
 
         start (optional)
         sets the starting physical memory offset for flash drive in bytes.
-        when omitted, drives start at 1 << 55 and are spaced by 1 << 52.
-        if any start offset is set, all of them must be set.
+        when omitted, flash drives' starts are computed automatically as follows:
+        assume the lengths of RAM and of all flash drives are powers of two (otherwise,
+        round them up to the next power of two for the purposes of this description).
+        each flash drive starts at the lowest address that is aligned to its length and
+        is past the end of the previous flash drive (or past the end of RAM, in the case
+        of the first flash drive).
+        flash drives with explicit starts are ignored by this computation, and overlaps
+        with them are rejected when the machine is created.
 
         length (optional)
         gives the length of the flash drive in bytes (must be multiple of 4Ki).
@@ -172,12 +190,12 @@ where options are:
         mke2fs (optional)
         whether the flash drive should be formatted as an ext2 filesystem in init.
         by default, the drive is formatted as ext2 filesystem if there is no backing file,
-        you can use "mke2fs:false" to disables ext2 formatting.
+        you can use "mke2fs:false" to disable ext2 formatting.
 
         mount (optional)
         whether the flash drive should be mounted automatically in init.
         by default, the drive is mounted if there is an image file backing it or is formatted (mke2fs option),
-        you can use "mount:false" to disables auto mounting,
+        you can use "mount:false" to disable auto mounting,
         you can also use "mount:<path>" to choose a custom mount point.
 
         user (optional)
@@ -220,8 +238,16 @@ where options are:
 
         start (optional)
         sets the starting physical memory offset for the NVRAM in bytes.
-        when omitted, NVRAMs are placed in the same 1 << 55 / 1 << 52-stride
-        pool as flash drives, using the next free slot after all flash drives.
+        when omitted, NVRAMs' starts are computed automatically as follows:
+        assume the lengths of RAM and of all NVRAMs and flash drives are powers of two
+        (otherwise, round them up to the next power of two for the purposes of this
+        description).
+        each NVRAM starts at the lowest address that is aligned to its length and is
+        past the end of the previous NVRAM (in the case of the first NVRAM, past the
+        end of the last automatically placed flash drive, or past the end of RAM if
+        there is none).
+        NVRAMs with explicit starts are ignored by this computation, and overlaps
+        with them are rejected when the machine is created.
 
         length (optional)
         gives the length of the NVRAM in bytes (must be multiple of 4Ki).
@@ -236,6 +262,8 @@ where options are:
 
         user (optional)
         changes the user ownership of the /dev/uioN device.
+        this option is useful to allow dapp's user access the NVRAM.
+        the default ownership is set to the root user.
 
   --replace-memory-range=<key>:<value>[,<key>:<value>[,...]...]
     replaces an existing memory range right after machine instantiation.
@@ -276,7 +304,7 @@ where options are:
     semantics are the same as for the --flash-drive option.
 
   --hash-tree=<key>:<value>[,<key>:<value>[,...]...]
-    configures the global hash tree the the machine
+    configures the global hash tree of the machine
 
     <key>:<value> is one of
         hash_function:<string>
@@ -290,7 +318,7 @@ where options are:
 
         sht_filename (optional)
         gives the name of the file containing the sparse hash-tree for the machine.
-		(this is the part of the hash tree from the root down to leaves that subindend
+		(this is the part of the hash tree from the root down to leaves that subintend
         entire memory ranges, such as flash-drives or the ram.)
         when omitted or set to the empty, the hash tree will be built from scratch.
 
@@ -305,7 +333,7 @@ where options are:
 
         shared (optional)
         target modifications to machine state modify the sparse hash tree file.
-        by default, the files is not modified and changes are lost.
+        by default, the file is not modified and changes are lost.
 
   --cmio-advance-state=<key>:<value>[,<key>:<value>[,...]...]
     advances the state of the machine through a number of inputs.
@@ -315,10 +343,19 @@ where options are:
         input_index_begin:<number>
         input_index_end:<number>
         output:<filename-pattern>
+        rejected_output:<filename-pattern>
+        output_proof:<filename-pattern>
+        last_output_proof:<filename>
+        format:<lua|json>
         report:<filename-pattern>
         output_hashes_root_hash:<filename-pattern>
+        output_hashes_root_hash_proof:<filename-pattern>
+        check_output_hashes_root_hash:<boolean>
         hashes
 
+        any file pattern can be set to the empty string to disable writing
+        that file.
+
         input (default: "input-%%i.bin")
         the pattern that derives the name of the file read for input %%i.
 
@@ -328,24 +365,61 @@ where options are:
         input_index_end (default: 0)
         one past index of last input to advance (one past last value of %%i).
 
-        output (default: "input-%%i-output-%%o.bin")
-        the pattern that derives the name of the file written for output %%o
-        of input %%i.
+        output (default: "output-%%o-input-%%i.bin")
+        the pattern that derives the name of the file written for each accepted
+        output. "%%o" is the global output index across all accepted inputs, and
+        "%%i" is the input it came from.
+
+        rejected_output (default: "rejected-output-%%o-input-%%i.bin")
+        the pattern that derives the name of the file written for each output of
+        a rejected input. "%%o" is the would-be global output index, and "%%i"
+        is the input.
+
+        output_proof (default: "output-%%o-input-%%i-proof.<format>")
+        the pattern that derives the name of the file written for the Merkle
+        proof of each accepted output against the output hashes root hash of the
+        last input of the run. serialized according to "format". when left at the
+        default, its extension tracks "format".
+
+        last_output_proof (no default)
+        a single filename, not a pattern, holding the previous run's last output
+        proof. it resumes the output hashes Merkle tree so this run continues at
+        the running global output index. omit it for the first (genesis) run.
+        read according to "format".
+
+        format (optional)
+        selects the format for output_proof and last_output_proof. when omitted,
+        it is inferred from the filename extension (.json/.lua), defaulting to Lua.
 
         report (default: "input-%%i-report-%%o.bin")
         the pattern that derives the name of the file written for report %%o
         of input %%i.
 
-        outputs_root_hash (default: "input-%%i-output-hashes-root-hash.bin")
-        the pattern that derives the name of the file written for outputs root
-        hash of input %%i.
+        output_hashes_root_hash (default: "input-%%i-output-hashes-root-hash.bin")
+        the pattern that derives the name of the file written for the output
+        hashes root hash after input %%i.
+
+        output_hashes_root_hash_proof (default: "input-%%i-output-hashes-root-hash-proof.<format>")
+        the pattern that derives the name of the file written for the Merkle
+        proof that the output hashes root hash occupied the tx buffer in
+        the machine state in which input %%i was accepted. it ties the output
+        hashes root hash (against which "output_proof" proves each output) back
+        into the machine state hash. serialized according to "format". when left
+        at the default, its extension tracks "format".
+
+        check_output_hashes_root_hash (default: true)
+        on each accepted input, check that the host's running output hashes root
+        hash equals the one the guest wrote to the tx buffer. it needs either the
+        genesis run or a last_output_proof seed to know the count of prior
+        outputs.
 
         hashes
         print out hashes before every input.
 
     the input index ranges in {input_index_begin, ..., input_index_end-1}.
-    for each input, "%%i" is replaced by the input index, and "%%o" by the output
-    or report index.
+    "%%i" is replaced by the input index. "%%o" is replaced by the global output
+    index for output, rejected_output, and output_proof, but by the per-input
+    report index for report.
 
   --cmio-inspect-state=<key>:<value>[,<key>:<value>[,...]...]
     inspect the state of the machine with a query.
@@ -431,8 +505,8 @@ where options are:
             host's file name to feed to the console input,
             this option automatically sets input source to "from_file".
 
-            tty_rows (default: 80)
-            tty_cols (default: 25)
+            tty_rows (default: 25)
+            tty_cols (default: 80)
             terminal size, only relevant when input source is different from stdin.
 
   --skip-version-check
@@ -464,22 +538,23 @@ where options are:
   --sync-init-date
     set the guest date to match the host date on initialization.
     this option is recommended when using TLS connections or when sharing
-    host directories systems.
-    this is is automatically implied with --network or --volume options.
+    host directories.
+    this is automatically implied with --network or --volume options.
 
     NON REPRODUCIBLE OPTION, DON'T USE THIS OPTION IN PRODUCTION
 
-  --virtio-9p=<tag>:<directory>
+  --virtio-9p=tag:<tag>,host_directory:<directory>
     add a VirtIO Plan9 filesystem device for sharing a host directory
     in the guest.
-    the filesystem will have a tag can be used to mount the host directory
+    the filesystem will have a tag that can be used to mount the host directory
     in the guest using the following command:
 
         busybox mount -t 9p <tag> <mountpoint>
 
     NON REPRODUCIBLE OPTION, DON'T USE THIS OPTION IN PRODUCTION
 
-  -v or --volume=<host_directory>:<guest_directory>
+  --volume=host_directory:<directory>,guest_directory:<directory>
+  -v <host-directory>:<guest-directory>
     like --virtio-9p, but also appends init commands to auto mount the
     host directory in the guest directory.
     mount tags are incrementally set to "vfs0", "vfs1", ...
@@ -492,7 +567,7 @@ where options are:
     add a VirtIO network device using host TUN/TAP interface.
     this allows the use of the host network from inside the machine.
     this is more efficient and has fewer limitations than the user-space
-    networking option (--virtio-net=user...).
+    networking option (--virtio-net=user).
 
     run the following commands in the host before starting the emulator:
 
@@ -524,7 +599,7 @@ where options are:
     this allows the use of the host network from inside the machine.
     you don't need root privilege or any configuration in the host to use this.
     although this mode is easier to use, it has the following limitations:
-      - there is an additional an emulation layer of the TCP/IP stack;
+      - there is an additional emulation layer of the TCP/IP stack;
       - not all IP protocols are emulated, but TCP and UDP should work;
       - host cannot connect to guest TCP ports.
     the implementation uses the libslirp TCP/IP emulator library.
@@ -553,16 +628,21 @@ where options are:
 
     NON REPRODUCIBLE OPTION, DON'T USE THIS OPTION IN PRODUCTION
 
-  -p=... or --port-forward=[hostip:]hostport[:guestip][:guestport][/protocol]
+  --port-forward=host_address:[hostip:]hostport,guest_address:[guestip:]guestport,protocol:<tcp|udp>
+  -p [hostip:]hostport:guestport[/protocol]
     redirect incoming TCP or UDP connections.
     bind the host hostip:hostport to the guest guestip:guestport.
-    protocol can be "tcp" or "udp".
+    each address is "[ip:]port", and protocol can be "tcp" or "udp".
     if host ip is absent, it's set to "127.0.0.1".
     if guest ip is absent, it's set to "10.0.2.15".
     if guest port is absent, it's set to the same as host port.
     if protocol is absent, it's set to "tcp".
+    the short -p form is docker-compatible. it requires both ports, has no
+    guest ip field, and takes an optional "/tcp" or "/udp" suffix protocol
+    defaulting to tcp.
+    use the long form to set a guest ip.
     you can pass this option multiple times.
-    this options requires --network or --virtio-net=user option.
+    this option requires --network or --virtio-net=user option.
 
     NON REPRODUCIBLE OPTION, DON'T USE THIS OPTION IN PRODUCTION
 
@@ -639,23 +719,55 @@ where options are:
             config: store "shared" backing stores from current state; others are copied as they were during load.
             all: (default) store current state for all backings stores.
 
-  --initial-hash
+  --initial-hash[=<filename>]
     print initial state hash before running machine.
+    if <filename> is given, write the raw state hash to it instead.
 
-  --final-hash
+  --final-hash[=<filename>]
     print final state hash when done.
+    if <filename> is given, write the raw state hash to it instead.
 
-  --periodic-hashes=<number-period>[,<number-start>]
-    prints root hash every <number-period> cycles.
-    if <number-start> is given, the periodic hashing will start at that mcycle.
+  --periodic-hashes=<period>[,start:<mcycle>]
+    prints root hash every <period> cycles.
+    if start: is given, the periodic hashing will start at that mcycle.
     this option implies --initial-hash and --final-hash.
     (default: none)
 
-  --dense-uarch-hashes=<number-length>[,<number-start>]
-    prints root hash every uarch cycle for <number-length> mcycles.
-    if <number-start> is given, the dense hashing will start at that mcycle.
+  --dense-uarch-hashes=<count>[,start:<mcycle>]
+    prints root hash every uarch cycle for <count> mcycles.
+    if start: is given, the dense hashing will start at that mcycle.
 
-  --log-step=<mcycle-count>,<filename>
+  --initial-proof=<key>:<value>[,<key>:<value>[,...]...]
+    print a Merkle proof for a target region of the initial machine state.
+
+    <key>:<value> is one of
+        address:<number>
+        log2_size:<number>
+        label:<label>
+        filename:<filename>
+
+        address and log2_size
+        give the starting offset and the log2 of the size of the target
+        region in bytes. log2_size must be at least 5 (a 32-byte word).
+
+        label (alternative to address and log2_size)
+        names a flash drive or nvram whose start and length supply the
+        target region's address and log2_size.
+
+        filename (optional)
+        redirects the proof to a file. when omitted, the proof is printed
+        to stdout.
+
+        format:<lua|json> (optional)
+        selects the output format. when omitted, it is inferred from the
+        filename extension (.json/.lua), defaulting to Lua.
+
+    the proof is printed as a Lua table unless format:json is given.
+
+  --final-proof=<key>:<value>[,<key>:<value>[,...]...]
+    like --initial-proof, but for the final machine state.
+
+  --log-step=<filename>,count:<mcycle-count>
     log and save a step of <mcycle-count> mcycles to <filename>.
 
   --log-step-uarch
@@ -667,29 +779,24 @@ where options are:
   --auto-reset-uarch
     reset uarch automatically after halt.
 
-  --store-config[=<filename>]
-    store initial machine config as Lua script to <filename>.
+  --store-config[=<filename>][,format:<lua|json>]
+    store initial machine config to <filename>.
     If <filename> is omitted, print the initial machine config to stdout.
+    the format is taken from format: if given, else the filename extension
+    (.json/.lua), defaulting to Lua.
 
-  --store-json-config[=<filename>]
-    store initial machine config as JSON to <filename>.
-    If <filename> is omitted, print the initial machine config to stdout.
-
-  --load-config=<filename>
-    load initial machine config from Lua script <filename>. If a field is omitted on
-    the config table, it will fall back into the respective command-line
-    argument or into the default value.
-
-  --load-json-config=<filename>
-    load initial machine config from JSON <filename>. If a field is omitted on
+  --load-config=<filename>[,format:<lua|json>]
+    load initial machine config from <filename>. If a field is omitted on
     the config table, it will fall back into the respective command-line
     argument or into the default value.
+    the format is taken from format: if given, else the filename extension
+    (.json/.lua), defaulting to Lua.
 
   --uarch-ram-image=<filename>
     name of file containing microarchitecture RAM image.
 
-  --dump-address-ranges[=<dir>]
-    dump all address ranges to files under <dir>.
+  --dump-memory-ranges[=<dir>]
+    dump all memory ranges to files under <dir>.
     If <dir> is omitted, files are written to the current directory.
 
   --assert-rolling-template
@@ -703,17 +810,17 @@ where options are:
   --no-init-splash
     don't show cartesi machine splash on boot.
 
-  -u=<name> or --user=<name>
+  -u <name> or --user=<name>
     appends to init the user who should execute the entrypoint command.
     when omitted, the user is set to "dapp" by rootfs init script.
 
-  -e=<name>=<value> or --env=<name>=<value>
+  -e <name>=<value> or --env=<name>=<value>
     appends to init an environment variable export.
 
-  -w=<dir> or --workdir=<dir>
+  -w <dir> or --workdir=<dir>
     appends to init the entrypoint working directory.
 
-  -h=<name> or --hostname=<name>
+  -h <name> or --hostname=<name>
     appends to init a machine hostname change.
 
   --append-init=<string>
@@ -762,7 +869,7 @@ and command and arguments:
   arguments
     the given command arguments.
 
-<number> can be specified in decimal (e.g., 16) or hexadeximal (e.g., 0x10),
+<number> can be specified in decimal (e.g., 16) or hexadecimal (e.g., 0x10),
 with a suffix multiplier (i.e., Ki, Mi, Gi for 2^10, 2^20, 2^30, respectively),
 or a left shift (e.g., 2 << 20).
 
@@ -780,9 +887,7 @@ local remote_shutdown = false
 local remote_create = true
 local remote_destroy = true
 local perform_rollbacks = true
-local default_config = cartesi.machine:get_default_config()
 local images_path = adjust_images_path(os.getenv("CARTESI_IMAGES_PATH"))
-
 local flash_label_to_index = { root = 1 }
 local flash_drives = {
     {
@@ -794,66 +899,66 @@ local flash_drive_count = 1
 local nvram_label_to_index = {}
 local nvrams = {}
 local nvram_count = 0
-local virtio = {}
 local virtio_net_user_config
 local virtio_volume_count = 0
 local has_virtio_console = false
 local has_network = false
 local has_sync_init_date = false
 local memory_range_replace = {}
-local ram = {
-    length = 128 << 20, -- 128MB
-    backing_store = {
-        data_filename = images_path .. "linux.bin",
-        dht_filename = "",
-        dpt_filename = "",
-    },
-}
 local init_splash = true
 local append_bootargs = ""
 local append_init = ""
 local append_entrypoint = ""
-local dtb = {
-    init = "",
-    entrypoint = "",
-    bootargs = default_config.dtb.bootargs,
-}
-local tlb = {}
-local cmio = {
-    rx_buffer = {},
-    tx_buffer = {},
-}
 local cmio_advance
 local cmio_inspect
-local processor = {
-    registers = {
-        iunrep = 0,
-        htif = {
-            iconsole = cartesi.HTIF_CONSOLE_CMD_PUTCHAR_MASK,
-            iyield = cartesi.HTIF_YIELD_CMD_AUTOMATIC_MASK | cartesi.HTIF_YIELD_CMD_MANUAL_MASK,
-        },
-    },
-}
-local uarch = {
+-- The machine configuration, assembled in place by the option handlers below and passed to
+-- machine:create. It is the requested ("command line") config; after creation, the machine's
+-- actual config is read back into initial_config.
+local cmdline_config = {
     processor = {
-        registers = {},
-        backing_store = {
-            data_filename = "",
-            dht_filename = "",
-            dpt_filename = "",
+        registers = {
+            iunrep = 0,
         },
     },
     ram = {
+        length = 128 << 20, -- 128MB
         backing_store = {
-            data_filename = "",
+            data_filename = images_path .. "linux.bin",
             dht_filename = "",
             dpt_filename = "",
         },
     },
-}
-local pmas = {}
-local hash_tree = {
-    hash_function = default_config.hash_tree.hash_function,
+    dtb = {
+        init = "",
+        entrypoint = "",
+    },
+    flash_drive = {},
+    nvram = {},
+    tlb = {},
+    virtio = {},
+    cmio = {
+        rx_buffer = {},
+        tx_buffer = {},
+    },
+    pmas = {},
+    uarch = {
+        processor = {
+            registers = {},
+            backing_store = {
+                data_filename = "",
+                dht_filename = "",
+                dpt_filename = "",
+            },
+        },
+        ram = {
+            backing_store = {
+                data_filename = "",
+                dht_filename = "",
+                dpt_filename = "",
+            },
+        },
+    },
+    hash_tree = {},
 }
 local console = {}
 local concurrency_update_hash_tree = 0
@@ -867,7 +972,7 @@ local periodic_hashes_period = math.maxinteger
 local periodic_hashes_start = 0
 local dense_uarch_hashes_start
 local dense_uarch_hashes_end
-local dump_address_ranges_dir = false
+local dump_memory_ranges_dir = false
 local max_mcycle = math.maxinteger
 local max_uarch_cycle = 0
 local log_step_uarch = false
@@ -881,9 +986,9 @@ local load_sharing
 local store_sharing
 local cmdline_opts_finished = false
 local store_config = false
-local store_json_config = false
+local store_config_format
 local load_config = false
-local load_json_config = false
+local load_config_format
 local gdb_address
 local exec_arguments = {}
 local assert_rolling_template = false
@@ -898,8 +1003,8 @@ local function set_empty_omitted_filenames(f)
     bs.dpt_filename = bs.dpt_filename or ""
 end
 
-local function parse_memory_range(opts, all, accepted)
-    local f = util.parse_options(opts, all, accepted)
+local function parse_memory_range(keys, all, opts)
+    local f = util.parse_options(keys, all, opts)
     f.backing_store = {
         data_filename = f.data_filename,
         dht_filename = f.dht_filename,
@@ -917,6 +1022,26 @@ local function parse_memory_range(opts, all, accepted)
     return f
 end
 
+-- Translate a sharing sub-option ("none"/"config"/"all") into its constant. The
+-- lookup table is filled in only after cartesi is required, because the options
+-- table that calls to_sharing is built earlier.
+local to_sharing_map
+local function to_sharing(s)
+    if s then return assert(to_sharing_map[s]) end
+    return nil
+end
+
+-- Choose the serialization format of a dump/load option. Precedence: the explicit
+-- format sub-key, then a recognized filename extension (.json/.lua), then "lua".
+local function resolve_format(format, filename)
+    if format then return format end
+    local extension = filename and filename:match("%.([^.]+)$")
+    if extension == "json" or extension == "lua" then
+        return extension
+    end
+    return "lua"
+end
+
 -- Override existing boolean with a new one
 local function override_bool(prev, b)
     if b == nil then return prev end
@@ -942,15 +1067,21 @@ local function override_memory_range(entry, opts)
     entry_bs.truncate = override_bool(entry_bs.truncate, opts_bs.truncate)
 end
 
-local function parse_backing_store(opts, all, def)
-    local f = util.parse_options(opts, all, {
-        data_filename = "string",
-        dht_filename = "string",
-        dpt_filename = "string",
-        shared = "boolean",
-        create = "boolean",
-        truncate = "boolean",
-    })
+-- Backing-store sub-keys shared by every plain backing-store option (--ram=,
+-- --dtb=, --processor=, --uarch-ram=, --uarch-processor=, --pmas=,
+-- --cmio-rx-buffer=, --cmio-tx-buffer=). Referenced as the bash-completion
+-- hint on each of those option entries.
+local backing_store_keys = {
+    data_filename = "file",
+    dht_filename = "file",
+    dpt_filename = "file",
+    shared = "boolean",
+    create = "boolean",
+    truncate = "boolean",
+}
+
+local function parse_backing_store(keys, all, opts, def)
+    local f = util.parse_options(keys, all, opts)
     if def then
         for i, v in pairs(def) do
             if f[i] == nil then f[i] = v end
@@ -961,7 +1092,7 @@ end
 
 local function handle_sync_init_date()
     if has_sync_init_date then return true end
-    processor.registers.iunrep = 1
+    cmdline_config.processor.registers.iunrep = 1
     has_sync_init_date = true
     -- round up time by 1, to decrease chance of guest time being in the past
     local seconds = os.time() + 1
@@ -970,16 +1101,16 @@ local function handle_sync_init_date()
 end
 
 local function handle_virtio_9p(tag, host_directory)
-    processor.registers.iunrep = 1
-    table.insert(virtio, { type = "p9fs", tag = tag, host_directory = host_directory })
+    cmdline_config.processor.registers.iunrep = 1
+    table.insert(cmdline_config.virtio, { type = "p9fs", tag = tag, host_directory = host_directory })
     return true
 end
 
 local function handle_volume_option(host_directory, guest_directory)
-    processor.registers.iunrep = 1
+    cmdline_config.processor.registers.iunrep = 1
     local tag = "vfs" .. virtio_volume_count
     virtio_volume_count = virtio_volume_count + 1
-    table.insert(virtio, { type = "p9fs", tag = tag, host_directory = host_directory })
+    table.insert(cmdline_config.virtio, { type = "p9fs", tag = tag, host_directory = host_directory })
     append_init = append_init .. "busybox mkdir -p " .. guest_directory .. " && "
     append_init = append_init .. "busybox mount -t 9p " .. tag .. " " .. guest_directory .. "\n"
     -- sync guest date with host date, otherwise file system updates will have wrong dates
@@ -988,29 +1119,32 @@ local function handle_volume_option(host_directory, guest_directory)
 end
 
 local function handle_htif_console_getchar()
-    processor.registers.htif.iconsole = processor.registers.htif.iconsole | cartesi.HTIF_CONSOLE_CMD_GETCHAR_MASK
-    processor.registers.iunrep = 1
+    cmdline_config.processor.registers.htif.iconsole = cmdline_config.processor.registers.htif.iconsole
+        | cartesi.HTIF_CONSOLE_CMD_GETCHAR_MASK
+    cmdline_config.processor.registers.iunrep = 1
     console.input_source = console.input_source or "from_stdin"
     console.output_flush_mode = console.output_flush_mode or "every_char"
     return true
 end
 
-local function handle_user(user)
+local function handle_user(_, _, user)
     append_init = append_init .. "USER=" .. user .. "\n"
     return true
 end
 
-local function handle_env(name, value)
+local function handle_env(_, _, opts)
+    local name, value = opts:match("^([%w_]+)=(.+)$")
+    assertf(name and value, "invalid env %s, expected NAME=VALUE", opts)
     append_init = append_init .. "export " .. name .. "=" .. value .. "\n"
     return true
 end
 
-local function handle_workdir(value)
+local function handle_workdir(_, _, value)
     append_init = append_init .. "WORKDIR=" .. value .. "\n"
     return true
 end
 
-local function handle_hostname(name)
+local function handle_hostname(_, _, name)
     append_init = append_init .. "busybox hostname " .. name .. "\n"
     return true
 end
@@ -1018,65 +1152,47 @@ end
 local function parse_ipv4(s)
     local a, b, c, d = s:match("^([0-9]+)%.([0-9]+)%.([0-9]+)%.([0-9]+)$")
     a, b, c, d = tonumber(a), tonumber(b), tonumber(c), tonumber(d)
-    assert(a and b and c and d and a <= 255 and b <= 255 and c <= 255 and d <= 255, "malformed IPv4 " .. s)
-    return (a << 24) | (b << 18) | (c << 8) | d
+    assertf(a and b and c and d and a <= 255 and b <= 255 and c <= 255 and d <= 255, "malformed IPv4 %s", s)
+    return (a << 24) | (b << 16) | (c << 8) | d -- pack octets big-endian: one byte each at bits 24, 16, 8, 0
 end
 
-local function handle_port_forward_option(opts)
-    if not opts then return false end
+-- Parse a port-forward address "[ip:]port" into (ip-or-nil, port).
+local function parse_port_forward_address(s, all)
+    local ip, port = s:match("^(%d+%.%d+%.%d+%.%d+):(%d+)$")
+    if ip then return parse_ipv4(ip), tonumber(port) end
+    port = s:match("^(%d+)$")
+    assertf(port, "invalid address %q in %s", s, all)
+    return nil, tonumber(port)
+end
+
+local function add_port_forward(host_ip, host_port, guest_ip, guest_port, is_udp)
     assert(virtio_net_user_config, "--port-forward option requires --network or --virtio-net=user option")
-    local host_ip, guest_ip, host_port, guest_port, proto
-    for s in opts:gmatch("[%w.]+") do
-        if (not host_port or not guest_port) and s:find("^[0-9]+$") then
-            if not host_port then
-                host_port = tonumber(s)
-            else
-                guest_port = tonumber(s)
-            end
-        elseif (not host_ip or not guest_ip) and s:find("^[0-9]+%.[0-9]+%.[0-9]+%.[0-9]+$") then
-            if not host_ip then
-                host_ip = parse_ipv4(s)
-            else
-                guest_ip = parse_ipv4(s)
-            end
-        elseif proto == nil and (s == "tcp" or s == "udp") then
-            proto = s
-        else
-            error("malformed --port-forward option")
-        end
-    end
-    host_ip = host_ip or parse_ipv4("127.0.0.1")
-    guest_ip = guest_ip or parse_ipv4("10.0.2.15")
-    assert(host_port, "malformed --port-forward option")
-    guest_port = guest_port or host_port
-    local is_udp = proto == "udp"
+    assert(host_port, "missing host port in port forward")
     virtio_net_user_config.hostfwd = virtio_net_user_config.hostfwd or {}
     table.insert(virtio_net_user_config.hostfwd, {
         is_udp = is_udp,
-        host_ip = host_ip,
-        guest_ip = guest_ip,
+        host_ip = host_ip or parse_ipv4("127.0.0.1"),
+        guest_ip = guest_ip or parse_ipv4("10.0.2.15"),
         host_port = host_port,
-        guest_port = guest_port,
+        guest_port = guest_port or host_port,
     })
     return true
 end
 
-local function handle_virtio_net(mode, opts)
-    if not mode then return false end
-    processor.registers.iunrep = 1
+local function handle_virtio_net(mode)
+    cmdline_config.processor.registers.iunrep = 1
     if mode == "user" then
         if not virtio_net_user_config then
             virtio_net_user_config = { type = "net-user" }
-            table.insert(virtio, virtio_net_user_config)
+            table.insert(cmdline_config.virtio, virtio_net_user_config)
         end
     else
-        table.insert(virtio, { type = "net-tuntap", iface = opts })
+        table.insert(cmdline_config.virtio, { type = "net-tuntap", iface = mode })
     end
     return true
 end
 
-local function handle_network_option(opts)
-    if not opts then return false end
+local function handle_network_option()
     if has_network then return true end
     handle_virtio_net("user")
     has_network = true
@@ -1095,13 +1211,13 @@ end
 
 local function handle_virtio_console()
     if has_virtio_console then return true end
-    processor.registers.iunrep = 1
+    cmdline_config.processor.registers.iunrep = 1
     console.input_source = console.input_source or "from_stdin"
     console.output_flush_mode = console.output_flush_mode or "every_char"
     has_virtio_console = true
     -- Switch from HTIF Console (hvc0) to VirtIO console (hvc1)
-    dtb.bootargs = dtb.bootargs:gsub("console=hvc0", "console=hvc1")
-    table.insert(virtio, 1, { type = "console" })
+    cmdline_config.dtb.bootargs = cmdline_config.dtb.bootargs:gsub("console=hvc0", "console=hvc1")
+    table.insert(cmdline_config.virtio, 1, { type = "console" })
     return true
 end
 
@@ -1115,6 +1231,19 @@ local function handle_interactive()
     return true
 end
 
+local options -- forward declaration for handle_bash_completion
+
+local function handle_bash_completion()
+    -- Register the canonical names plus whatever the user invoked
+    -- this script as (e.g. ./cartesi-machine), so `source <(...)`
+    -- works from any invocation path.
+    local progs = { "cartesi-machine", "cartesi-machine.lua" }
+    local self = arg[0]
+    if self and self ~= progs[1] and self ~= progs[2] then progs[#progs + 1] = self end
+    bash.dump_bash_completion(options, progs)
+    os.exit()
+end
+
 -- List of supported options
 -- Options are processed in order
 -- For each option,
@@ -1122,9 +1251,15 @@ end
 --   second entry is a callback
 --     if callback returns true, the option is accepted.
 --     if callback returns false, the option is rejected.
-local options = {
-    {
-        "^%-h$",
+--   optional third entry is a bash-completion hint: a string like "file",
+--     "dir", "number", "hostport", "netif" (trailing `?` means the value is
+--     optional, i.e. the flag accepts both bare and `=value` forms), or a
+--     util.parse_options keys spec for compound `key:val,...` arguments. If
+--     present, the dispatcher forwards it to the callback as its first
+--     argument (callbacks that ignore the hint declare it as `_`).
+options = {
+    {
+        "--help",
         function()
             print_help()
             os.exit()
@@ -1132,15 +1267,11 @@ local options = {
         end,
     },
     {
-        "^%-%-help$",
-        function()
-            print_help()
-            os.exit()
-            -- return true
-        end,
+        "--bash-completion",
+        handle_bash_completion,
     },
     {
-        "^%-%-version$",
+        "--version",
         function()
             print(string.format("cartesi-machine %s", cartesi.VERSION))
             if cartesi.GIT_COMMIT then print(string.format("git commit: %s", cartesi.GIT_COMMIT)) end
@@ -1153,7 +1284,7 @@ local options = {
         end,
     },
     {
-        "^%-%-version%-json$",
+        "--version-json",
         function()
             print("{")
             print(string.format('  "version": "%s",', cartesi.VERSION))
@@ -1173,47 +1304,48 @@ local options = {
         end,
     },
     {
-        "^%-%-assert%-version%=(%d+)%.(%d+)%.?(%d*)$",
-        function(major, minor, patch)
+        "--assert-version=",
+        function(_, all, v)
+            local major, minor, patch = v:match("^(%d+)%.(%d+)%.?(%d*)$")
+            assertf(major, "invalid option %s", all)
             major, minor, patch = tonumber(major), tonumber(minor), tonumber(patch)
             if
                 major ~= cartesi.VERSION_MAJOR
                 or minor ~= cartesi.VERSION_MINOR
                 or (patch and patch ~= cartesi.VERSION_PATCH)
             then
-                error(
-                    string.format(
-                        "emulator version mismatch, expected (%d.%d.%s) but got (%d.%d.%d)",
-                        major,
-                        minor,
-                        patch or "x",
-                        cartesi.VERSION_MAJOR,
-                        cartesi.VERSION_MINOR,
-                        cartesi.VERSION_PATCH
-                    )
+                errorf(
+                    "emulator version mismatch, expected (%d.%d.%s) but got (%d.%d.%d)",
+                    major,
+                    minor,
+                    patch or "x",
+                    cartesi.VERSION_MAJOR,
+                    cartesi.VERSION_MINOR,
+                    cartesi.VERSION_PATCH
                 )
             end
             return true
         end,
     },
     {
-        "^%-%-dtb%-image%=(.+)$",
-        function(opts)
-            dtb.backing_store = dtb.backing_store or {}
-            dtb.backing_store.data_filename = opts
+        "--dtb-image=",
+        function(_, _, opts)
+            cmdline_config.dtb.backing_store = cmdline_config.dtb.backing_store or {}
+            cmdline_config.dtb.backing_store.data_filename = opts
             return true
         end,
+        "file",
     },
     {
-        "^%-%-no%-bootargs$",
+        "--no-bootargs",
         function()
-            dtb.bootargs = ""
+            cmdline_config.dtb.bootargs = ""
             return true
         end,
     },
     {
-        "^%-%-append%-bootargs%=(.+)$",
-        function(opts)
+        "--append-bootargs=",
+        function(_, _, opts)
             if #append_bootargs == 0 then
                 append_bootargs = opts
             else
@@ -1223,169 +1355,215 @@ local options = {
         end,
     },
     {
-        "^(%-%-dtb%=(.+))$",
-        function(all, opts)
-            dtb.backing_store = parse_backing_store(opts, all, dtb.backing_store)
+        "--dtb=",
+        function(keys, all, opts)
+            cmdline_config.dtb.backing_store = parse_backing_store(keys, all, opts, cmdline_config.dtb.backing_store)
             return true
         end,
+        backing_store_keys,
     },
     {
-        "^(%-%-processor%=(.+))$",
-        function(all, opts)
-            processor.backing_store = parse_backing_store(opts, all, processor.backing_store)
+        "--processor=",
+        function(keys, all, opts)
+            cmdline_config.processor.backing_store =
+                parse_backing_store(keys, all, opts, cmdline_config.processor.backing_store)
             return true
         end,
+        backing_store_keys,
     },
     {
-        "^(%-%-uarch%-processor%=(.+))$",
-        function(all, opts)
-            uarch.processor.backing_store = parse_backing_store(opts, all, uarch.processor.backing_store)
+        "--uarch-processor=",
+        function(keys, all, opts)
+            cmdline_config.uarch.processor.backing_store =
+                parse_backing_store(keys, all, opts, cmdline_config.uarch.processor.backing_store)
             return true
         end,
+        backing_store_keys,
     },
     {
-        "^%-%-ram%-length%=(.+)$",
-        function(n)
-            ram.length = assert(util.parse_number(n), "invalid RAM length " .. n)
+        "--ram-length=",
+        function(_, _, n)
+            cmdline_config.ram.length = assertf(util.parse_number(n), "invalid RAM length %s", n)
             return true
         end,
     },
     {
-        "^%-%-ram%-image%=(.+)$",
-        function(opts)
-            ram.backing_store.data_filename = opts
+        "--ram-image=",
+        function(_, _, opts)
+            cmdline_config.ram.backing_store.data_filename = opts
             return true
         end,
+        "file",
     },
     {
-        "^%-%-no%-ram%-image$",
+        "--no-ram-image",
         function()
-            ram.backing_store.data_filename = ""
+            cmdline_config.ram.backing_store.data_filename = ""
             return true
         end,
     },
     {
-        "^(%-%-ram%=(.+))$",
-        function(all, opts)
-            ram.backing_store = parse_backing_store(opts, all, ram.backing_store)
+        "--ram=",
+        function(keys, all, opts)
+            cmdline_config.ram.backing_store = parse_backing_store(keys, all, opts, cmdline_config.ram.backing_store)
             return true
         end,
+        backing_store_keys,
     },
     {
-        "^(%-%-pmas%=(.+))$",
-        function(all, opts)
-            pmas.backing_store = parse_backing_store(opts, all, pmas.backing_store)
+        "--pmas=",
+        function(keys, all, opts)
+            cmdline_config.pmas.backing_store = parse_backing_store(keys, all, opts, cmdline_config.pmas.backing_store)
             return true
         end,
+        backing_store_keys,
     },
     {
-        "^%-%-uarch%-ram%-image%=(.+)$",
-        function(opts)
-            uarch.ram.backing_store.data_filename = opts
+        "--uarch-ram-image=",
+        function(_, _, opts)
+            cmdline_config.uarch.ram.backing_store.data_filename = opts
             return true
         end,
+        "file",
     },
     {
-        "^(%-%-uarch%-ram%=(.+))$",
-        function(all, opts)
-            uarch.ram.backing_store = parse_backing_store(opts, all, uarch.ram.backing_store)
+        "--uarch-ram=",
+        function(keys, all, opts)
+            cmdline_config.uarch.ram.backing_store =
+                parse_backing_store(keys, all, opts, cmdline_config.uarch.ram.backing_store)
             return true
         end,
+        backing_store_keys,
     },
     {
-        "^(%-%-hash%-tree%=(.+))$",
-        function(all, opts)
-            local h = util.parse_options(opts, all, {
-                hash_function = "string",
-                sht_filename = "string",
-                phtc_filename = "string",
-                phtc_size = "number",
-                shared = "boolean",
-            })
+        "--hash-tree=",
+        function(keys, all, opts)
+            local h = util.parse_options(keys, all, opts)
             h.sht_filename = h.sht_filename or ""
             h.phtc_filename = h.phtc_filename or ""
             h.hash_function = h.hash_function or "keccak256"
             for i, v in pairs(h) do
-                hash_tree[i] = v
+                cmdline_config.hash_tree[i] = v
             end
             return true
         end,
+        {
+            hash_function = { keccak256 = "keccak256", sha256 = "sha256" },
+            sht_filename = "file",
+            phtc_filename = "file",
+            phtc_size = "number",
+            shared = "boolean",
+        },
     },
     {
-        "^%-%-unreproducible$",
+        "--unreproducible",
         function()
-            processor.registers.iunrep = 1
+            cmdline_config.processor.registers.iunrep = 1
             return true
         end,
     },
     {
-        "^%-%-sync%-init%-date$",
+        "--sync-init-date",
         handle_sync_init_date,
     },
     {
-        "^%-%-virtio%-9p%=([%w_-]+):(.*)$",
-        handle_virtio_9p,
+        "--virtio-9p=",
+        function(keys, all, opts)
+            local p = util.parse_options(keys, all, opts)
+            assertf(p.tag and p.host_directory, "need tag and host_directory in %s", all)
+            return handle_virtio_9p(p.tag, p.host_directory)
+        end,
+        { tag = "string", host_directory = "dir" },
     },
     {
-        "^%-v%=([^:]+):(.*)$",
-        handle_volume_option,
+        "--volume=",
+        function(keys, all, opts)
+            local v = util.parse_options(keys, all, opts)
+            assertf(v.host_directory and v.guest_directory, "need host_directory and guest_directory in %s", all)
+            return handle_volume_option(v.host_directory, v.guest_directory)
+        end,
+        { host_directory = "dir", guest_directory = "dir" },
     },
     {
-        "^%-%-volume%=([^:]+):(.*)$",
-        handle_volume_option,
+        -- docker bind-mount short form: -v <host_dir>:<guest_dir>
+        "-v=",
+        function(_, all, value)
+            local host_dir, guest_dir = value:match("^([^:]+):(.+)$")
+            assertf(host_dir, "invalid option %s", all)
+            return handle_volume_option(host_dir, guest_dir)
+        end,
+        "dir",
     },
     {
-        "^%-%-virtio%-console$",
+        "--virtio-console",
         handle_virtio_console,
     },
     {
-        "^%-%-virtio%-net%=([%w+]+),?([%w:,]*)$",
-        handle_virtio_net,
+        "--virtio-net=",
+        function(_, _, value) return handle_virtio_net(value) end,
     },
     {
-        "^%-%-network=?([%w:,]*)$",
+        "--network",
         handle_network_option,
     },
     {
-        "^%-n=?([%w:,]*)$",
+        "-n",
         handle_network_option,
     },
     {
-        "^%-%-port%-forward=([0-9:.]+/?[udptcp]*)$",
-        handle_port_forward_option,
+        "--port-forward=",
+        function(keys, all, opts)
+            local p = util.parse_options(keys, all, opts)
+            assertf(p.host_address, "need host_address in %s", all)
+            local host_ip, host_port = parse_port_forward_address(p.host_address, all)
+            local guest_ip, guest_port
+            if p.guest_address then
+                guest_ip, guest_port = parse_port_forward_address(p.guest_address, all)
+            end
+            return add_port_forward(host_ip, host_port, guest_ip, guest_port, p.protocol == "udp")
+        end,
+        { host_address = "string", guest_address = "string", protocol = { tcp = "tcp", udp = "udp" } },
     },
     {
-        "^%-p=([0-9:.]+/?[udptcp]*)$",
-        handle_port_forward_option,
+        -- docker publish short form: -p [hostip:]hostport:guestport[/protocol]
+        "-p=",
+        function(_, all, value)
+            local body, protocol = value:match("^(.-)/([a-z]+)$")
+            if not body then
+                body, protocol = value, "tcp"
+            end
+            assertf(protocol == "tcp" or protocol == "udp", "invalid protocol in %s", all)
+            local host_ip, host_port, guest_port = body:match("^(%d+%.%d+%.%d+%.%d+):(%d+):(%d+)$")
+            if host_ip then
+                return add_port_forward(
+                    parse_ipv4(host_ip),
+                    tonumber(host_port),
+                    nil,
+                    tonumber(guest_port),
+                    protocol == "udp"
+                )
+            end
+            host_port, guest_port = body:match("^(%d+):(%d+)$")
+            assertf(host_port, "invalid option %s", all)
+            return add_port_forward(nil, tonumber(host_port), nil, tonumber(guest_port), protocol == "udp")
+        end,
     },
     {
-        "^%-%-htif%-console%-getchar$",
+        "--htif-console-getchar",
         handle_htif_console_getchar,
     },
     {
-        "^%-i$",
+        "-i",
         handle_htif_console_getchar,
     },
     {
-        "^%-it$",
+        "-it",
         handle_interactive,
     },
     {
-        "^(%-%-console%-io%=(.+))$",
-        function(all, opts)
-            local c = util.parse_options(opts, all, {
-                output_destination = "string",
-                output_flush_mode = "string",
-                output_buffer_size = "number",
-                output_fd = "number",
-                output_filename = "string",
-                input_source = "string",
-                input_buffer_size = "number",
-                input_fd = "number",
-                input_filename = "string",
-                tty_cols = "number",
-                tty_rows = "number",
-            })
+        "--console-io=",
+        function(keys, all, opts)
+            local c = util.parse_options(keys, all, opts)
             if c.output_fd then
                 assert(
                     c.output_destination == nil or c.output_destination == "to_fd",
@@ -1424,41 +1602,57 @@ local options = {
             if c.tty_rows then console.tty_rows = c.tty_rows end
             return true
         end,
+        {
+            output_destination = {
+                to_null = "to_null",
+                to_stdout = "to_stdout",
+                to_stderr = "to_stderr",
+                to_fd = "to_fd",
+                to_file = "to_file",
+                to_buffer = "to_buffer",
+            },
+            output_flush_mode = {
+                when_full = "when_full",
+                every_char = "every_char",
+                every_line = "every_line",
+            },
+            output_buffer_size = "number",
+            output_fd = "number",
+            output_filename = "file",
+            input_source = {
+                from_null = "from_null",
+                from_stdin = "from_stdin",
+                from_fd = "from_fd",
+                from_file = "from_file",
+                from_buffer = "from_buffer",
+            },
+            input_buffer_size = "number",
+            input_fd = "number",
+            input_filename = "file",
+            tty_cols = "number",
+            tty_rows = "number",
+        },
     },
     {
-        "^%-%-no%-htif%-yield%-manual$",
-        function(all)
-            if not all then return false end
-            processor.registers.htif.iyield = processor.registers.htif.iyield & ~cartesi.HTIF_YIELD_CMD_MANUAL_MASK
+        "--no-htif-yield-manual",
+        function()
+            cmdline_config.processor.registers.htif.iyield = cmdline_config.processor.registers.htif.iyield
+                & ~cartesi.HTIF_YIELD_CMD_MANUAL_MASK
             return true
         end,
     },
     {
-        "^%-%-no%-htif%-yield%-automatic$",
-        function(all)
-            if not all then return false end
-            processor.registers.htif.iyield = processor.registers.htif.iyield & ~cartesi.HTIF_YIELD_CMD_AUTOMATIC_MASK
+        "--no-htif-yield-automatic",
+        function()
+            cmdline_config.processor.registers.htif.iyield = cmdline_config.processor.registers.htif.iyield
+                & ~cartesi.HTIF_YIELD_CMD_AUTOMATIC_MASK
             return true
         end,
     },
     {
-        "^(%-%-flash%-drive%=(.+))$",
-        function(all, opts)
-            local f = parse_memory_range(opts, all, {
-                label = "string",
-                data_filename = "string",
-                dht_filename = "string",
-                dpt_filename = "string",
-                shared = "boolean",
-                create = "boolean",
-                truncate = "boolean",
-                length = "number",
-                start = "number",
-                read_only = "boolean",
-                mount = "string",
-                mke2fs = "boolean",
-                user = "string",
-            })
+        "--flash-drive=",
+        function(keys, all, opts)
+            local f = parse_memory_range(keys, all, opts)
             if f.label and flash_label_to_index[f.label] then
                 local prev_f = flash_drives[flash_label_to_index[f.label]]
                 override_memory_range(prev_f, f)
@@ -1471,23 +1665,27 @@ local options = {
             end
             return true
         end,
+        {
+            "data_filename", -- positional: --flash-drive=foo.ext2
+            label = "string",
+            data_filename = "file",
+            dht_filename = "file",
+            dpt_filename = "file",
+            shared = "boolean",
+            create = "boolean",
+            truncate = "boolean",
+            length = "number",
+            start = "number",
+            read_only = "boolean",
+            mount = "string",
+            mke2fs = "boolean",
+            user = "string",
+        },
     },
     {
-        "^(%-%-nvram%=(.+))$",
-        function(all, opts)
-            local f = parse_memory_range(opts, all, {
-                label = "string",
-                data_filename = "string",
-                dht_filename = "string",
-                dpt_filename = "string",
-                shared = "boolean",
-                create = "boolean",
-                truncate = "boolean",
-                length = "number",
-                start = "number",
-                read_only = "boolean",
-                user = "string",
-            })
+        "--nvram=",
+        function(keys, all, opts)
+            local f = parse_memory_range(keys, all, opts)
             if f.label and nvram_label_to_index[f.label] then
                 local prev_f = nvrams[nvram_label_to_index[f.label]]
                 override_memory_range(prev_f, f)
@@ -1498,65 +1696,98 @@ local options = {
             end
             return true
         end,
+        {
+            "data_filename", -- positional: --nvram=foo.bin
+            label = "string",
+            data_filename = "file",
+            dht_filename = "file",
+            dpt_filename = "file",
+            shared = "boolean",
+            create = "boolean",
+            truncate = "boolean",
+            length = "number",
+            start = "number",
+            read_only = "boolean",
+            user = "string",
+        },
     },
     {
-        "^(%-%-replace%-memory%-range%=(.+))$",
-        function(all, opts)
-            local f = parse_memory_range(opts, all, {
-                label = "string",
-                data_filename = "string",
-                dht_filename = "string",
-                dpt_filename = "string",
-                shared = "boolean",
-                length = "number",
-                start = "number",
-                read_only = "boolean",
-            })
+        "--replace-memory-range=",
+        function(keys, all, opts)
+            local f = parse_memory_range(keys, all, opts)
             memory_range_replace[#memory_range_replace + 1] = f
             return true
         end,
+        {
+            label = "string",
+            data_filename = "file",
+            dht_filename = "file",
+            dpt_filename = "file",
+            shared = "boolean",
+            length = "number",
+            start = "number",
+            read_only = "boolean",
+        },
     },
     {
-        "^(%-%-cmio%-advance%-state%=(.+))$",
-        function(all, opts)
-            local r = util.parse_options(opts, all, {
-                input = "string",
-                input_index_begin = "number",
-                input_index_end = "number",
-                output_hashes_root_hash = "string",
-                output = "string",
-                report = "string",
-                hashes = "boolean",
-            })
+        "--cmio-advance-state=",
+        function(keys, all, opts)
+            local r = util.parse_options(keys, all, opts)
             r.input = r.input or "input-%i.bin"
             r.input_index_begin = r.input_index_begin or 0
             r.input_index_end = r.input_index_end or 0
-            r.output = r.output or "input-%i-output-%o.bin"
+            -- %o is the global output index (the proof's target_address), %i the input it came from.
+            -- An empty value ("") disables writing that file.
+            r.output = r.output or "output-%o-input-%i.bin"
+            r.rejected_output = r.rejected_output or "rejected-output-%o-input-%i.bin"
+            -- When the user does not override output_proof, the default filename's extension tracks
+            -- "format" (default lua), so format:json alone yields a .json file. An explicit
+            -- output_proof is left as the user wrote it (format still selects the content).
+            r.output_proof = r.output_proof or ("output-%o-input-%i-proof." .. (r.format or "lua"))
             r.report = r.report or "input-%i-report-%o.bin"
-            r.output_hashes_root_hash = r.output_hashes_root_hash or "input-%i-output-hahes-root-hash.bin"
+            r.output_hashes_root_hash = r.output_hashes_root_hash or "input-%i-output-hashes-root-hash.bin"
+            -- Like output_proof, the default extension tracks "format" while an explicit value is left as-is.
+            r.output_hashes_root_hash_proof = r.output_hashes_root_hash_proof
+                or ("input-%i-output-hashes-root-hash-proof." .. (r.format or "lua"))
+            if r.check_output_hashes_root_hash == nil then r.check_output_hashes_root_hash = true end
             r.next_input_index = r.input_index_begin
             cmio_advance = r
             return true
         end,
+        {
+            input = "file",
+            input_index_begin = "number",
+            input_index_end = "number",
+            output_hashes_root_hash = "file",
+            output_hashes_root_hash_proof = "file",
+            output = "file",
+            rejected_output = "file",
+            output_proof = "file",
+            last_output_proof = "file",
+            format = { lua = "lua", json = "json" },
+            report = "file",
+            check_output_hashes_root_hash = "boolean",
+            hashes = "boolean",
+        },
     },
     {
-        "^(%-%-cmio%-inspect%-state%=(.+))$",
-        function(all, opts)
-            local r = util.parse_options(opts, all, {
-                query = "string",
-                report = "string",
-                hashes = "boolean",
-            })
+        "--cmio-inspect-state=",
+        function(keys, all, opts)
+            local r = util.parse_options(keys, all, opts)
             r.query = r.query or "query.bin"
             r.report = r.report or "query-report-%o.bin"
             cmio_inspect = r
             return true
         end,
+        {
+            query = "file",
+            report = "file",
+            hashes = "boolean",
+        },
     },
     {
-        "^%-%-cmio%-inspect%-state$",
-        function(all)
-            if not all then return false end
+        "--cmio-inspect-state",
+        function()
             cmio_inspect = {
                 query = "query.bin",
                 report = "query-report-%o.bin",
@@ -1565,495 +1796,555 @@ local options = {
         end,
     },
     {
-        "^(%-%-concurrency%=(.+))$",
-        function(all, opts)
-            local c = util.parse_options(opts, all, {
-                update_hash_tree = "number",
-            })
-            c.update_hash_tree = assert(c.update_hash_tree, "invalid update_hash_tree number in " .. all)
+        "--concurrency=",
+        function(keys, all, opts)
+            local c = util.parse_options(keys, all, opts)
+            c.update_hash_tree = assertf(c.update_hash_tree, "invalid update_hash_tree number in %s", all)
             concurrency_update_hash_tree = c.update_hash_tree
             return true
         end,
+        { update_hash_tree = "number" },
     },
     {
-        "^%-%-skip%-version%-check$",
-        function(all)
-            if not all then return false end
+        "--skip-version-check",
+        function()
             skip_version_check = true
             return true
         end,
     },
     {
-        "^%-%-no%-reserve$",
-        function(all)
-            if not all then return false end
+        "--no-reserve",
+        function()
             no_reserve = true
             return true
         end,
     },
     {
-        "^(%-%-initial%-proof%=(.+))$",
-        function(all, opts)
-            local p = util.parse_options(opts, all, {
-                address = "number",
-                log2_size = "number",
-                filename = "string",
-            })
+        "--initial-proof=",
+        function(keys, all, opts)
+            local p = util.parse_options(keys, all, opts)
+            assertf(p.address and p.log2_size or p.label, "need address and log2_size or label in %s", all)
             p.cmdline = all
-            assert(p.log2_size >= 3, "log2_size must be at least 3 in " .. all)
+            p.format = resolve_format(p.format, p.filename)
             initial_proof[#initial_proof + 1] = p
             return true
         end,
+        {
+            label = "string",
+            address = "number",
+            log2_size = "number",
+            filename = "file",
+            format = { lua = "lua", json = "json" },
+        },
     },
     {
-        "^(%-%-final%-proof%=(.+))$",
-        function(all, opts)
-            if not opts then return false end
-            local p = util.parse_options(opts, all, {
-                address = "number",
-                log2_size = "number",
-                filename = "string",
-            })
+        "--final-proof=",
+        function(keys, all, opts)
+            local p = util.parse_options(keys, all, opts)
+            assertf(p.address and p.log2_size or p.label, "need address and log2_size or label in %s", all)
             p.cmdline = all
-            assert(p.log2_size >= 3, "log2_size must be at least 3 in " .. all)
+            p.format = resolve_format(p.format, p.filename)
             final_proof[#final_proof + 1] = p
             return true
         end,
+        {
+            label = "string",
+            address = "number",
+            log2_size = "number",
+            filename = "file",
+            format = { lua = "lua", json = "json" },
+        },
     },
     {
-        "^%-%-no%-root%-flash%-drive$",
-        function(all)
-            if not all then return false end
+        "--no-root-flash-drive",
+        function()
             assert(flash_drives[1] and flash_drives[1].label == "root", "no root flash drive to remove")
             flash_drives[1] = nil
             flash_label_to_index.root = nil
-            dtb.bootargs = dtb.bootargs:gsub(cartesi.DTB_BOOTARGS_ROOT:gsub("[^%w]", "%%%1"), "")
+            cmdline_config.dtb.bootargs =
+                cmdline_config.dtb.bootargs:gsub(cartesi.DTB_BOOTARGS_ROOT_PART:gsub("[^%w]", "%%%1"), "")
+            cmdline_config.dtb.bootargs =
+                cmdline_config.dtb.bootargs:gsub(cartesi.DTB_BOOTARGS_INIT_PART:gsub("[^%w]", "%%%1"), "")
             return true
         end,
     },
     {
-        "^%-%-dump%-address%-ranges(%=?)(%g*)$",
-        function(opts, v)
-            if not opts then return false end
-            if opts == "=" then
-                if not v or #v < 1 then return false end
-                dump_address_ranges_dir = v
-            elseif #v ~= 0 then
-                return false
-            else
-                dump_address_ranges_dir = true
-            end
+        "--dump-memory-ranges",
+        function()
+            dump_memory_ranges_dir = true
+            return true
+        end,
+    },
+    {
+        "--dump-memory-ranges=",
+        function(_, _, v)
+            dump_memory_ranges_dir = v
             return true
         end,
+        "dir",
     },
     {
-        "^%-%-assert%-rolling%-template$",
-        function(all)
-            if not all then return false end
+        "--assert-rolling-template",
+        function()
             assert_rolling_template = true
             return true
         end,
     },
     {
-        "^%-%-quiet$",
-        function(all)
-            if not all then return false end
+        "--quiet",
+        function()
             stderr = function() end
             return true
         end,
     },
     {
-        "^%-%-log%-step%=(.*),(.*)$",
-        function(count, filename)
-            if (not count) or not filename then return false end
-            log_step_mcycle_count = assert(util.parse_number(count), "invalid steps " .. count)
-            log_step_filename = filename
+        "--log-step=",
+        function(keys, all, opts)
+            local o = util.parse_options(keys, all, opts)
+            assertf(o.filename and o.count, "need filename and count in %s", all)
+            log_step_mcycle_count = o.count
+            log_step_filename = o.filename
             return true
         end,
+        {
+            "filename",
+            filename = "file",
+            count = "number",
+        },
     },
     {
-        "^%-%-log%-step%-uarch$",
-        function(all)
-            if not all then return false end
+        "--log-step-uarch",
+        function()
             log_step_uarch = true
             return true
         end,
     },
     {
-        "^%-%-log%-reset%-uarch$",
-        function(all)
-            if not all then return false end
+        "--log-reset-uarch",
+        function()
             log_reset_uarch = true
             return true
         end,
     },
     {
-        "^(%-%-max%-mcycle%=(.*))$",
-        function(all, n)
-            if not n then return false end
-            max_mcycle = assert(util.parse_number(n), "invalid option " .. all)
+        "--max-mcycle=",
+        function(_, all, n)
+            max_mcycle = assertf(util.parse_number(n), "invalid option %s", all)
             return true
         end,
     },
     {
-        "^(%-%-max%-uarch%-cycle%=(.*))$",
-        function(all, n)
-            if not n then return false end
-            max_uarch_cycle = assert(util.parse_number(n), "invalid option " .. all)
+        "--max-uarch-cycle=",
+        function(_, all, n)
+            max_uarch_cycle = assertf(util.parse_number(n), "invalid option %s", all)
             return true
         end,
     },
     {
-        "^%-%-auto%-reset%-uarch$",
-        function(all)
-            if not all then return false end
+        "--auto-reset-uarch",
+        function()
             auto_reset_uarch = true
             return true
         end,
     },
     {
-        "^%-%-create%=(.*)$",
-        function(opts)
+        "--create=",
+        function(_, _, opts)
             if not opts or #opts < 1 then return false end
             create_dir = opts
             return true
         end,
+        "dir",
     },
     {
-        "^%-%-load%=(([^,]+),?(.*))$",
-        function(all, dir, opts)
-            if not all or not dir then return false end
-            if #opts > 0 then
-                local o = util.parse_options(opts, all, {
-                    clone = "string",
-                    sharing = {
-                        none = cartesi.SHARING_NONE,
-                        config = cartesi.SHARING_CONFIG,
-                        all = cartesi.SHARING_ALL,
-                    },
-                })
-                clone_dir = o.clone
-                load_sharing = o.sharing
-                if clone_dir and not load_sharing then load_sharing = cartesi.SHARING_ALL end
-            end
-            load_dir = dir
+        "--load=",
+        function(keys, all, opts)
+            local o = util.parse_options(keys, all, opts)
+            assertf(o.directory, "need directory in %s", all)
+            clone_dir = o.clone
+            load_sharing = to_sharing(o.sharing)
+            if clone_dir and not load_sharing then load_sharing = cartesi.SHARING_ALL end
+            load_dir = o.directory
             return true
         end,
+        {
+            "directory",
+            directory = "dir",
+            clone = "dir",
+            sharing = { none = "none", config = "config", all = "all" },
+        },
     },
     {
-        "^%-%-store%=(([^,]+),?(.*))$",
-        function(all, dir, opts)
-            if not all or not dir then return false end
-            if #opts > 0 then
-                local o = util.parse_options(opts, all, {
-                    sharing = {
-                        none = cartesi.SHARING_NONE,
-                        config = cartesi.SHARING_CONFIG,
-                        all = cartesi.SHARING_ALL,
-                    },
-                })
-                store_sharing = o.sharing
-            end
-            store_dir = dir
+        "--store=",
+        function(keys, all, opts)
+            local o = util.parse_options(keys, all, opts)
+            assertf(o.directory, "need directory in %s", all)
+            store_sharing = to_sharing(o.sharing)
+            store_dir = o.directory
             return true
         end,
+        {
+            "directory",
+            directory = "dir",
+            sharing = { none = "none", config = "config", all = "all" },
+        },
     },
     {
-        "^%-%-remote%-spawn$",
-        function(opts)
-            if not opts then return false end
+        "--remote-spawn",
+        function()
             remote_spawn = true
             return true
         end,
     },
     {
-        "^%-%-remote%-address%=(.*)$",
-        function(opts)
+        "--remote-address=",
+        function(_, _, opts)
             if not opts or #opts < 1 then return false end
             remote_address = opts
             return true
         end,
     },
     {
-        "^%-%-remote%-fork(%=?)(.*)$",
-        function(opts, v)
-            if not opts then return false end
-            if opts == "=" then
-                if not v or #v < 1 then return false end
-                remote_fork = v
-            elseif #v ~= 0 then
-                return false
-            else
-                remote_fork = true
-            end
+        "--remote-fork",
+        function()
+            remote_fork = true
             return true
         end,
     },
     {
-        "^%-%-remote%-health%-check$",
-        function(opts)
-            if not opts then return false end
+        "--remote-fork=",
+        function(_, _, v)
+            remote_fork = v
+            return true
+        end,
+        "hostport",
+    },
+    {
+        "--remote-health-check",
+        function()
             remote_health_check = true
             return true
         end,
     },
     {
-        "^%-%-remote%-shutdown$",
-        function(opts)
-            if not opts then return false end
+        "--remote-shutdown",
+        function()
             remote_shutdown = true
             return true
         end,
     },
     {
-        "^%-%-no%-remote%-create$",
-        function(opts)
-            if not opts then return false end
+        "--no-remote-create",
+        function()
             remote_create = false
             return true
         end,
     },
     {
-        "^%-%-no%-remote%-destroy$",
-        function(opts)
-            if not opts then return false end
+        "--no-remote-destroy",
+        function()
             remote_destroy = false
             return true
         end,
     },
     {
-        "^%-%-no%-rollback$",
-        function(opts)
-            if not opts then return false end
+        "--no-rollback",
+        function()
             perform_rollbacks = false
             return true
         end,
     },
     {
-        "^%-%-initial%-hash$",
-        function(all)
-            if not all then return false end
+        "--initial-hash",
+        function()
             initial_hash = true
             return true
         end,
     },
     {
-        "^%-%-final%-hash$",
-        function(all)
-            if not all then return false end
-            final_hash = true
+        "--initial-hash=",
+        function(_, _, v)
+            initial_hash = v
             return true
         end,
+        "filename",
     },
     {
-        "^(%-%-periodic%-hashes%=(.*))$",
-        function(all, v)
-            if not v then return false end
-            string.gsub(v, "^([^%,]+),(.+)$", function(p, s)
-                periodic_hashes_period = assert(util.parse_number(p), "invalid period " .. all)
-                periodic_hashes_start = assert(util.parse_number(s), "invalid start " .. all)
-            end)
-            if periodic_hashes_period == math.maxinteger then
-                periodic_hashes_period = assert(util.parse_number(v), "invalid period " .. all)
-                periodic_hashes_start = 0
-            end
-            initial_hash = true
+        "--final-hash",
+        function()
             final_hash = true
             return true
         end,
     },
     {
-        "^(%-%-dense%-uarch%-hashes%=(.*))$",
-        function(all, v)
-            if not v then return false end
-            string.gsub(v, "^([^%,]+),(.+)$", function(l, s)
-                dense_uarch_hashes_start = assert(util.parse_number(s), "invalid start " .. all)
-                dense_uarch_hashes_end = dense_uarch_hashes_start
-                    + assert(util.parse_number(l), "invalid length " .. all)
-            end)
-            if not dense_uarch_hashes_start then
-                dense_uarch_hashes_start = 0
-                dense_uarch_hashes_end = dense_uarch_hashes_start
-                    + assert(util.parse_number(v), "invalid length " .. all)
-            end
+        "--final-hash=",
+        function(_, _, v)
+            final_hash = v
             return true
         end,
+        "filename",
     },
     {
-        "^%-%-store%-config(%=?)(%g*)$",
-        function(opts, v)
-            if not opts then return false end
-            if opts == "=" then
-                if not v or #v < 1 then return false end
-                store_config = v
-            elseif #v ~= 0 then
-                return false
-            else
-                store_config = true
-            end
+        "--periodic-hashes=",
+        function(keys, all, opts)
+            local o = util.parse_options(keys, all, opts)
+            periodic_hashes_period = assertf(o.period, "need period in %s", all)
+            periodic_hashes_start = o.start or 0
+            initial_hash = true
+            final_hash = true
             return true
         end,
+        {
+            "period",
+            period = "number",
+            start = "number",
+        },
     },
     {
-        "^%-%-store%-json%-config(%=?)(%g*)$",
-        function(opts, v)
-            if not opts then return false end
-            if opts == "=" then
-                if not v or #v < 1 then return false end
-                store_json_config = v
-            elseif #v ~= 0 then
-                return false
-            else
-                store_json_config = true
-            end
+        "--dense-uarch-hashes=",
+        function(keys, all, opts)
+            local o = util.parse_options(keys, all, opts)
+            assertf(o.count, "need count in %s", all)
+            dense_uarch_hashes_start = o.start or 0
+            dense_uarch_hashes_end = dense_uarch_hashes_start + o.count
             return true
         end,
+        {
+            "count",
+            count = "number",
+            start = "number",
+        },
     },
     {
-        "^%-%-load%-config%=(%g*)$",
-        function(opts)
-            if not opts or #opts < 1 then return false end
-            load_config = opts
+        -- bare: dump config to stdout in Lua
+        "--store-config",
+        function()
+            store_config = true
+            store_config_format = resolve_format(nil, nil)
             return true
         end,
     },
     {
-        "^%-%-load%-json%-config%=(%g*)$",
-        function(opts)
-            if not opts or #opts < 1 then return false end
-            load_json_config = opts
+        -- value: a positional filename and/or a format sub-key
+        "--store-config=",
+        function(keys, all, opts)
+            local o = util.parse_options(keys, all, opts)
+            store_config = o.filename or true
+            store_config_format = resolve_format(o.format, o.filename)
             return true
         end,
+        {
+            "filename",
+            filename = "file",
+            format = { lua = "lua", json = "json" },
+        },
     },
     {
-        "^(%-%-cmio%-rx%-buffer%=(.+))$",
-        function(all, opts)
+        "--load-config=",
+        function(keys, all, opts)
+            local o = util.parse_options(keys, all, opts)
+            assertf(o.filename, "need filename in %s", all)
+            load_config = o.filename
+            load_config_format = resolve_format(o.format, o.filename)
+            return true
+        end,
+        {
+            "filename",
+            filename = "file",
+            format = { lua = "lua", json = "json" },
+        },
+    },
+    {
+        "--cmio-rx-buffer=",
+        function(keys, all, opts)
             if not opts then return false end
-            cmio.rx_buffer.backing_store = parse_backing_store(opts, all, cmio.rx_buffer.backing_store)
+            cmdline_config.cmio.rx_buffer.backing_store =
+                parse_backing_store(keys, all, opts, cmdline_config.cmio.rx_buffer.backing_store)
             return true
         end,
+        backing_store_keys,
     },
     {
-        "^(%-%-cmio%-tx%-buffer%=(.+))$",
-        function(all, opts)
+        "--cmio-tx-buffer=",
+        function(keys, all, opts)
             if not opts then return false end
-            cmio.tx_buffer.backing_store = parse_backing_store(opts, all, cmio.tx_buffer.backing_store)
+            cmdline_config.cmio.tx_buffer.backing_store =
+                parse_backing_store(keys, all, opts, cmdline_config.cmio.tx_buffer.backing_store)
             return true
         end,
+        backing_store_keys,
     },
     {
-        "^%-%-no%-init%-splash$",
-        function(all)
-            if not all then return false end
+        "--no-init-splash",
+        function()
             init_splash = false
             return true
         end,
     },
     {
-        "^%-u%=(.+)$",
+        "-u=",
         handle_user,
     },
     {
-        "^%-%-user%=(.+)$",
+        "--user=",
         handle_user,
     },
     {
-        "^%-e%=([%w_]+)%=(.+)$",
+        "-e=",
         handle_env,
     },
     {
-        "^%-%-env%=([%w_]+)%=(.+)$",
+        "--env=",
         handle_env,
     },
     {
-        "^%-w%=(.+)$",
+        "-w=",
         handle_workdir,
     },
     {
-        "^%-%-workdir%=(.+)$",
+        "--workdir=",
         handle_workdir,
     },
     {
-        "^%-h%=(.+)$",
+        "-h=",
         handle_hostname,
     },
     {
-        "^%-%-hostname%=(.+)$",
+        "--hostname=",
         handle_hostname,
     },
     {
-        "^%-%-append%-init%=(.+)$",
-        function(opts)
+        "--append-init=",
+        function(_, _, opts)
             append_init = append_init .. opts .. "\n"
             return true
         end,
     },
     {
-        "^%-%-append%-init%-file%=(.+)$",
-        function(opts)
-            local f <close> = assert(io.open(opts, "rb"))
-            local contents = assert(f:read("*a"))
+        "--append-init-file=",
+        function(_, _, opts)
+            local contents = util.read_file(opts)
             if not contents:find("\n$") then contents = contents .. "\n" end
             append_init = append_init .. contents
             return true
         end,
+        "file",
     },
     {
-        "^%-%-append%-entrypoint%=(.+)$",
-        function(opts)
+        "--append-entrypoint=",
+        function(_, _, opts)
             append_entrypoint = append_entrypoint .. opts .. "\n"
             return true
         end,
     },
     {
-        "^%-%-append%-entrypoint%-file%=(.+)$",
-        function(opts)
-            local f <close> = assert(io.open(opts, "rb"))
-            local contents = assert(f:read("*a"))
+        "--append-entrypoint-file=",
+        function(_, _, opts)
+            local contents = util.read_file(opts)
             if not contents:find("\n$") then contents = contents .. "\n" end
             append_entrypoint = append_entrypoint .. contents
             return true
         end,
+        "file",
     },
     {
-        "^%-%-gdb(%=?)(.*)$",
-        function(eq, address)
-            if eq == "=" and address ~= "" then
-                gdb_address = address
-                return true
-            elseif eq == "" and address == "" then
-                gdb_address = "127.0.0.1:1234"
-                return true
-            end
-            return false
+        "--gdb",
+        function()
+            gdb_address = "127.0.0.1:1234"
+            return true
         end,
     },
     {
-        ".*",
-        function(all)
-            local not_option = all:sub(1, 1) ~= "-"
-            if not_option or all == "--" then
-                cmdline_opts_finished = true
-                if not_option then exec_arguments = { all } end
-                return true
-            end
-            error("unrecognized option " .. all)
+        "--gdb=",
+        function(_, _, address)
+            gdb_address = address
+            return true
         end,
+        "hostport",
     },
 }
 
-local function tryoption(handler, ...)
-    if select(1, ...) ~= nil then return handler(...) end
+-- Dispatch for a plain-string option name. A trailing "=" marks a
+-- value-taking option; otherwise the entry is a flag. The handler is always
+-- called as handler(hint, all, value), with value == nil for flags and "all"
+-- the option as typed (reconstructed as name=value for the short space form).
+-- A hint table may name a positional sub-key in its array part (hint[1]); that
+-- is read by parse_options, so it needs no separate threading here.
+-- Returns whether the entry matched and whether it consumed the next argument.
+local function try_named_option(option, a, nextarg)
+    local name, handler, hint = option[1], option[2], option[3]
+    if name:sub(-1) == "=" then
+        local bare = name:sub(1, #name - 1)
+        if a:sub(1, #name) == name then -- attached: --foo=value or -x=value
+            local value = a:sub(#name + 1)
+            assertf(#value > 0, "missing value for option %s", bare)
+            handler(hint, a, value)
+            return true, false
+        elseif a == bare and bare:sub(1, 2) ~= "--" then -- bare short name
+            -- short value options additionally take the value from the next argument
+            if nextarg ~= nil and nextarg:sub(1, 1) ~= "-" then
+                handler(hint, bare .. "=" .. nextarg, nextarg)
+                return true, true
+            end
+            if bare == "-h" then error("did you mean --help?") end
+            errorf("missing value for option %s", bare)
+        end
+        -- A bare long value option ("--foo" with no "=value") is left unmatched:
+        -- an optional-value sibling flag entry ("--foo") matches it, otherwise the
+        -- catch-all reports an unrecognized option (as it does today).
+        return false, false
+    end
+    if a == name then -- flag
+        handler(hint, a, nil)
+        return true, false
+    end
+    return false, false
 end
 
+if #arg == 1 and arg[1] == "--bash-completion" then handle_bash_completion() end
+
+-- Finally load the dependencies
+cartesi = require("cartesi")
+util = require("cartesi.util")
+hash_tree = require("cartesi.hash-tree")
+
+-- And perform the dependent initializations
+local default_config = cartesi.machine:get_default_config()
+cmdline_config.dtb.bootargs = default_config.dtb.bootargs
+cmdline_config.hash_tree.hash_function = default_config.hash_tree.hash_function
+cmdline_config.processor.registers.htif = {
+    iconsole = cartesi.HTIF_CONSOLE_CMD_PUTCHAR_MASK,
+    iyield = cartesi.HTIF_YIELD_CMD_AUTOMATIC_MASK | cartesi.HTIF_YIELD_CMD_MANUAL_MASK,
+}
+to_sharing_map = {
+    none = cartesi.SHARING_NONE,
+    config = cartesi.SHARING_CONFIG,
+    all = cartesi.SHARING_ALL,
+}
+
 -- Process command line options
-for _, a in ipairs(arg) do
-    if not cmdline_opts_finished then
+local argi = 1
+while argi <= #arg do
+    local a = arg[argi]
+    if cmdline_opts_finished then
+        exec_arguments[#exec_arguments + 1] = a
+        argi = argi + 1
+    else
+        local nextarg = arg[argi + 1]
+        local matched, consumed = false, false
         for _, option in ipairs(options) do
-            if tryoption(option[2], a:match(option[1])) then break end
+            matched, consumed = try_named_option(option, a, nextarg)
+            if matched then break end
         end
-    else
-        exec_arguments[#exec_arguments + 1] = a
+        if not matched then
+            -- not a recognized option: "--" or a non-option argument ends
+            -- option processing; a leftover "-..." is an error.
+            local not_option = a:sub(1, 1) ~= "-"
+            assertf(not_option or a == "--", "unrecognized option %s", a)
+            cmdline_opts_finished = true
+            if not_option then exec_arguments = { a } end
+        end
+        argi = argi + (consumed and 2 or 1)
     end
 end
 
@@ -2070,11 +2361,27 @@ local function dump_value_proofs(machine, desired_proofs, config)
         assert(config.processor.registers.iunrep == 0, "proofs are meaningless in unreproducible mode")
     end
     for _, desired in ipairs(desired_proofs) do
+        if not desired.address or not desired.log2_size then
+            local drive = util.find_drive(config, "flash_drive", desired.label)
+                or util.find_drive(config, "nvram", desired.label)
+            assertf(drive, "flash-drive or nvram not found with label %s in %s", desired.label, desired.cmdline)
+            desired.log2_size = drive.log2_size
+            desired.address = drive.start
+        end
+        assertf(
+            desired.log2_size >= cartesi.HASH_TREE_LOG2_WORD_SIZE,
+            "log2_size must be at least %u in %s",
+            cartesi.HASH_TREE_LOG2_WORD_SIZE,
+            desired.cmdline
+        )
         local proof = machine:get_proof(desired.address, desired.log2_size)
         local out = desired.filename and assert(io.open(desired.filename, "wb")) or io.stdout
-        out:write("{\n")
-        util.dump_json_proof(proof, out, 1)
-        out:write("}\n")
+        if desired.format == "lua" then
+            out:write("return ")
+            util.dump_table(proof, out)
+        end
+        if desired.format == "json" then out:write(cartesi.tojson(proof, 2, "Proof"), "\n") end
+        if desired.filename then out:close() end
     end
 end
 
@@ -2147,20 +2454,8 @@ if load_dir then
     if clone_dir then main_machine:clone_stored(clone_dir, load_dir) end
     main_machine = main_machine:load(load_dir, runtime_config, load_sharing)
 elseif not (remote_address and not remote_create) then
-    -- Build machine config
-    local config = {
-        processor = processor,
-        ram = ram,
-        dtb = dtb,
-        flash_drive = {},
-        nvram = {},
-        tlb = tlb,
-        virtio = virtio,
-        cmio = cmio,
-        pmas = pmas,
-        uarch = uarch,
-        hash_tree = hash_tree,
-    }
+    -- Use the command-line config (a --load-config file may still override it below).
+    local config = cmdline_config
 
     -- show splash on init
     if init_splash then
@@ -2184,7 +2479,7 @@ echo "
         local entry = flash_drives[idx]
         if entry then -- skip removed drives (e.g. --no-root-flash-drive)
             set_empty_omitted_filenames(entry)
-            local dt_label = "flashdrive" .. #config.flash_drive
+            local dt_label = entry.label or "flashdrive" .. #config.flash_drive
             if not entry.length then entry.length = -1 end
             if entry.mke2fs == nil then entry.mke2fs = entry.backing_store.data_filename == "" end
             if entry.mount == nil then
@@ -2208,23 +2503,21 @@ echo "
                 entry.mount = false
             end
             if entry.label == "root" and entry.read_only then -- Mount root filesystem as read-only
-                dtb.bootargs = dtb.bootargs:gsub("%f[^%s%z]rw%f[%s%z]", "ro")
+                config.dtb.bootargs = config.dtb.bootargs:gsub("%f[^%s%z]rw%f[%s%z]", "ro")
             end
             config.flash_drive[#config.flash_drive + 1] = entry
             if entry.label ~= "root" and (entry.mke2fs or entry.mount or entry.user) then
                 config.dtb.init = config.dtb.init .. string.format("dev=$(flashdrive %s)\n", dt_label)
                 if entry.mke2fs then
                     config.dtb.init = config.dtb.init
-                        .. string.format(
-                            'busybox mke2fs -F -b 4096 -I 256 -L "%s" "$dev" > /dev/null\n',
-                            entry.label or dt_label
-                        )
+                        .. string.format('busybox mke2fs -F -b 4096 -I 256 -L "%s" "$dev" > /dev/null\n', dt_label)
                 end
                 if entry.mount then
                     config.dtb.init = config.dtb.init
                         .. string.format(
-                            'busybox mkdir -p "%s" && busybox mount "$dev" "%s"\n',
+                            'busybox mkdir -p "%s" && busybox mount%s "$dev" "%s"\n',
                             entry.mount,
+                            entry.read_only and " -o ro" or "",
                             entry.mount
                         )
                 end
@@ -2241,14 +2534,14 @@ echo "
         local entry = nvrams[idx]
         if entry then
             set_empty_omitted_filenames(entry)
-            local dt_label = "nvram" .. #config.nvram
+            local dt_label = entry.label or "nvram" .. #config.nvram
             if not entry.length then entry.length = -1 end
             config.nvram[#config.nvram + 1] = entry
             config.dtb.init = config.dtb.init .. string.format("dev=$(nvram %s)\n", dt_label)
             if entry.read_only then
                 config.dtb.init = config.dtb.init .. 'busybox chmod 0444 "$dev"\n'
             else
-                config.dtb.init = config.dtb.init .. 'busybox chmod 0666 "$dev"\n'
+                config.dtb.init = config.dtb.init .. 'busybox chmod 0664 "$dev"\n'
             end
             if entry.user then
                 config.dtb.init = config.dtb.init .. string.format('busybox chown %s: "$dev"\n', entry.user)
@@ -2261,7 +2554,9 @@ echo "
     if #append_entrypoint > 0 then config.dtb.entrypoint = config.dtb.entrypoint .. append_entrypoint end
     if #exec_arguments > 0 then config.dtb.entrypoint = config.dtb.entrypoint .. table.concat(exec_arguments, " ") end
 
-    if load_config then
+    if load_config and load_config_format == "json" then
+        config = setmetatable(cartesi.fromjson(util.read_file(load_config)), { __index = config })
+    elseif load_config then
         local env = {}
         local chunk, err = loadfile(load_config, "t", env)
         if not chunk then
@@ -2274,56 +2569,23 @@ echo "
             error(ret)
         end
         config = setmetatable(ret, { __index = config })
-    elseif load_json_config then
-        local f <close> = assert(io.open(load_json_config, "rb"))
-        config = setmetatable(cartesi.fromjson(f:read("a")), { __index = config })
     end
 
     main_machine = main_machine:create(config, runtime_config, create_dir)
 end
 
-local function dump_config(what, whatdef, out, indent)
-    if type(what) == "table" then
-        local next_indent = indent .. "  "
-        local keys = {}
-        for k in pairs(what) do
-            table.insert(keys, k)
-        end
-        table.sort(keys)
-        if #keys > 0 then
-            out:write("{\n")
-            for _, k in ipairs(keys) do
-                local v, vdef = what[k], whatdef and whatdef[k]
-                out:write(next_indent)
-                if type(k) == "string" then out:write(k, " = ") end
-                dump_config(v, vdef, out, next_indent)
-                out:write(",")
-                if v == vdef then out:write(" -- default") end
-                out:write("\n")
-            end
-            out:write(indent, "}")
-        else
-            out:write("{}")
-        end
-    elseif math.type(what) == "integer" then
-        out:write(string.format("0x%x", what))
-    else
-        out:write(string.format("%q", what))
-    end
-end
-
 local function serialize_config(out, config, format)
     if format == "json" then
         out:write(cartesi.tojson(config, 2), "\n")
     elseif format == "lua" then
         out:write("return ")
-        dump_config(config, default_config, out, "")
+        util.dump_table(config, out, default_config)
         out:write("\n")
     end
 end
 
 -- obtain config from instantiated machine
-local main_config = main_machine:get_initial_config()
+local initial_config = main_machine:get_initial_config()
 
 for _, r in ipairs(memory_range_replace) do
     set_empty_omitted_filenames(r)
@@ -2332,33 +2594,26 @@ end
 
 if type(store_config) == "string" then
     local f <close> = assert(io.open(store_config, "w"))
-    serialize_config(f, main_config, "lua")
+    serialize_config(f, initial_config, store_config_format)
 elseif store_config then
-    serialize_config(io.stdout, main_config, "lua")
-end
-
-if type(store_json_config) == "string" then
-    local f <close> = assert(io.open(store_json_config, "w"))
-    serialize_config(f, main_config, "json")
-elseif store_json_config then
-    serialize_config(io.stdout, main_config, "json")
+    serialize_config(io.stdout, initial_config, store_config_format)
 end
 
 local cmio_yield_automatic_reason = {
-    [cartesi.CMIO_YIELD_AUTOMATIC_REASON_PROGRESS] = "progress",
-    [cartesi.CMIO_YIELD_AUTOMATIC_REASON_TX_OUTPUT] = "tx-output",
-    [cartesi.CMIO_YIELD_AUTOMATIC_REASON_TX_REPORT] = "tx-report",
+    [cartesi.HTIF_YIELD_AUTOMATIC_REASON_PROGRESS] = "progress",
+    [cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT] = "tx-output",
+    [cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT] = "tx-report",
 }
 
 local cmio_yield_manual_reason = {
-    [cartesi.CMIO_YIELD_MANUAL_REASON_RX_ACCEPTED] = "rx-accepted",
-    [cartesi.CMIO_YIELD_MANUAL_REASON_RX_REJECTED] = "rx-rejected",
-    [cartesi.CMIO_YIELD_MANUAL_REASON_TX_EXCEPTION] = "tx-exception",
+    [cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED] = "rx-accepted",
+    [cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED] = "rx-rejected",
+    [cartesi.HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION] = "tx-exception",
 }
 
 local cmio_yield_command = {
-    [cartesi.CMIO_YIELD_COMMAND_MANUAL] = "Manual",
-    [cartesi.CMIO_YIELD_COMMAND_AUTOMATIC] = "Automatic",
+    [cartesi.HTIF_YIELD_CMD_MANUAL] = "Manual",
+    [cartesi.HTIF_YIELD_CMD_AUTOMATIC] = "Automatic",
 }
 
 local function check_cmio_htif_config(htif)
@@ -2371,7 +2626,7 @@ end
 
 local function get_and_print_yield(machine, htif)
     local cmd, reason, data = machine:receive_cmio_request()
-    if cmd == cartesi.CMIO_YIELD_COMMAND_AUTOMATIC and reason == cartesi.CMIO_YIELD_AUTOMATIC_REASON_PROGRESS then
+    if cmd == cartesi.HTIF_YIELD_CMD_AUTOMATIC and reason == cartesi.HTIF_YIELD_AUTOMATIC_REASON_PROGRESS then
         stderr(
             "Progress: %6.2f" .. ((htif.iconsole & cartesi.HTIF_CONSOLE_CMD_GETCHAR_MASK) ~= 0 and "\n" or "\r"),
             string.unpack("I4", data) / 10
@@ -2380,9 +2635,9 @@ local function get_and_print_yield(machine, htif)
     end
     local cmd_str = cmio_yield_command[cmd] or "Unknown"
     local reason_str = "unknown"
-    if cmd == cartesi.CMIO_YIELD_COMMAND_AUTOMATIC then
+    if cmd == cartesi.HTIF_YIELD_CMD_AUTOMATIC then
         reason_str = cmio_yield_automatic_reason[reason] or reason_str
-    elseif cmd == cartesi.CMIO_YIELD_COMMAND_MANUAL then
+    elseif cmd == cartesi.HTIF_YIELD_CMD_MANUAL then
         reason_str = cmio_yield_manual_reason[reason] or reason_str
     end
     stderr("\n%s yield %s (%d) (0x%06x data)\n", cmd_str, reason_str, reason, #data)
@@ -2393,78 +2648,165 @@ end
 local function instantiate_filename(pattern, values)
     -- replace escaped % with something safe
     pattern = string.gsub(pattern, "%\\%%", "\0")
+    pattern = string.gsub(pattern, "%%(%d+)(%a)", function(p, s) return string.sub(values[s] or s, 1, p) end)
     pattern = string.gsub(pattern, "%%(%a)", function(s) return values[s] or s end)
     -- restore escaped %
     return (string.gsub(pattern, "\0", "%"))
 end
 
+-- An empty pattern ("") disables writing the file. "%i" is the producing input (the just-run
+-- input), "%o" the index argument (a global output index, or a per-input report index).
 local function save_cmio_state_with_format(advance, data, format, index)
+    if format == "" then return end
     local values = { i = advance.next_input_index - 1, o = index }
     local name = instantiate_filename(format, values)
     stderr("Storing %s\n", name)
-    local f = assert(io.open(name, "wb"))
-    assert(f:write(data))
-    f:close()
+    util.write_file(data, name)
 end
 
 local function save_cmio_report(advance, data)
     return save_cmio_state_with_format(advance, data, advance.report, advance.report_index)
 end
 
-local function save_cmio_output(advance, data)
-    return save_cmio_state_with_format(advance, data, advance.output, advance.output_index)
+local function save_cmio_output(advance, data, index)
+    return save_cmio_state_with_format(advance, data, advance.output, index)
+end
+
+local function save_cmio_rejected_output(advance, data, index)
+    return save_cmio_state_with_format(advance, data, advance.rejected_output, index)
 end
 
 local function save_cmio_output_hashes_root_hash(advance, data)
     return save_cmio_state_with_format(advance, data, advance.output_hashes_root_hash)
 end
 
+-- Serializes a Proof to a string in the resolved format. Lua keeps hashes raw (like
+-- machine:get_proof), JSON base64-encodes them via the "Proof" schema.
+local function serialize_proof(proof, format)
+    if format == "json" then return cartesi.tojson(proof, 2, "Proof") .. "\n" end
+    -- Lua format: util.dump_table writes into an in-memory sink whose pieces are
+    -- then joined into a loadable "return <table>" chunk.
+    local chunks, sink = {}, {}
+    function sink.write(_, ...)
+        local pieces = table.pack(...)
+        for k = 1, pieces.n do chunks[#chunks + 1] = pieces[k] end
+    end
+    util.dump_table(proof, sink)
+    return "return " .. table.concat(chunks) .. "\n"
+end
+
+-- Reads back a Proof written by serialize_proof, in the resolved format (explicit format wins,
+-- else the filename extension).
+local function read_proof(filename, format)
+    local text = util.read_file(filename)
+    if resolve_format(format, filename) ~= "json" then return assert(load(text, filename, "t", {}))() end
+    return cartesi.fromjson(text, "Proof")
+end
+
+-- Writes the epoch's output proofs, one per accepted output, keyed by global output index
+-- "%o" (= target_address) and producing input "%i".
+local function save_cmio_output_proofs(advance)
+    local pattern = advance.output_proof
+    if pattern == "" then return end
+    local proofs = hash_tree.frontier_next_proofs(advance.frontier, advance.output_hashes)
+    local format = resolve_format(advance.format, pattern)
+    for position, proof in ipairs(proofs) do
+        local name = instantiate_filename(pattern, { i = advance.output_inputs[position], o = proof.target_address })
+        stderr("Storing %s\n", name)
+        util.write_file(serialize_proof(proof, format), name)
+    end
+end
+
+-- Writes the proof, in the machine state in which the just-accepted input was accepted, that the
+-- output hashes root hash occupied the first word of the tx buffer (its 32 bytes are exactly one
+-- tree word). This ties the output hashes root hash, against which "output_proof" proves each output,
+-- back into the machine state hash. Must be called while the machine still sits at the accept yield.
+local function save_cmio_output_hashes_root_hash_proof(advance, proof)
+    local pattern = advance.output_hashes_root_hash_proof
+    if pattern == "" then return end
+    local name = instantiate_filename(pattern, { i = advance.next_input_index - 1 }) -- "%i": input just run
+    local format = resolve_format(advance.format, pattern)
+    stderr("Storing %s\n", name)
+    util.write_file(serialize_proof(proof, format), name)
+end
+
+-- On the verdict of the just-run input, commit or discard its buffered outputs. Accepted outputs
+-- are saved, folded into the running frontier (for the root check), and accumulated for the
+-- end-of-epoch proofs. Rejected outputs go to their own files and never enter the tree.
+local function flush_pending_outputs(machine, advance, reason, data)
+    if reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED then
+        for _, output in ipairs(advance.pending_outputs) do
+            save_cmio_output(advance, output, advance.global_output_index)
+            local leaf = cartesi.keccak256(output) -- leaf pushed into the running frontier below
+            advance.output_hashes[#advance.output_hashes + 1] = leaf
+            advance.output_inputs[#advance.output_inputs + 1] = advance.next_input_index - 1 -- producing input
+            hash_tree.frontier_push_back(advance.running_frontier, leaf)
+            advance.global_output_index = advance.global_output_index + 1
+        end
+        assert(#data == cartesi.HASH_SIZE, "expected output hashes root hash in tx buffer")
+        save_cmio_output_hashes_root_hash(advance, data)
+        if advance.check_output_hashes_root_hash then -- optional check of data against the locally rebuilt root
+            assertf(
+                hash_tree.frontier_get_root_hash(advance.running_frontier) == data,
+                "output hashes root hash mismatch at input %d",
+                advance.next_input_index - 1
+            )
+        end
+        -- The accept-state proof that the tx buffer holds this root hash (target_hash = keccak256(data)).
+        local proof = machine:get_proof(cartesi.AR_CMIO_TX_BUFFER_START, cartesi.HASH_TREE_LOG2_WORD_SIZE)
+        assert(proof.target_hash == cartesi.keccak256(data), "tx buffer does not hold the output hashes root hash")
+        save_cmio_output_hashes_root_hash_proof(advance, proof)
+    elseif reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED then
+        for position, output in ipairs(advance.pending_outputs) do -- global_output_index is left untouched
+            save_cmio_rejected_output(advance, output, advance.global_output_index + position - 1)
+        end
+    end
+    advance.pending_outputs = {} -- cleared whatever the reason, even when neither branch ran
+end
+
 local function load_cmio_input(machine, advance)
     local values = { i = advance.next_input_index }
-    local filename = instantiate_filename(advance.input, values)
-    local f = assert(io.open(filename, "rb"))
-    local data = assert(f:read("*a"))
-    f:close()
-    machine:send_cmio_response(cartesi.CMIO_YIELD_REASON_ADVANCE_STATE, data)
+    local data = util.read_file(instantiate_filename(advance.input, values))
+    -- The pre-input root hash is recorded so the EVM verifier can prove a reject
+    -- restores this state, regardless of how the host implements rollback.
+    machine:send_cmio_response(machine:get_root_hash(), cartesi.HTIF_YIELD_REASON_ADVANCE_STATE, data)
 end
 
 local function load_cmio_query(machine, inspect)
-    local f = assert(io.open(inspect.query, "rb"))
-    local data = assert(f:read("*a"))
-    f:close()
-    machine:send_cmio_response(cartesi.CMIO_YIELD_REASON_INSPECT_STATE, data)
+    local data = util.read_file(inspect.query)
+    machine:send_cmio_response(machine:get_root_hash(), cartesi.HTIF_YIELD_REASON_INSPECT_STATE, data)
 end
 
 local function save_cmio_inspect_state_report(inspect, data)
+    if inspect.report == "" then return end
     local values = { o = inspect.report_index }
     local name = instantiate_filename(inspect.report, values)
     stderr("Storing %s\n", name)
-    local f = assert(io.open(name, "wb"))
-    assert(f:write(data))
-    f:close()
+    util.write_file(data, name)
 end
 
 local function store_machine(machine, config, dir, sharing)
     assert(config.processor.registers.iunrep == 0, "hashes are meaningless in unreproducible mode")
     stderr("Storing machine: please wait\n")
     local values = {}
-    if dir:find("%%h") then values.h = util.hexhash(machine:get_root_hash()) end
+    if dir:find("%%%d*h") then values.h = util.hexhash(machine:get_root_hash()) end
     local name = instantiate_filename(dir, values)
     machine:store(name, sharing)
 end
 
-local function dump_address_ranges(machine, dir)
+local function dump_memory_ranges(machine, dir)
     local prefix = type(dir) == "string" and dir .. "/" or ""
-    if prefix ~= "" then assert(os.execute("mkdir " .. dir), "could not create directory " .. dir) end
+    if prefix ~= "" then assertf(os.execute("mkdir " .. dir), "could not create directory %s", dir) end
     for _, v in ipairs(machine:get_address_ranges()) do
-        local filename = prefix .. string.format("%016x--%016x.bin", v.start, v.length)
-        local file <close> = assert(io.open(filename, "w"))
-        assert(file:write(machine:read_memory(v.start, v.length)))
+        -- Only memory ranges hold state. Device ranges are always pristine, so skip them.
+        if v.is_memory then
+            local filename = prefix .. string.format("%016x--%016x.bin", v.start, v.length)
+            util.write_file(machine:read_memory(v.start, v.length), filename)
+        end
     end
 end
 
 local machine = main_machine
-local config = main_config
 local gdb_stub
 if gdb_address then
     assert(
@@ -2476,16 +2818,44 @@ if gdb_address then
     assert(address and port, "invalid address for GDB")
     gdb_stub:listen_and_wait_gdb(address, tonumber(port))
 end
-if config.processor.registers.iunrep ~= 0 then stderr("Running in unreproducible mode!\n") end
+if initial_config.processor.registers.iunrep ~= 0 then stderr("Running in unreproducible mode!\n") end
 if cmio_advance or cmio_inspect then
-    check_cmio_htif_config(config.processor.registers.htif)
+    check_cmio_htif_config(initial_config.processor.registers.htif)
     assert(remote_address or not perform_rollbacks, "cmio requires --remote-address for snapshot/commit/rollback")
 end
+-- Seed the outputs-tree frontier once, at the epoch start. With last_output_proof, resume the
+-- genesis-rooted tree from the previous epoch's last output, so this epoch's outputs continue at
+-- their running global indices. Otherwise start empty at genesis. The seed frontier produces the
+-- end-of-epoch proofs, and a copy tracks the running per-input root check.
+if cmio_advance then
+    if not cmio_advance.last_output_proof then
+        -- nothing to resume: empty tree, outputs are numbered from 0
+        cmio_advance.frontier = hash_tree.frontier(cartesi.CMIO_LOG2_MAX_OUTPUT_COUNT)
+        cmio_advance.global_output_index = 0
+    else
+        local last_proof = read_proof(cmio_advance.last_output_proof, cmio_advance.format)
+        assertf(
+            last_proof.log2_root_size == cartesi.CMIO_LOG2_MAX_OUTPUT_COUNT and last_proof.log2_target_size == 0,
+            "%s is not an outputs proof",
+            cmio_advance.last_output_proof
+        )
+        cmio_advance.frontier = hash_tree.frontier(last_proof)
+        cmio_advance.global_output_index = last_proof.target_address + 1
+    end
+    cmio_advance.running_frontier = hash_tree.frontier_copy(cmio_advance.frontier)
+    cmio_advance.output_hashes = {}
+    cmio_advance.output_inputs = {}
+    cmio_advance.pending_outputs = {}
+end
 if initial_hash then
-    assert(config.processor.registers.iunrep == 0, "hashes are meaningless in unreproducible mode")
-    print_root_hash(machine, stderr_unsilenceable)
+    assert(initial_config.processor.registers.iunrep == 0, "hashes are meaningless in unreproducible mode")
+    if type(initial_hash) == "string" then
+        util.write_file(machine:get_root_hash(), initial_hash)
+    else
+        print_root_hash(machine, stderr_unsilenceable)
+    end
 end
-dump_value_proofs(machine, initial_proof, config)
+dump_value_proofs(machine, initial_proof, initial_config)
 local exit_code = 0
 local next_hash_mcycle
 if periodic_hashes_start ~= 0 then
@@ -2601,9 +2971,9 @@ while math.ult(machine:read_reg("mcycle"), max_mcycle) do
         break
     -- deal with yield manual
     elseif machine:read_reg("iflags_Y") ~= 0 then
-        local _, reason, data = get_and_print_yield(machine, config.processor.registers.htif)
+        local _, reason, data = get_and_print_yield(machine, initial_config.processor.registers.htif)
         -- there was an exception
-        if reason == cartesi.CMIO_YIELD_MANUAL_REASON_TX_EXCEPTION then
+        if reason == cartesi.HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION then
             stderr("cmio exception with payload: %q\n", data)
             exit_code = 1
             do_rollback(machine)
@@ -2611,15 +2981,15 @@ while math.ult(machine:read_reg("mcycle"), max_mcycle) do
         -- there are advance state inputs to feed
         elseif cmio_advance and cmio_advance.next_input_index < cmio_advance.input_index_end then
             -- previous reason was an accept
-            if reason == cartesi.CMIO_YIELD_MANUAL_REASON_RX_ACCEPTED then
+            if reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED then
                 do_commit()
-                -- save only if we have already run an input and have just accepted it
+                -- flush only if we have already run an input and have just accepted it
                 if cmio_advance.next_input_index > cmio_advance.input_index_begin then
-                    assert(#data == 32, "expected root hash in tx buffer")
-                    save_cmio_output_hashes_root_hash(cmio_advance, data)
+                    flush_pending_outputs(machine, cmio_advance, reason, data)
                 end
             -- previous reason was a reject
-            elseif reason == cartesi.CMIO_YIELD_MANUAL_REASON_RX_REJECTED then
+            elseif reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED then
+                flush_pending_outputs(machine, cmio_advance, reason, data)
                 do_rollback(machine)
             else
                 error("unexpected manual yield reason")
@@ -2629,19 +2999,21 @@ while math.ult(machine:read_reg("mcycle"), max_mcycle) do
             do_snapshot(machine)
             load_cmio_input(machine, cmio_advance)
             if cmio_advance.hashes then print_root_hash(machine) end
-            cmio_advance.output_index = 0
             cmio_advance.report_index = 0
             cmio_advance.next_input_index = cmio_advance.next_input_index + 1
         else
             if cmio_advance and cmio_advance.next_input_index > cmio_advance.input_index_begin then
-                -- there are outputs of a previous advance state to save
-                if reason == cartesi.CMIO_YIELD_MANUAL_REASON_RX_ACCEPTED then
-                    assert(#data == 32, "expected root hash in tx buffer")
-                    save_cmio_output_hashes_root_hash(cmio_advance, data)
+                -- the last input's verdict closes the epoch
+                if reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED then
+                    flush_pending_outputs(machine, cmio_advance, reason, data)
                     do_commit()
-                elseif reason == cartesi.CMIO_YIELD_MANUAL_REASON_RX_REJECTED then
+                elseif reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED then
+                    flush_pending_outputs(machine, cmio_advance, reason, data)
                     do_rollback(machine)
                 end
+                -- all accepted outputs are known, so the per-output proofs against the final root
+                -- can be written (the proofs share the last input's checked root)
+                save_cmio_output_proofs(cmio_advance)
                 cmio_advance = nil
             end
             -- not done with inspect state query
@@ -2665,20 +3037,20 @@ while math.ult(machine:read_reg("mcycle"), max_mcycle) do
         end
     -- deal with yield automatic
     elseif machine:read_reg("iflags_X") ~= 0 then
-        local _, reason, data = get_and_print_yield(machine, config.processor.registers.htif)
+        local _, reason, data = get_and_print_yield(machine, initial_config.processor.registers.htif)
         -- we have fed an advance state input
         if cmio_advance and cmio_advance.next_input_index > cmio_advance.input_index_begin then
-            if reason == cartesi.CMIO_YIELD_AUTOMATIC_REASON_TX_OUTPUT then
-                save_cmio_output(cmio_advance, data)
-                cmio_advance.output_index = cmio_advance.output_index + 1
-            elseif reason == cartesi.CMIO_YIELD_AUTOMATIC_REASON_TX_REPORT then
+            if reason == cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT then
+                -- buffer until the input's accept/reject verdict is known
+                cmio_advance.pending_outputs[#cmio_advance.pending_outputs + 1] = data
+            elseif reason == cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT then
                 save_cmio_report(cmio_advance, data)
                 cmio_advance.report_index = cmio_advance.report_index + 1
             end
         -- ignore other reasons
         -- we have feed the inspect state query
         elseif cmio_inspect and not cmio_inspect.query then
-            if reason == cartesi.CMIO_YIELD_AUTOMATIC_REASON_TX_REPORT then
+            if reason == cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT then
                 save_cmio_inspect_state_report(cmio_inspect, data)
                 cmio_inspect.report_index = cmio_inspect.report_index + 1
             end
@@ -2721,24 +3093,28 @@ if max_uarch_cycle > 0 then
 end
 if gdb_stub then gdb_stub:close() end
 if log_step_uarch then
-    assert(config.processor.registers.iunrep == 0, "micro step proof is meaningless in unreproducible mode")
-    stderr("Gathering micro step log: please wait\n")
-    util.dump_log(machine:log_step_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS), io.stderr)
+    assert(initial_config.processor.registers.iunrep == 0, "uarch step proof is meaningless in unreproducible mode")
+    stderr("Gathering uarch step log: please wait\n")
+    util.print_log(machine:log_step_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS), io.stderr)
 end
 if log_reset_uarch then
     stderr("Resetting microarchitecture state: please wait\n")
-    util.dump_log(machine:log_reset_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS), io.stderr)
+    util.print_log(machine:log_reset_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS), io.stderr)
 end
-if dump_address_ranges_dir then dump_address_ranges(machine, dump_address_ranges_dir) end
+if dump_memory_ranges_dir then dump_memory_ranges(machine, dump_memory_ranges_dir) end
 if final_hash then
-    assert(config.processor.registers.iunrep == 0, "hashes are meaningless in unreproducible mode")
-    print_root_hash(machine, stderr_unsilenceable)
+    assert(initial_config.processor.registers.iunrep == 0, "hashes are meaningless in unreproducible mode")
+    if type(final_hash) == "string" then
+        util.write_file(machine:get_root_hash(), final_hash)
+    else
+        print_root_hash(machine, stderr_unsilenceable)
+    end
 end
-dump_value_proofs(machine, final_proof, config)
-if store_dir then store_machine(machine, config, store_dir, store_sharing) end
+dump_value_proofs(machine, final_proof, initial_config)
+if store_dir then store_machine(machine, initial_config, store_dir, store_sharing) end
 if assert_rolling_template then
     local cmd, reason = machine:receive_cmio_request()
-    if not (cmd == cartesi.CMIO_YIELD_COMMAND_MANUAL and reason == cartesi.CMIO_YIELD_MANUAL_REASON_RX_ACCEPTED) then
+    if not (cmd == cartesi.HTIF_YIELD_CMD_MANUAL and reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED) then
         exit_code = 2
     end
 end
diff --git a/src/cartesi/bash.lua b/src/cartesi/bash.lua
new file mode 100644
index 000000000..c5427c6e4
--- /dev/null
+++ b/src/cartesi/bash.lua
@@ -0,0 +1,221 @@
+-- Copyright Cartesi and individual authors (see AUTHORS)
+-- SPDX-License-Identifier: LGPL-3.0-or-later
+--
+-- This program is free software: you can redistribute it and/or modify it under
+-- the terms of the GNU Lesser General Public License as published by the Free
+-- Software Foundation, either version 3 of the License, or (at your option) any
+-- later version.
+--
+-- This program is distributed in the hope that it will be useful, but WITHOUT ANY
+-- WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A
+-- PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details.
+--
+-- You should have received a copy of the GNU Lesser General Public License along
+-- with this program (see COPYING). If not, see <https://www.gnu.org/licenses/>.
+--
+
+local _M = {}
+
+-- The option name is a plain string; a trailing "=" marks a value-taking
+-- option. Strip it to get the bare flag name.
+local function flag_name(name) return name:sub(-1) == "=" and name:sub(1, -2) or name end
+
+local function name_takes_value(name) return name:find("=$") ~= nil end
+
+-- Sentinels for subkey value kinds that bash completes specially.
+local SUBKEY_KIND_SENTINEL = {
+    file = "__file__", -- the bash side completes these with compgen -f
+    dir = "__dir__", -- the bash side completes these with compgen -d
+    number = "__number__", -- recognized, but no candidates are offered
+    string = "__string__", -- recognized, but no candidates are offered
+    hostport = "__string__", -- handled like a plain string
+    netif = "__string__", -- handled like a plain string
+}
+
+-- Reduce one options-table entry to a completion descriptor.
+-- entry[1] is the option name (a trailing "=" means it takes a value); entry[3] is an
+-- optional hint: a kind string (a trailing "?" marks the value optional) or a table
+-- describing the sub-keys of a compound value. Returns nil when the name is not a
+-- "-"-prefixed flag, else { flag, kind, optional [, subkeys, subkey_values, positional_kind] }.
+local function describe_option(entry)
+    local name, hint = entry[1], entry[3]
+    local flag = flag_name(name)
+    if flag == "" or not flag:match("^%-") then return nil end
+    -- A plain name cannot encode an optional value; optional-value options are
+    -- two entries (flag + value) merged below, which sets optional there.
+    local desc = { flag = flag, kind = name_takes_value(name) and "string" or "bare", optional = false }
+    if type(hint) == "string" then
+        if hint:sub(-1) == "?" then
+            desc.kind = hint:sub(1, -2)
+            desc.optional = true
+        else
+            desc.kind = hint
+        end
+    elseif type(hint) == "table" then
+        desc.kind = "compound"
+        desc.subkeys = {}
+        desc.subkey_values = {}
+        -- The array part (hint[1]) names the positional sub-key; record its kind so a
+        -- bare value can be completed as a file/dir. Only string kinds are recorded: the
+        -- kind is later quoted as a string, which an enum table would break.
+        local positional_kind = hint[1] and hint[hint[1]]
+        if type(positional_kind) == "string" then desc.positional_kind = positional_kind end
+        for k, v in pairs(hint) do
+            -- skip the array part (the positional sub-key name, handled above)
+            if type(k) == "string" then
+                desc.subkeys[#desc.subkeys + 1] = k
+                if type(v) == "table" then
+                    local vals = {}
+                    for ek in pairs(v) do vals[#vals + 1] = ek end
+                    table.sort(vals)
+                    desc.subkey_values[k] = vals
+                elseif v == "boolean" then
+                    desc.subkey_values[k] = { "true", "false" }
+                else
+                    desc.subkey_values[k] = SUBKEY_KIND_SENTINEL[v] or "__string__"
+                end
+            end
+        end
+        table.sort(desc.subkeys)
+    end
+    return desc
+end
+
+local function bash_quote(s) return string.format("'%s'", (s:gsub("'", "'\\''"))) end
+
+-- Bash side of the completion: one function driven by the _cm_* associative arrays.
+local bash_completion_function = [==[
+_cartesi_complete() {
+    local cur="${COMP_WORDS[$COMP_CWORD]}"
+    local line="${COMP_LINE:0:$COMP_POINT}"
+    local logical="${line##*[[:space:]]}"
+    COMPREPLY=()
+
+    if [[ "$logical" != -* ]]; then
+        COMPREPLY=( $(compgen -f -- "$cur") )
+        return
+    fi
+
+    if [[ "$logical" != *=* ]]; then
+        local f k
+        for f in "${!_cm_flag_kind[@]}"; do
+            if [[ "$f" == "$logical"* ]]; then
+                k="${_cm_flag_kind[$f]}"
+                if [[ "$k" == "bare" ]]; then
+                    # Trailing space so cursor moves on. compopt -o nospace
+                    # below suppresses bash's auto-space, so we add it ourselves.
+                    COMPREPLY+=("$f ")
+                else
+                    COMPREPLY+=("$f=")
+                    [[ -n "${_cm_flag_optional[$f]:-}" ]] && COMPREPLY+=("$f ")
+                fi
+            fi
+        done
+        compopt -o nospace 2>/dev/null
+        return
+    fi
+
+    local flag="${logical%%=*}"
+    local rest="${logical#*=}"
+    local kind="${_cm_flag_kind[$flag]:-}"
+    local cur_partial="$cur"
+    while [[ "$cur_partial" == [=:]* ]]; do
+        cur_partial="${cur_partial:1}"
+    done
+
+    case "$kind" in
+        file) COMPREPLY=( $(compgen -f -- "$cur_partial") ); compopt -o nospace 2>/dev/null ;;
+        dir)  COMPREPLY=( $(compgen -d -- "$cur_partial") ); compopt -o nospace 2>/dev/null ;;
+        number|hostport|netif|string) ;;
+        compound)
+            local last_segment="${rest##*,}"
+            if [[ "$last_segment" == *:* ]]; then
+                local subkey="${last_segment%%:*}"
+                local val_prefix="${last_segment#*:}"
+                local values="${_cm_subkey_values[${flag},${subkey}]:-}"
+                case "$values" in
+                    __file__) COMPREPLY=( $(compgen -f -- "$val_prefix") ); compopt -o nospace 2>/dev/null ;;
+                    __dir__)  COMPREPLY=( $(compgen -d -- "$val_prefix") ); compopt -o nospace 2>/dev/null ;;
+                    __number__|__string__|"") ;;
+                    *)        COMPREPLY=( $(compgen -W "$values" -- "$val_prefix") ) ;;
+                esac
+            else
+                local subkeys="${_cm_compound_keys[$flag]:-}"
+                local partial="$last_segment"
+                local prefix="${cur_partial%"$partial"}"  # quoted: strip it literally, not as a glob
+                local matched=( $(compgen -W "$subkeys" -- "$partial") )
+                local i
+                for i in "${!matched[@]}"; do
+                    matched[$i]="${prefix}${matched[$i]}:"
+                done
+                COMPREPLY=("${matched[@]}")
+                # a bare value (no subkey:) may be the positional; offer files/dirs
+                case "${_cm_positional_kind[$flag]:-}" in
+                    file) COMPREPLY+=( $(compgen -f -- "$partial") ) ;;
+                    dir)  COMPREPLY+=( $(compgen -d -- "$partial") ) ;;
+                esac
+                compopt -o nospace 2>/dev/null
+            fi
+            ;;
+    esac
+}
+]==]
+
+-- Walk an options table and emit a self-contained bash completion script
+-- registering the given program names. Writes to io.stdout.
+function _M.dump_bash_completion(options, program_names)
+    local flags = {} -- flag name -> merged descriptor
+    local ordered = {} -- flag names in first-seen order, sorted before emission
+    for _, entry in ipairs(options) do
+        local d = describe_option(entry)
+        if d then
+            local prev = flags[d.flag]
+            if prev then
+                if prev.kind == "bare" and d.kind ~= "bare" then -- bare entry seen first: adopt the value form
+                    prev.kind, prev.subkeys, prev.subkey_values = d.kind, d.subkeys, d.subkey_values
+                    prev.positional_kind = d.positional_kind
+                    prev.optional = true
+                elseif d.kind == "bare" and prev.kind ~= "bare" then -- value entry seen first: value is optional
+                    prev.optional = true
+                else
+                    prev.optional = prev.optional or d.optional
+                end
+            else
+                flags[d.flag] = d
+                ordered[#ordered + 1] = d.flag
+            end
+        end
+    end
+    table.sort(ordered)
+
+    local w = function(s) io.write(s, "\n") end -- emits one line on the default output
+
+    w("# bash completion for " .. table.concat(program_names, ", "))
+    w("# Generated by cartesi.bash.dump_bash_completion. Do not edit by hand.")
+    w("declare -gA _cm_flag_kind=()")
+    w("declare -gA _cm_flag_optional=()")
+    w("declare -gA _cm_compound_keys=()")
+    w("declare -gA _cm_subkey_values=()")
+    w("declare -gA _cm_positional_kind=()")
+    for _, flag in ipairs(ordered) do
+        local d = flags[flag]
+        w(string.format("_cm_flag_kind[%s]=%s", bash_quote(flag), bash_quote(d.kind)))
+        if d.optional then w(string.format("_cm_flag_optional[%s]=1", bash_quote(flag))) end
+        if d.positional_kind then
+            w(string.format("_cm_positional_kind[%s]=%s", bash_quote(flag), bash_quote(d.positional_kind)))
+        end
+        if d.subkeys then
+            w(string.format("_cm_compound_keys[%s]=%s", bash_quote(flag), bash_quote(table.concat(d.subkeys, " "))))
+            for _, k in ipairs(d.subkeys) do
+                local v = d.subkey_values[k] -- either a list of enum values or a sentinel string
+                local val_str = type(v) == "table" and table.concat(v, " ") or v
+                w(string.format("_cm_subkey_values[%s,%s]=%s", bash_quote(flag), bash_quote(k), bash_quote(val_str)))
+            end
+        end
+    end
+    w(bash_completion_function) -- the tables above must precede the function that reads them
+    w("complete -F _cartesi_complete " .. table.concat(program_names, " "))
+end
+
+return _M
diff --git a/src/cartesi/hash-tree.lua b/src/cartesi/hash-tree.lua
new file mode 100644
index 000000000..1ff507337
--- /dev/null
+++ b/src/cartesi/hash-tree.lua
@@ -0,0 +1,267 @@
+local cartesi = require("cartesi")
+
+-- Tree leaves are words, the smallest proof target.
+local WORD_LOG2_SIZE = cartesi.HASH_TREE_LOG2_WORD_SIZE
+local WORD_LENGTH = 1 << WORD_LOG2_SIZE
+
+-- docs:begin roll_hash_up_tree
+local function roll_hash_up_tree(proof, target_hash)
+    local base, address = proof.log2_target_size, proof.target_address
+    local node = target_hash
+    for log2_size = base, proof.log2_root_size - 1 do
+        -- Siblings are stored bottom-up: index 1 is the sibling at the target's own level.
+        local sibling = assert(proof.sibling_hashes[log2_size - base + 1], "too few siblings")
+        -- A set address bit at this level means the current node is the right child.
+        if address & (1 << log2_size) ~= 0 then
+            node = cartesi.keccak256(sibling, node)
+        else
+            node = cartesi.keccak256(node, sibling)
+        end
+    end
+    return node
+end
+-- docs:end roll_hash_up_tree
+
+-- docs:begin verify_slice
+local function verify_slice(proof) -- raises "target node not in tree" unless the target rolls up to the root
+    assert(roll_hash_up_tree(proof, proof.target_hash) == proof.root_hash, "target node not in tree")
+end
+-- docs:end verify_slice
+
+-- docs:begin verify_splice
+local function verify_splice(proof, new_target_hash, new_root_hash) -- raises when either check below fails
+    verify_slice(proof) -- the old target must roll up to the old root
+    assert(roll_hash_up_tree(proof, new_target_hash) == new_root_hash, "target node not in tree")
+end
+-- docs:end verify_splice
+
+-- Computes the Merkle tree root of a byte string laid at the base of a tree covering
+-- 2^log2_root_size bytes. The data need not fill the tree or be a power of two long. Leaves
+-- are word-size keccak256 hashes, a trailing partial word zero-padded, and inner nodes hash
+-- their two children. Every node the data does not reach takes its level's pristine hash, the
+-- root of an all-zero subtree, which doubles each level climbed. Overflow is rejected.
+-- docs:begin get_root_hash
+local function get_root_hash(data, log2_root_size)
+    assert(#data <= (1 << log2_root_size), "data does not fit in the tree")
+    -- Level zero is one hash per word, a trailing partial word zero-padded after the loop.
+    local level = {}
+    local full = #data - #data % WORD_LENGTH
+    for i = 1, full, WORD_LENGTH do
+        level[#level + 1] = cartesi.keccak256(data:sub(i, i + WORD_LENGTH - 1))
+    end
+    if full < #data then
+        local word = data:sub(full + 1)
+        level[#level + 1] = cartesi.keccak256(word .. string.rep("\0", WORD_LENGTH - #word))
+    end
+    -- Pair upward to the root, the pristine hash standing in for every node the data misses.
+    local pristine = cartesi.keccak256(string.rep("\0", WORD_LENGTH))
+    for _ = WORD_LOG2_SIZE, log2_root_size - 1 do
+        local parents = {}
+        for i = 1, #level, 2 do
+            parents[#parents + 1] = cartesi.keccak256(level[i], level[i + 1] or pristine)
+        end
+        level, pristine = parents, cartesi.keccak256(pristine, pristine)
+    end
+    return level[1] or pristine -- empty data: no node was reached, so the root itself is pristine
+end
+-- docs:end get_root_hash
+
+-- The functions below are a generic incremental keccak Merkle accumulator (a "back merkle
+-- tree") for the cmio outputs tree: a fixed-height tree whose leaves are keccak256(output),
+-- accumulating from genesis and padded on the right with pristine subtrees. Unlike the
+-- word-leaf memory tree above, its pristine leaf is literally HASH_SIZE zero bytes (not a
+-- hash of them), matching libcmt's cmt_merkle_t and tests/lua/cmio-test.lua. Nothing here is
+-- output-specific; the caller feeds keccak256(output) leaves.
+--
+-- A frontier captures the complete left subtrees standing over the leaves seen so far. It is a
+-- length-log2_max_leaves array indexed by a 1-based level, where level 1 corresponds to bit 0 (the
+-- 0-based leaves). The entry at a level holds that level's complete left subtree when the matching
+-- bit of the leaf count is set, else false (false, not nil, so the array stays dense and round-trips as
+-- JSON). The present subtrees' sizes sum to the leaf count, so the count is recovered from the
+-- array rather than stored.
+
+-- The pristine leaf, the all-zero subtree of height 0, is literally HASH_SIZE zero bytes. Larger
+-- pristine subtrees double on demand inside each loop (keccak256(pristine, pristine)).
+local pristine_leaf = string.rep("\0", cartesi.HASH_SIZE)
+
+-- The leaf count standing under a frontier: a level is filled exactly when its bit of the count is
+-- set, so summing those bit values over the filled levels recovers it.
+local function frontier_leaf_count(frontier)
+    local count = 0
+    for level = 1, #frontier do
+        -- Level N stands for bit N-1 of the count; an unfilled (false) level adds nothing.
+        if frontier[level] then count = count | (1 << (level - 1)) end
+    end
+    return count
+end
+
+-- The hash of node "index" at one level, given that level's frontier entry (the complete left
+-- subtree to the left, or false) and pristine entry (the all-pristine subtree to the right). The
+-- three regions read left-to-right as they sit in the tree: the frontier, the active region
+-- covering global indices base..base+#active-1, and pristine.
+-- docs:begin frontier_node
+local function frontier_node(frontier_entry, base, active, pristine_entry, index)
+    -- Left of the active region sits the complete left subtree held by the frontier.
+    if index < base then return frontier_entry end
+    -- Otherwise turn the global index into a 1-based position within the active region.
+    local position = index - base + 1
+    -- Past the last active node nothing has been written, so the subtree is all pristine.
+    if position > #active then return pristine_entry end
+    -- Inside the active region.
+    return active[position]
+end
+-- docs:end frontier_node
+
+-- Folds one new leaf into the frontier by the binary-carry update: combine with the present
+-- low levels up to the first empty one, O(1) amortized. Mutates the frontier in place.
+-- docs:begin frontier_push_back
+local function frontier_push_back(frontier, hash)
+    local carry, level = hash, 1
+    -- Each filled level is a left sibling: merge it into the carry and leave the level empty.
+    while frontier[level] do
+        carry = cartesi.keccak256(frontier[level], carry)
+        frontier[level] = false
+        level = level + 1
+    end
+    frontier[level] = carry -- the first empty level receives the merged subtree
+end
+-- docs:end frontier_push_back
+
+-- Pristine-pads the current frontier up to its root, O(log2_max_leaves). Does not mutate the
+-- frontier.
+-- docs:begin frontier_get_root_hash
+local function frontier_get_root_hash(frontier)
+    local filler = pristine_leaf -- the all-pristine subtree at the current level
+    local acc = pristine_leaf -- the node folded together from the levels below
+    for level = 1, #frontier do
+        local left, right = acc, filler
+        -- A filled level is a complete left subtree, so the accumulated node sits on its right.
+        local entry = frontier[level]
+        if entry then left, right = entry, acc end
+        acc = cartesi.keccak256(left, right)
+        filler = cartesi.keccak256(filler, filler)
+    end
+    return acc
+end
+-- docs:end frontier_get_root_hash
+
+-- Given the frontier at the start of an epoch and the ordered keccak256(output) leaves accepted
+-- during it, returns one Proof per new output, all against the single final root (the tree of all
+-- leaves padded to height log2_max_leaves). proofs[i] belongs to next_output_hashes[i] (no
+-- reordering). The proofs are computed in one batch because an early output's low-level siblings
+-- depend on later leaves of the same epoch. Does not mutate the frontier.
+-- O(next_output_count * log2_max_leaves).
+-- docs:begin frontier_next_proofs
+local function frontier_next_proofs(frontier, next_output_hashes)
+    local log2_max_leaves = #frontier
+    local next_output_count = #next_output_hashes
+    if next_output_count == 0 then return {} end
+    local leaf_count = frontier_leaf_count(frontier)
+    -- Reject overflow up front: the last new leaf must still have an index below 2^log2_max_leaves,
+    -- otherwise more than one node would survive the climb and the proofs would be silently invalid.
+    assert((leaf_count + next_output_count - 1) >> log2_max_leaves == 0, "too many outputs for the tree")
+    -- siblings[i] is the i-th new output's sibling array.
+    local siblings = {}
+    for i = 1, next_output_count do siblings[i] = {} end
+    -- active holds the node hashes covering global indices [base, base + #active - 1] at the
+    -- current level; start at the leaves over [leaf_count, leaf_count + next_output_count).
+    local active, base = next_output_hashes, leaf_count
+    local pristine = pristine_leaf -- the all-pristine subtree at the current level
+    for level = 1, log2_max_leaves do
+        local bit = level - 1
+        local frontier_entry = frontier[level]
+        -- Each output's proof sibling at this level is its node's neighbour (toggle the low bit).
+        for i = 1, next_output_count do
+            local node = (leaf_count + i - 1) >> bit
+            siblings[i][level] = frontier_node(frontier_entry, base, active, pristine, node ~ 1)
+        end
+        -- Climb one level: parent p has children 2p and 2p+1; the leftmost index halves.
+        local parents = {}
+        local parents_base = base >> 1
+        for p = parents_base, (base + #active - 1) >> 1 do
+            local left = frontier_node(frontier_entry, base, active, pristine, 2 * p)
+            local right = frontier_node(frontier_entry, base, active, pristine, 2 * p + 1)
+            parents[p - parents_base + 1] = cartesi.keccak256(left, right)
+        end
+        active, base = parents, parents_base
+        pristine = cartesi.keccak256(pristine, pristine)
+    end
+    local root_hash = active[1] -- after the last level the single active node is the root
+    local proofs = {}
+    for i = 1, next_output_count do
+        proofs[i] = {
+            target_address = leaf_count + i - 1,
+            log2_target_size = 0,
+            log2_root_size = log2_max_leaves,
+            target_hash = next_output_hashes[i],
+            root_hash = root_hash,
+            sibling_hashes = siblings[i],
+        }
+    end
+    return proofs
+end
+-- docs:end frontier_next_proofs
+
+-- Builds the frontier of a tree with no leaves: one entry per level, every entry false (unfilled).
+local function frontier_genesis(log2_max_leaves)
+    local empty = {}
+    for level = 1, log2_max_leaves do
+        empty[level] = false -- false rather than nil, so the array stays dense
+    end
+    return empty
+end
+
+-- Duplicates the level entries into a fresh table, so the copy can advance without touching the original.
+local function frontier_copy(frontier) return table.move(frontier, 1, #frontier, 1, {}) end
+
+-- Tells the two frontier constructor argument forms apart: a last-output proof is a table, a tree height is not.
+local function is_proof(log2_max_leaves_or_last_proof) return type(log2_max_leaves_or_last_proof) == "table" end
+
+-- The single frontier constructor. A number is the tree height log2_max_leaves and yields an empty
+-- frontier (leaf count 0) used for genesis. Otherwise the argument is the previous epoch's
+-- last-output Proof, and the result is the left frontier for the start of the next epoch, rebuilt
+-- from that proof (its height taken from log2_root_size). The last leaf has index target_address,
+-- so the leaf count is target_address + 1. The lowest complete level is the level whose complete
+-- left subtree ends exactly at the leaf count.
+-- docs:begin frontier
+local function frontier(log2_max_leaves_or_last_proof)
+    if is_proof(log2_max_leaves_or_last_proof) then
+        local proof = log2_max_leaves_or_last_proof -- NOTE(review): presumably a leaf proof (log2_target_size == 0)
+        local log2_max_leaves = proof.log2_root_size -- the rebuilt frontier has one entry per tree level
+        local f = frontier_genesis(log2_max_leaves)
+        local leaf_count = proof.target_address + 1 -- target_address is the 0-based index of the last leaf
+        local lowest_complete_level = 1 -- NOTE(review): the search below assumes leaf_count ~= 0 (it needs a set bit)
+        while leaf_count & (1 << (lowest_complete_level - 1)) == 0 do
+            lowest_complete_level = lowest_complete_level + 1
+        end
+        -- Higher levels: wherever the leaf count has a set bit, the last leaf lies in the right half there,
+        -- so the proof sibling at that level is exactly the complete left subtree the frontier keeps.
+        for level = lowest_complete_level + 1, log2_max_leaves do
+            local bit = level - 1
+            if leaf_count & (1 << bit) ~= 0 then f[level] = proof.sibling_hashes[level] end
+        end
+        -- Lowest complete level: every bit of the leaf count below it is clear, so the last leaf is a right
+        -- child at each lower level, and hashing it under those siblings (sibling on the left) rebuilds the
+        -- complete left subtree that ends exactly at the leaf count.
+        local hash = proof.target_hash
+        for level = 1, lowest_complete_level - 1 do
+            hash = cartesi.keccak256(proof.sibling_hashes[level], hash)
+        end
+        f[lowest_complete_level] = hash
+        return f
+    end
+    return frontier_genesis(log2_max_leaves_or_last_proof) -- not a proof: the argument is the tree height
+end
+-- docs:end frontier
+
+return { -- module exports; frontier_genesis, frontier_node, frontier_leaf_count and is_proof stay local
+    roll_hash_up_tree = roll_hash_up_tree,
+    verify_slice = verify_slice,
+    verify_splice = verify_splice,
+    get_root_hash = get_root_hash,
+    frontier = frontier,
+    frontier_copy = frontier_copy,
+    frontier_push_back = frontier_push_back,
+    frontier_get_root_hash = frontier_get_root_hash,
+    frontier_next_proofs = frontier_next_proofs,
+}
diff --git a/src/cartesi/util.lua b/src/cartesi/util.lua
index 4b5190c39..ed50726d4 100644
--- a/src/cartesi/util.lua
+++ b/src/cartesi/util.lua
@@ -30,113 +30,39 @@ local hexhash = hexstring
 _M.hexstring = hexstring
 _M.hexhash = hexstring
 
-local function dump_json_sibling_hashes(sibling_hashes, out, indent)
-    for i, h in ipairs(sibling_hashes) do
-        indentout(out, indent, '"%s"', hexhash(h))
-        if sibling_hashes[i + 1] then
-            out:write(",\n")
-        else
-            out:write("\n")
-        end
-    end
-end
-
-local function dump_json_proof(proof, out, indent)
-    indentout(out, indent, '"target_address": %u,\n', proof.target_address)
-    indentout(out, indent, '"log2_target_size": %u,\n', proof.log2_target_size)
-    indentout(out, indent, '"log2_root_size": %u,\n', proof.log2_root_size)
-    indentout(out, indent, '"target_hash": "%s",\n', hexhash(proof.target_hash))
-    indentout(out, indent, '"sibling_hashes": [\n')
-    dump_json_sibling_hashes(proof.sibling_hashes, out, indent + 1)
-    indentout(out, indent, "],\n")
-    indentout(out, indent, '"root_hash": "%s"\n', hexhash(proof.root_hash))
-end
-
-_M.dump_json_proof = dump_json_proof
-
-local function dump_json_log_notes(notes, out, indent)
-    local n = #notes
-    for i, note in ipairs(notes) do
-        indentout(out, indent, '"%s"', note)
-        if i < n then
-            out:write(",\n")
-        else
-            out:write("\n")
+local function dump_table(what, out, whatdef, indent)
+    whatdef = whatdef or {}
+    indent = indent or ""
+    if type(what) == "table" then
+        local next_indent = indent .. "  "
+        local keys = {}
+        for k in pairs(what) do
+            table.insert(keys, k)
         end
-    end
-end
-
-local function dump_json_log_brackets(brackets, out, indent)
-    local n = #brackets
-    for i, bracket in ipairs(brackets) do
-        indentout(out, indent, "{\n")
-        indentout(out, indent + 1, '"type": "%s",\n', bracket.type)
-        indentout(out, indent + 1, '"where": %u,\n', bracket.where)
-        indentout(out, indent + 1, '"text": "%s"\n', bracket.text)
-        indentout(out, indent, "}")
-        if i < n then
-            out:write(",\n")
+        table.sort(keys)
+        if #keys > 0 then
+            out:write("{\n")
+            for _, k in ipairs(keys) do
+                local v, vdef = what[k], whatdef and whatdef[k]
+                out:write(next_indent)
+                if type(k) == "string" then out:write(k, " = ") end
+                dump_table(v, out, vdef, next_indent)
+                out:write(",")
+                if v == vdef then out:write(" -- default") end
+                out:write("\n")
+            end
+            out:write(indent, "}")
         else
-            out:write("\n")
+            out:write("{}")
         end
-    end
-end
-
-local function dump_json_log_access(access, out, indent)
-    indentout(out, indent, "{\n")
-    indentout(out, indent + 1, '"type": "%s",\n', access.type)
-    indentout(out, indent + 1, '"address": %u,\n', access.address)
-    indentout(out, indent + 1, '"read": "%s"', hexstring(access.read))
-    if access.type == "write" then
-        out:write(",\n")
-        indentout(out, indent + 1, '"written": "%s"', hexstring(access.written))
-    end
-    if access.proof then
-        out:write(",\n")
-        indentout(out, indent + 1, '"proof": {\n')
-        dump_json_proof(access.proof, out, indent + 2)
-        indentout(out, indent + 1, "}\n")
+    elseif math.type(what) == "integer" then
+        out:write(string.format("0x%x", what))
     else
-        out:write("\n")
+        out:write(string.format("%q", what))
     end
-    indentout(out, indent, "}")
 end
 
-local function dump_json_log_accesses(accesses, out, indent)
-    local n = #accesses
-    for i, access in ipairs(accesses) do
-        dump_json_log_access(access, out, indent)
-        if i < n then
-            out:write(",\n")
-        else
-            out:write("\n")
-        end
-    end
-end
-
-function _M.dump_json_log(log, init_mcycle, init_uarch_cycle, final_mcycle, final_uarch_cycle, out, indent)
-    indent = indent or 0
-    indentout(out, indent, "{\n")
-    indentout(out, indent + 1, '"init_mcycle": %u,\n', init_mcycle)
-    indentout(out, indent + 1, '"init_uarch_cycle": %u,\n', init_uarch_cycle)
-    indentout(out, indent + 1, '"final_mcycle": %u,\n', final_mcycle)
-    indentout(out, indent + 1, '"final_uarch_cycle": %u,\n', final_uarch_cycle)
-    indentout(out, indent + 1, '"accesses": [\n')
-    dump_json_log_accesses(log.accesses, out, indent + 2)
-    indentout(out, indent + 1, "]")
-    if log.log_type.annotations then
-        out:write(",\n")
-        indentout(out, indent + 1, '"notes": [\n')
-        dump_json_log_notes(log.notes, out, indent + 2)
-        indentout(out, indent + 1, "],\n")
-        indentout(out, indent + 1, '"brackets": [\n')
-        dump_json_log_brackets(log.brackets, out, indent + 2)
-        indentout(out, indent + 1, "]\n")
-    else
-        out:write("\n")
-    end
-    indentout(out, indent, "}")
-end
+_M.dump_table = dump_table
 
 function _M.parse_number(n)
     if not n then return nil end
@@ -174,7 +100,23 @@ function _M.parse_boolean(b)
     return nil
 end
 
-function _M.parse_options(s, all, keys)
+-- String-shaped kinds: all parsed identically as strings, but the subtype
+-- carries a hint used by bash completion to pick the right candidates.
+local string_kinds = {
+    string = true,
+    file = true,
+    dir = true,
+    hostport = true,
+    netif = true,
+}
+_M.string_kinds = string_kinds
+
+-- The array part of "keys" (keys[1], optional) names the key that receives a
+-- bare value: a comma item with no colon that is not itself a declared key. At
+-- most one such positional is allowed. A colon inside a positional value must be
+-- escaped, since an unescaped colon always means key:value (so typos still error).
+function _M.parse_options(keys, all, opts)
+    local positional_key = keys[1]
     local function escape(v)
         -- replace escaped \, :, and , with something "safe"
         v = string.gsub(v, "%\\%\\", "\0")
@@ -188,16 +130,24 @@ function _M.parse_options(s, all, keys)
     end
     -- split at commas and validate key
     local options = {}
-    string.gsub(escape(s) .. ",", "(.-)%,", function(o)
+    local positional_seen = false
+    string.gsub(escape(opts) .. ",", "(.-)%,", function(o)
         local k, v = string.match(o, "(.-):(.*)")
         if k and v then
             k = unescape(k)
             v = unescape(v)
-        else
+            assert(keys[k], string.format("unknown option %q in '%s'", k, all))
+        elseif keys[unescape(o)] ~= nil then
             k = unescape(o)
             v = nil
+        else
+            -- not a declared key: treat as the positional value
+            k = unescape(o)
+            assert(positional_key, string.format("unknown option %q in '%s'", k, all))
+            assert(not positional_seen, string.format("only one positional value allowed in '%s'", all))
+            positional_seen = true
+            v, k = k, positional_key
         end
-        assert(keys[k], string.format("unknown option %q in '%s'", k, all))
         if keys[k] == "array" then
             options[k] = options[k] or {}
             table.insert(options[k], v)
@@ -213,7 +163,7 @@ function _M.parse_options(s, all, keys)
             v = _M.parse_number(v)
             if v == nil then error(string.format("invalid number for option %q in '%s'", k, all)) end
             options[k] = v
-        elseif keys[k] == "string" then
+        elseif string_kinds[keys[k]] then
             if v == nil then error(string.format("missing string for option %q in '%s'", k, all)) end
             options[k] = v
         elseif type(keys[k]) == "table" then
@@ -252,7 +202,7 @@ local function accessdatastring(data, data_hash, data_log2_size, address)
     end
 end
 
-function _M.dump_log(log, out)
+function _M.print_log(log, out)
     local indent = 0
     local j = 1 -- Bracket index
     local i = 1 -- Access index
@@ -299,4 +249,62 @@ function _M.dump_log(log, out)
     end
 end
 
+function _M.ilog2(n)
+    -- Returns the smallest r such that 2^r >= n, with n read as an unsigned 64-bit integer.
+    n = assert(math.tointeger(n), "expected integer")
+    assert(n ~= 0, "expected non-zero integer")
+    -- Working on n - 1 keeps exact powers of two from being rounded up one step too far.
+    local rest = n - 1
+    local log2 = 0
+    -- Binary search for the highest set bit. Each step tests the upper half of the bits still
+    -- under consideration and, when any of them is set, drops the lower half and records
+    -- how many bits were dropped.
+    local steps = {
+        { 32, 0xFFFFFFFF00000000 },
+        { 16, 0x00000000FFFF0000 },
+        { 8, 0x000000000000FF00 },
+        { 4, 0x00000000000000F0 },
+        { 2, 0x000000000000000C },
+        { 1, 0x0000000000000002 },
+    }
+    for _, step in ipairs(steps) do
+        local shift, mask = step[1], step[2]
+        if rest & mask ~= 0 then
+            rest = rest >> shift
+            log2 = log2 + shift
+        end
+    end
+    -- At this point rest is 0 or 1. A remaining 1 is the highest bit of n - 1 itself, which
+    -- contributes one more to the result.
+    if rest ~= 0 then
+        log2 = log2 + 1
+    end
+    return log2
+end
+
+-- Returns the drive in config[what] (e.g. "nvram" or "flash_drive") whose label matches, after
+-- filling in its log2_size from its length. Returns nil and an error message when there is no such
+-- drive, so a caller can simply wrap the call in assert().
+function _M.find_drive(config, what, label)
+    for _, drive in ipairs(config[what] or {}) do -- an absent list is treated as holding no drives
+        if drive.label == label then
+            drive.log2_size = _M.ilog2(drive.length) -- fills the field in on the config entry itself
+            return drive
+        end
+    end
+    return nil, string.format("missing %s %s", label, what)
+end
+
+-- Reads the entire contents of a file as a binary string.
+function _M.read_file(filename)
+    local input <close> = assert(io.open(filename, "rb")) -- <close> shuts the handle on return or error
+    return assert(input:read("a")) -- "a" reads from the current position to the end of the file
+end
+
+-- Writes a binary string as the entire contents of a file.
+function _M.write_file(contents, filename)
+    local output <close> = assert(io.open(filename, "wb")) -- "wb" creates the file or truncates an existing one
+    assert(output:write(contents)) -- a failed write returns a falsy value plus a message, which assert raises
+end
+
 return _M
diff --git a/src/clua-cartesi-jsonrpc.cpp b/src/clua-cartesi-jsonrpc.cpp
index 03a247743..d437036dc 100644
--- a/src/clua-cartesi-jsonrpc.cpp
+++ b/src/clua-cartesi-jsonrpc.cpp
@@ -84,7 +84,7 @@ static int jsonrpc_machine_obj_index_get_server_version(lua_State *L) {
     if (cm_jsonrpc_get_server_version(m.get(), &version) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_json_table(L, version);
+    clua_fromjson(L, version);
     return 1;
 }
 
diff --git a/src/clua-cartesi.cpp b/src/clua-cartesi.cpp
index c78b25929..782db40ad 100644
--- a/src/clua-cartesi.cpp
+++ b/src/clua-cartesi.cpp
@@ -136,9 +136,11 @@ static int cartesi_mod_frombase64(lua_State *L) try {
 }
 
 static int cartesi_mod_tojson(lua_State *L) try {
+    lua_settop(L, 4);
     const int indent = static_cast<int>(luaL_optinteger(L, 2, -1));
+    const char *schema_name = luaL_optstring(L, 3, nullptr);
+    clua_tojson(L, 1, indent, schema_name, clua_tojsonschemadict(L, 4));
     lua_settop(L, 1);
-    clua_check_json_string(L, 1, indent);
     return 1;
 } catch (const std::exception &e) {
     luaL_error(L, "%s", e.what());
@@ -146,7 +148,9 @@ static int cartesi_mod_tojson(lua_State *L) try {
 }
 
 static int cartesi_mod_fromjson(lua_State *L) try {
-    clua_push_json_table(L, luaL_checkstring(L, 1));
+    lua_settop(L, 3);
+    const char *schema_name = luaL_optstring(L, 2, nullptr);
+    clua_fromjson(L, luaL_checkstring(L, 1), schema_name, clua_tojsonschemadict(L, 3));
     return 1;
 } catch (const std::exception &e) {
     luaL_error(L, "%s", e.what());
@@ -221,6 +225,7 @@ CM_API int luaopen_cartesi(lua_State *L) {
     clua_setintegerfield(L, CM_HASH_TREE_LOG2_WORD_SIZE, "HASH_TREE_LOG2_WORD_SIZE", -1);
     clua_setintegerfield(L, CM_HASH_TREE_LOG2_PAGE_SIZE, "HASH_TREE_LOG2_PAGE_SIZE", -1);
     clua_setintegerfield(L, CM_HASH_TREE_LOG2_ROOT_SIZE, "HASH_TREE_LOG2_ROOT_SIZE", -1);
+    clua_setintegerfield(L, CM_CMIO_LOG2_MAX_OUTPUT_COUNT, "CMIO_LOG2_MAX_OUTPUT_COUNT", -1);
     clua_setintegerfield(L, CM_BREAK_REASON_FAILED, "BREAK_REASON_FAILED", -1);
     clua_setintegerfield(L, CM_BREAK_REASON_HALTED, "BREAK_REASON_HALTED", -1);
     clua_setintegerfield(L, CM_BREAK_REASON_YIELDED_MANUALLY, "BREAK_REASON_YIELDED_MANUALLY", -1);
@@ -234,16 +239,14 @@ CM_API int luaopen_cartesi(lua_State *L) {
     clua_setintegerfield(L, CM_UARCH_BREAK_REASON_CYCLE_OVERFLOW, "UARCH_BREAK_REASON_CYCLE_OVERFLOW", -1);
     clua_setintegerfield(L, CM_ACCESS_LOG_TYPE_ANNOTATIONS, "ACCESS_LOG_TYPE_ANNOTATIONS", -1);
     clua_setintegerfield(L, CM_ACCESS_LOG_TYPE_LARGE_DATA, "ACCESS_LOG_TYPE_LARGE_DATA", -1);
-    clua_setintegerfield(L, CM_CMIO_YIELD_COMMAND_AUTOMATIC, "CMIO_YIELD_COMMAND_AUTOMATIC", -1);
-    clua_setintegerfield(L, CM_CMIO_YIELD_COMMAND_MANUAL, "CMIO_YIELD_COMMAND_MANUAL", -1);
-    clua_setintegerfield(L, CM_CMIO_YIELD_AUTOMATIC_REASON_PROGRESS, "CMIO_YIELD_AUTOMATIC_REASON_PROGRESS", -1);
-    clua_setintegerfield(L, CM_CMIO_YIELD_AUTOMATIC_REASON_TX_OUTPUT, "CMIO_YIELD_AUTOMATIC_REASON_TX_OUTPUT", -1);
-    clua_setintegerfield(L, CM_CMIO_YIELD_AUTOMATIC_REASON_TX_REPORT, "CMIO_YIELD_AUTOMATIC_REASON_TX_REPORT", -1);
-    clua_setintegerfield(L, CM_CMIO_YIELD_MANUAL_REASON_RX_ACCEPTED, "CMIO_YIELD_MANUAL_REASON_RX_ACCEPTED", -1);
-    clua_setintegerfield(L, CM_CMIO_YIELD_MANUAL_REASON_RX_REJECTED, "CMIO_YIELD_MANUAL_REASON_RX_REJECTED", -1);
-    clua_setintegerfield(L, CM_CMIO_YIELD_MANUAL_REASON_TX_EXCEPTION, "CMIO_YIELD_MANUAL_REASON_TX_EXCEPTION", -1);
-    clua_setintegerfield(L, CM_CMIO_YIELD_REASON_ADVANCE_STATE, "CMIO_YIELD_REASON_ADVANCE_STATE", -1);
-    clua_setintegerfield(L, CM_CMIO_YIELD_REASON_INSPECT_STATE, "CMIO_YIELD_REASON_INSPECT_STATE", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_AUTOMATIC_REASON_PROGRESS, "HTIF_YIELD_AUTOMATIC_REASON_PROGRESS", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT, "HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT, "HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED, "HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_MANUAL_REASON_RX_REJECTED, "HTIF_YIELD_MANUAL_REASON_RX_REJECTED", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION, "HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_REASON_ADVANCE_STATE, "HTIF_YIELD_REASON_ADVANCE_STATE", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_REASON_INSPECT_STATE, "HTIF_YIELD_REASON_INSPECT_STATE", -1);
     clua_setintegerfield(L, CM_SHARING_NONE, "SHARING_NONE", -1);
     clua_setintegerfield(L, CM_SHARING_CONFIG, "SHARING_CONFIG", -1);
     clua_setintegerfield(L, CM_SHARING_ALL, "SHARING_ALL", -1);
@@ -259,22 +262,60 @@ CM_API int luaopen_cartesi(lua_State *L) {
     clua_setintegerfield(L, CM_AR_SHADOW_TLB_START, "AR_SHADOW_TLB_START", -1);
     clua_setintegerfield(L, CM_AR_PMAS_START, "AR_PMAS_START", -1);
     clua_setintegerfield(L, CM_AR_PMAS_LENGTH, "AR_PMAS_LENGTH", -1);
+    clua_setintegerfield(L, CM_PMA_EMPTY_DID, "PMA_EMPTY_DID", -1);
+    clua_setintegerfield(L, CM_PMA_MEMORY_DID, "PMA_MEMORY_DID", -1);
+    clua_setintegerfield(L, CM_PMA_SHADOW_STATE_DID, "PMA_SHADOW_STATE_DID", -1);
+    clua_setintegerfield(L, CM_PMA_FLASH_DRIVE_DID, "PMA_FLASH_DRIVE_DID", -1);
+    clua_setintegerfield(L, CM_PMA_CLINT_DID, "PMA_CLINT_DID", -1);
+    clua_setintegerfield(L, CM_PMA_HTIF_DID, "PMA_HTIF_DID", -1);
+    clua_setintegerfield(L, CM_PMA_PLIC_DID, "PMA_PLIC_DID", -1);
+    clua_setintegerfield(L, CM_PMA_CMIO_RX_BUFFER_DID, "PMA_CMIO_RX_BUFFER_DID", -1);
+    clua_setintegerfield(L, CM_PMA_CMIO_TX_BUFFER_DID, "PMA_CMIO_TX_BUFFER_DID", -1);
+    clua_setintegerfield(L, CM_PMA_SHADOW_UARCH_STATE_DID, "PMA_SHADOW_UARCH_STATE_DID", -1);
+    clua_setintegerfield(L, CM_PMA_VIRTIO_DID, "PMA_VIRTIO_DID", -1);
+    clua_setintegerfield(L, CM_PMA_NVRAM_DID, "PMA_NVRAM_DID", -1);
     clua_setintegerfield(L, CM_AR_DTB_START, "AR_DTB_START", -1);
     clua_setintegerfield(L, CM_AR_DTB_LENGTH, "AR_DTB_LENGTH", -1);
     clua_setintegerfield(L, CM_AR_CLINT_START, "AR_CLINT_START", -1);
     clua_setintegerfield(L, CM_AR_CLINT_LENGTH, "AR_CLINT_LENGTH", -1);
     clua_setintegerfield(L, CM_AR_HTIF_START, "AR_HTIF_START", -1);
     clua_setintegerfield(L, CM_AR_HTIF_LENGTH, "AR_HTIF_LENGTH", -1);
+    clua_setintegerfield(L, CM_RTC_FREQ_DIV, "RTC_FREQ_DIV", -1);
     clua_setintegerfield(L, CM_AR_PLIC_START, "AR_PLIC_START", -1);
     clua_setintegerfield(L, CM_AR_PLIC_LENGTH, "AR_PLIC_LENGTH", -1);
     clua_setintegerfield(L, CM_AR_FIRST_VIRTIO_START, "AR_FIRST_VIRTIO_START", -1);
     clua_setintegerfield(L, CM_AR_LAST_VIRTIO_END, "AR_LAST_VIRTIO_END", -1);
-    clua_setintegerfield(L, CM_AR_DRIVE_START, "AR_DRIVE_START", -1);
-    clua_setintegerfield(L, CM_AR_DRIVE_OFFSET, "AR_DRIVE_OFFSET", -1);
-    clua_setstringfield(L, CM_DTB_BOOTARGS_CONSOLE, "DTB_BOOTARGS_CONSOLE", -1);
-    clua_setstringfield(L, CM_DTB_BOOTARGS_UIO, "DTB_BOOTARGS_UIO", -1);
-    clua_setstringfield(L, CM_DTB_BOOTARGS_ROOT, "DTB_BOOTARGS_ROOT", -1);
+    clua_setstringfield(L, CM_DTB_BOOTARGS_CONSOLE_PART, "DTB_BOOTARGS_CONSOLE_PART", -1);
+    clua_setstringfield(L, CM_DTB_BOOTARGS_UIO_PART, "DTB_BOOTARGS_UIO_PART", -1);
+    clua_setstringfield(L, CM_DTB_BOOTARGS_ROOT_PART, "DTB_BOOTARGS_ROOT_PART", -1);
+    clua_setstringfield(L, CM_DTB_BOOTARGS_INIT_PART, "DTB_BOOTARGS_INIT_PART", -1);
     clua_setstringfield(L, CM_DTB_BOOTARGS_INIT, "DTB_BOOTARGS_INIT", -1);
+    // HTIF register fields
+    clua_setintegerfield(L, CM_HTIF_DEV_SHIFT, "HTIF_DEV_SHIFT", -1);
+    clua_setintegerfield(L, CM_HTIF_CMD_SHIFT, "HTIF_CMD_SHIFT", -1);
+    clua_setintegerfield(L, CM_HTIF_REASON_SHIFT, "HTIF_REASON_SHIFT", -1);
+    clua_setintegerfield(L, CM_HTIF_DATA_SHIFT, "HTIF_DATA_SHIFT", -1);
+    clua_setintegerfield(L, CM_HTIF_DEV_MASK, "HTIF_DEV_MASK", -1);
+    clua_setintegerfield(L, CM_HTIF_CMD_MASK, "HTIF_CMD_MASK", -1);
+    clua_setintegerfield(L, CM_HTIF_REASON_MASK, "HTIF_REASON_MASK", -1);
+    clua_setintegerfield(L, CM_HTIF_DATA_MASK, "HTIF_DATA_MASK", -1);
+    // HTIF devices and commands
+    clua_setintegerfield(L, CM_HTIF_DEV_HALT, "HTIF_DEV_HALT", -1);
+    clua_setintegerfield(L, CM_HTIF_DEV_CONSOLE, "HTIF_DEV_CONSOLE", -1);
+    clua_setintegerfield(L, CM_HTIF_DEV_YIELD, "HTIF_DEV_YIELD", -1);
+    clua_setintegerfield(L, CM_HTIF_HALT_CMD_HALT, "HTIF_HALT_CMD_HALT", -1);
+    clua_setintegerfield(L, CM_HTIF_CONSOLE_CMD_GETCHAR, "HTIF_CONSOLE_CMD_GETCHAR", -1);
+    clua_setintegerfield(L, CM_HTIF_CONSOLE_CMD_PUTCHAR, "HTIF_CONSOLE_CMD_PUTCHAR", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_CMD_AUTOMATIC, "HTIF_YIELD_CMD_AUTOMATIC", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_CMD_MANUAL, "HTIF_YIELD_CMD_MANUAL", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_AUTOMATIC_REASON_PROGRESS, "HTIF_YIELD_AUTOMATIC_REASON_PROGRESS", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT, "HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT, "HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED, "HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_MANUAL_REASON_RX_REJECTED, "HTIF_YIELD_MANUAL_REASON_RX_REJECTED", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION, "HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_REASON_ADVANCE_STATE, "HTIF_YIELD_REASON_ADVANCE_STATE", -1);
+    clua_setintegerfield(L, CM_HTIF_YIELD_REASON_INSPECT_STATE, "HTIF_YIELD_REASON_INSPECT_STATE", -1);
     // HTIF masks
     clua_setintegerfield(L, HTIF_HALT_CMD_HALT_MASK, "HTIF_HALT_CMD_HALT_MASK", -1);
     clua_setintegerfield(L, HTIF_CONSOLE_CMD_GETCHAR_MASK, "HTIF_CONSOLE_CMD_GETCHAR_MASK", -1);
@@ -290,7 +331,6 @@ CM_API int luaopen_cartesi(lua_State *L) {
     clua_setintegerfield(L, UARCH_RAM_START_ADDRESS, "UARCH_RAM_START_ADDRESS", -1);
     clua_setintegerfield(L, UARCH_ECALL_FN_HALT, "UARCH_ECALL_FN_HALT", -1);
     clua_setintegerfield(L, UARCH_ECALL_FN_PUTCHAR, "UARCH_ECALL_FN_PUTCHAR", -1);
-    clua_setintegerfield(L, UARCH_ECALL_FN_MARK_DIRTY_PAGE, "UARCH_ECALL_FN_MARK_DIRTY_PAGE", -1);
     clua_setintegerfield(L, UARCH_ECALL_FN_WRITE_TLB, "UARCH_ECALL_FN_WRITE_TLB", -1);
     // NOLINTNEXTLINE(cppcoreguidelines-pro-type-reinterpret-cast)
     clua_setlstringfield(L, reinterpret_cast<const char *>(uarch_pristine_hash), uarch_pristine_hash_len,
diff --git a/src/clua-i-machine.cpp b/src/clua-i-machine.cpp
index 744f9024c..0ea7a6cae 100644
--- a/src/clua-i-machine.cpp
+++ b/src/clua-i-machine.cpp
@@ -17,7 +17,6 @@
 #include "clua-i-machine.hpp"
 
 #include <algorithm>
-#include <cassert>
 #include <cstddef>
 #include <cstdint>
 #include <cstring>
@@ -26,6 +25,7 @@
 #include <string>
 #include <string_view>
 #include <unordered_map>
+#include <utility>
 
 #include <json.hpp>
 
@@ -271,18 +271,73 @@ static int64_t clua_get_array_table_len(lua_State *L, int tabidx) {
     return len;
 }
 
-static const nlohmann::json &clua_get_json_field_schema(const std::string_view field_name, const nlohmann::json &schema,
-    const nlohmann::json &schema_dict) {
+static const nlohmann::json &clua_get_machine_schema_dict(lua_State *L);
+
+/// \brief Resolves a type name to its schema definition, following alias chains.
+/// \details The empty name and "Default" carry no schema and yield an empty (passthrough) schema;
+/// a nullptr name never reaches this function, it is handled earlier by clua_get_type_schema.
+/// Any other name is looked up in the user dictionary first, then the machine dictionary. It maps
+/// either to an object schema, which is returned, or to a string. A string naming a different type
+/// is an alias and is followed. A string naming itself is a leaf primitive (Base64, ArrayIndex,
+/// Schema) and is returned as is. Following aliases is what lets a user type be a bare top-level
+/// alias to a compound machine type (e.g. "AccessLog"), not just to a leaf. An unknown name or a
+/// cyclic chain is an error.
+static const nlohmann::json &clua_resolve_type_schema(lua_State *L, std::string_view type_name,
+    const nlohmann::json &user_schema_dict) {
+    static const nlohmann::json empty_schema;
+    // The chain cannot be longer than the number of distinct names, so bound the walk generously
+    // to turn a cyclic user dictionary into an error rather than an infinite loop.
+    for (int hops = 0; hops < 1024; ++hops) {
+        // "Default" and the empty name carry no schema, so the value passes through untranslated,
+        // as a plain table. This holds for a top-level name and for a field type alike.
+        if (type_name.empty() || type_name == "Default") {
+            return empty_schema;
+        }
+        const nlohmann::json *value = nullptr;
+        if (user_schema_dict.contains(type_name)) {
+            value = &user_schema_dict.at(type_name);
+        } else {
+            const auto &machine_schema_dict = clua_get_machine_schema_dict(L);
+            if (!machine_schema_dict.contains(type_name)) {
+                throw std::runtime_error{"type \"" + std::string{type_name} + "\" is not defined in schema dictionary"};
+            }
+            value = &machine_schema_dict.at(type_name);
+        }
+        if (!value->is_string()) {
+            return *value; // object schema
+        }
+        const auto next = value->template get<std::string_view>();
+        if (next == type_name) {
+            return *value; // self-referential leaf primitive
+        }
+        type_name = next; // follow the alias
+    }
+    throw std::runtime_error{"type \"" + std::string{type_name} + "\" has a cyclic schema definition"};
+}
+
+static const nlohmann::json &clua_get_type_schema(lua_State *L, const char *type_name,
+    const nlohmann::json &user_schema_dict = nlohmann::json()) {
+    static const nlohmann::json empty_schema;
+    if (type_name == nullptr) {
+        return empty_schema;
+    }
+    return clua_resolve_type_schema(L, type_name, user_schema_dict);
+}
+
+/// \brief Resolves the schema of a field within a parent definition.
+/// \details A field absent in the parent yields an empty (passthrough) schema. The field's type name
+/// is resolved through the same alias chain as a top-level name.
+static const nlohmann::json &clua_get_field_schema(lua_State *L, const std::string_view field_name,
+    const nlohmann::json &schema, const nlohmann::json &user_schema_dict) {
     static const nlohmann::json empty_schema;
     if (!schema.contains(field_name)) {
         return empty_schema;
     }
-    const auto &type_name = schema.at(field_name).template get<std::string_view>();
-    return schema_dict.at(type_name);
+    return clua_resolve_type_schema(L, schema.at(field_name).template get<std::string_view>(), user_schema_dict);
 }
 
-static nlohmann::json &clua_push_json_value_ref(lua_State *L, int idx, int ctxidx, const nlohmann::json &schema,
-    const nlohmann::json &schema_dict) {
+static nlohmann::json &clua_push_managed_toclose_json_ref(lua_State *L, int idx, const nlohmann::json &schema,
+    const nlohmann::json &user_schema_dict, int ctxidx) {
     nlohmann::json &j = *clua_push_new_managed_toclose_ptr(L, nlohmann::json(), ctxidx);
     idx -= idx < 0 ? 1 : 0; // adjust offset after pushing j reference
     switch (lua_type(L, idx)) {
@@ -290,10 +345,10 @@ static nlohmann::json &clua_push_json_value_ref(lua_State *L, int idx, int ctxid
             const int64_t len = clua_get_array_table_len(L, idx);
             if (len >= 0) { // array
                 j = nlohmann::json::array();
-                const auto &field_schema = clua_get_json_field_schema("items", schema, schema_dict);
+                const auto &field_schema = clua_get_field_schema(L, "items", schema, user_schema_dict);
                 for (int64_t i = 1; i <= len; ++i) {
                     lua_geti(L, idx, i);
-                    j.push_back(clua_push_json_value_ref(L, -1, ctxidx, field_schema, schema_dict));
+                    j.push_back(clua_push_managed_toclose_json_ref(L, -1, field_schema, user_schema_dict, ctxidx));
                     lua_pop(L, 2); // pop value, child j reference
                 }
             } else { // object
@@ -305,8 +360,8 @@ static nlohmann::json &clua_push_json_value_ref(lua_State *L, int idx, int ctxid
                         luaL_error(L, "table maps cannot contain keys of type %s", lua_typename(L, lua_type(L, -2)));
                     }
                     const char *field_name = lua_tostring(L, -2);
-                    const auto &field_schema = clua_get_json_field_schema(field_name, schema, schema_dict);
-                    j[field_name] = clua_push_json_value_ref(L, -1, ctxidx, field_schema, schema_dict);
+                    const auto &field_schema = clua_get_field_schema(L, field_name, schema, user_schema_dict);
+                    j[field_name] = clua_push_managed_toclose_json_ref(L, -1, field_schema, user_schema_dict, ctxidx);
                     lua_pop(L, 2); // pop value, child j reference
                 }
                 lua_pop(L, 1); // pop table
@@ -349,35 +404,15 @@ static nlohmann::json &clua_push_json_value_ref(lua_State *L, int idx, int ctxid
     return j;
 }
 
-const char *clua_check_json_string(lua_State *L, int idx, int indent, int ctxidx, const nlohmann::json &schema,
-    const nlohmann::json &schema_dict) {
-    assert(idx > 0);
-    if (!lua_istable(L, idx)) {
-        luaL_error(L, "failed to parse JSON from a Lua value: expected a table but got type \"%s\"",
-            lua_typename(L, lua_type(L, idx)));
-    }
-    try {
-        const nlohmann::json &j = clua_push_json_value_ref(L, idx, ctxidx, schema, schema_dict);
-        std::string &s = *clua_push_new_managed_toclose_ptr(L, j.dump(indent), ctxidx);
-        lua_pushlstring(L, s.data(), s.size());
-        lua_replace(L, idx);             // replace the Lua value with its JSON string representation
-        lua_pop(L, 2);                   // pop s, j references
-        return luaL_checkstring(L, idx); // return the string
-    } catch (const std::exception &e) {
-        luaL_error(L, "failed to parse JSON from a Lua table: %s", e.what());
-        return nullptr;
-    }
-}
-
-static void clua_push_json_value(lua_State *L, const nlohmann::json &j, int ctxidx, const nlohmann::json &schema,
-    const nlohmann::json &schema_dict) {
+static void clua_push_json_value(lua_State *L, const nlohmann::json &j, const nlohmann::json &schema,
+    const nlohmann::json &user_schema_dict, int ctxidx) {
     switch (j.type()) {
         case nlohmann::json::value_t::array: {
-            const auto &field_schema = clua_get_json_field_schema("items", schema, schema_dict);
+            const auto &field_schema = clua_get_field_schema(L, "items", schema, user_schema_dict);
             lua_createtable(L, static_cast<int>(j.size()), 0);
             int64_t i = 1;
             for (auto it = j.begin(); it != j.end(); ++it, ++i) {
-                clua_push_json_value(L, *it, ctxidx, field_schema, schema_dict);
+                clua_push_json_value(L, *it, field_schema, user_schema_dict, ctxidx);
                 lua_rawseti(L, -2, i);
             }
             break;
@@ -386,8 +421,8 @@ static void clua_push_json_value(lua_State *L, const nlohmann::json &j, int ctxi
             lua_createtable(L, 0, static_cast<int>(j.size()));
             for (const auto &el : j.items()) {
                 const auto &field_name = el.key();
-                const auto &field_schema = clua_get_json_field_schema(field_name, schema, schema_dict);
-                clua_push_json_value(L, el.value(), ctxidx, field_schema, schema_dict);
+                const auto &field_schema = clua_get_field_schema(L, field_name, schema, user_schema_dict);
+                clua_push_json_value(L, el.value(), field_schema, user_schema_dict, ctxidx);
                 lua_setfield(L, -2, field_name.c_str());
             }
             break;
@@ -402,7 +437,7 @@ static void clua_push_json_value(lua_State *L, const nlohmann::json &j, int ctxi
                 lua_pop(L, 1);      // pop binary_data reference
             } else if (schema.is_object() && schema.contains(data)) {
                 static const nlohmann::json empty_schema;
-                clua_push_json_value(L, schema.at(data), ctxidx, empty_schema, schema_dict);
+                clua_push_json_value(L, schema.at(data), empty_schema, user_schema_dict, ctxidx);
             } else {
                 lua_pushlstring(L, data.data(), data.length());
             }
@@ -439,19 +474,6 @@ static void clua_push_json_value(lua_State *L, const nlohmann::json &j, int ctxi
     }
 }
 
-void clua_push_json_table(lua_State *L, const char *s, int ctxidx, const nlohmann::json &schema,
-    const nlohmann::json &schema_dict) {
-    try {
-        lua_pushnil(L); // reserve a slot in the stack (needed because of lua_toclose semantics)
-        const nlohmann::json &j = *clua_push_new_managed_toclose_ptr(L, nlohmann::json::parse(s), ctxidx);
-        clua_push_json_value(L, j, ctxidx, schema, schema_dict);
-        lua_replace(L, -3); // move into the placeholder slot
-        lua_pop(L, 1);      // pop j reference
-    } catch (const std::exception &e) {
-        luaL_error(L, "failed to parse JSON from a string: %s", e.what());
-    }
-}
-
 static const nlohmann::json &clua_get_machine_schema_dict(lua_State *L) try {
     // In order to convert Lua tables <-> JSON objects we have to define a schema
     // to transform some special fields, we only care about:
@@ -460,6 +482,7 @@ static const nlohmann::json &clua_get_machine_schema_dict(lua_State *L) try {
     // - Array indexes (translate 0 based index in JSON to 1 based index in Lua)
     static const nlohmann::json machine_schema_dict = {
         {"Base64", "Base64"},
+        {"Schema", "Schema"},
         {"InterpreterBreakReason",
             {{"failed", CM_BREAK_REASON_FAILED}, {"halted", CM_BREAK_REASON_HALTED},
                 {"yielded_manually", CM_BREAK_REASON_YIELDED_MANUALLY},
@@ -528,22 +551,47 @@ static const nlohmann::json &clua_get_machine_schema_dict(lua_State *L) try {
     return dummy;
 }
 
-const char *clua_check_schemed_json_string(lua_State *L, int idx, const std::string &schema_name, int ctxidx) {
-    const auto &machine_schema_dict = clua_get_machine_schema_dict(L);
-    const auto it = machine_schema_dict.find(schema_name);
-    if (it == machine_schema_dict.end()) {
-        luaL_error(L, "type \"%s\" is not defined in machine schema dictionary", schema_name.c_str());
+const nlohmann::json &clua_tojsonschemadict(lua_State *L, int idx, int ctxidx) {
+    if (lua_isnoneornil(L, idx)) {
+        static const nlohmann::json empty_object = nlohmann::json::object();
+        return empty_object;
     }
-    return clua_check_json_string(L, idx, -1, ctxidx, *it, machine_schema_dict);
+    // A schema dictionary is plain JSON with only string/int leaves and no translated fields,
+    // so the "Schema" primitive makes converting one a pure passthrough. The returned reference stays
+    // valid while, and only while, the slot it pushes onto the stack remains there.
+    const auto &schema = clua_get_type_schema(L, "Schema");
+    return clua_push_managed_toclose_json_ref(L, idx, schema, nlohmann::json(), ctxidx);
 }
 
-void clua_push_schemed_json_table(lua_State *L, const char *s, const std::string &schema_name, int ctxidx) {
-    const auto &machine_schema_dict = clua_get_machine_schema_dict(L);
-    const auto it = machine_schema_dict.find(schema_name);
-    if (it == machine_schema_dict.end()) {
-        luaL_error(L, "type \"%s\" is not defined in machine schema dictionary", schema_name.c_str());
+const char *clua_tojson(lua_State *L, int idx, int indent, const char *schema_name,
+    const nlohmann::json &user_schema_dict, int ctxidx) {
+    idx = lua_absindex(L, idx);
+    try {
+        const nlohmann::json &schema = clua_get_type_schema(L, schema_name, user_schema_dict);
+        const nlohmann::json &j = clua_push_managed_toclose_json_ref(L, idx, schema, user_schema_dict, ctxidx);
+        std::string &s = *clua_push_new_managed_toclose_ptr(L, j.dump(indent), ctxidx);
+        lua_pushlstring(L, s.data(), s.size());
+        lua_replace(L, idx);             // replace the Lua value with its JSON string representation
+        lua_pop(L, 2);                   // pop s, j references
+        return luaL_checkstring(L, idx); // return the string
+    } catch (const std::exception &e) {
+        luaL_error(L, "failed to convert a Lua value to JSON: %s", e.what());
+        return nullptr;
+    }
+}
+
+void clua_fromjson(lua_State *L, const char *s, const char *schema_name, const nlohmann::json &user_schema_dict,
+    int ctxidx) {
+    try {
+        const nlohmann::json &schema = clua_get_type_schema(L, schema_name, user_schema_dict);
+        lua_pushnil(L); // reserve a slot in the stack (needed because of lua_toclose semantics)
+        const nlohmann::json &j = *clua_push_new_managed_toclose_ptr(L, nlohmann::json::parse(s), ctxidx);
+        clua_push_json_value(L, j, schema, user_schema_dict, ctxidx);
+        lua_replace(L, -3); // move into the placeholder slot
+        lua_pop(L, 1);      // pop j reference
+    } catch (const std::exception &e) {
+        luaL_error(L, "failed to parse JSON from a string: %s", e.what());
     }
-    clua_push_json_table(L, s, ctxidx, *it, machine_schema_dict);
 }
 
 /// \brief This is the machine:get_proof() method implementation.
@@ -558,7 +606,7 @@ static int machine_obj_index_get_proof(lua_State *L) {
     if (cm_get_proof(m.get(), address, log2_target_size, log2_root_size, &proof) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_schemed_json_table(L, proof, "Proof");
+    clua_fromjson(L, proof, "Proof");
     return 1;
 }
 
@@ -572,7 +620,7 @@ static int machine_obj_index_get_hash_tree_stats(lua_State *L) {
     if (cm_get_hash_tree_stats(m.get(), clear, &stats) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_json_table(L, stats);
+    clua_fromjson(L, stats);
     return 1;
 }
 
@@ -582,7 +630,7 @@ static int machine_obj_index_get_initial_config(lua_State *L) {
     if (cm_get_initial_config(m.get(), &config) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_json_table(L, config);
+    clua_fromjson(L, config);
     return 1;
 }
 
@@ -594,7 +642,7 @@ static int machine_obj_index_get_runtime_config(lua_State *L) {
     if (cm_get_runtime_config(m.get(), &runtime_config) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_json_table(L, runtime_config);
+    clua_fromjson(L, runtime_config);
     return 1;
 }
 
@@ -602,7 +650,7 @@ static int machine_obj_index_get_runtime_config(lua_State *L) {
 /// \param L Lua state.
 static int machine_obj_index_set_runtime_config(lua_State *L) {
     auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
-    const char *runtime_config = clua_check_json_string(L, 2);
+    const char *runtime_config = clua_tojson(L, 2);
     if (cm_set_runtime_config(m.get(), runtime_config) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
@@ -621,6 +669,30 @@ static int machine_obj_index_get_root_hash(lua_State *L) {
     return 1;
 }
 
+/// \brief This is the machine:read_revert_root_hash() method implementation.
+/// \param L Lua state.
+static int machine_obj_index_read_revert_root_hash(lua_State *L) {
+    auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
+    cm_hash revert_root_hash{};
+    if (cm_read_revert_root_hash(m.get(), &revert_root_hash) != 0) {
+        return luaL_error(L, "%s", cm_get_last_error_message());
+    }
+    clua_push_cm_hash(L, &revert_root_hash);
+    return 1;
+}
+
+/// \brief This is the machine:write_revert_root_hash() method implementation.
+/// \param L Lua state.
+static int machine_obj_index_write_revert_root_hash(lua_State *L) {
+    auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
+    cm_hash revert_root_hash{};
+    clua_check_cm_hash(L, 2, &revert_root_hash);
+    if (cm_write_revert_root_hash(m.get(), &revert_root_hash) != 0) {
+        return luaL_error(L, "%s", cm_get_last_error_message());
+    }
+    return 0;
+}
+
 /// \brief This is the machine:get_node_hash() method implementation.
 /// \param L Lua state.
 static int machine_obj_index_get_node_hash(lua_State *L) {
@@ -746,7 +818,7 @@ static int machine_obj_index_get_address_ranges(lua_State *L) {
     if (cm_get_address_ranges(m.get(), &ranges) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_json_table(L, ranges);
+    clua_fromjson(L, ranges);
     return 1;
 }
 
@@ -759,7 +831,7 @@ static int machine_obj_index_log_reset_uarch(lua_State *L) {
     if (cm_log_reset_uarch(m.get(), log_type, &log) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_schemed_json_table(L, log, "AccessLog");
+    clua_fromjson(L, log, "AccessLog");
     return 1;
 }
 
@@ -785,7 +857,7 @@ static int machine_obj_index_log_step_uarch(lua_State *L) {
     if (cm_log_step_uarch(m.get(), log_type, &log) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_schemed_json_table(L, log, "AccessLog");
+    clua_fromjson(L, log, "AccessLog");
     return 1;
 }
 
@@ -976,7 +1048,7 @@ static int machine_obj_index_write_console_input(lua_State *L) {
 static int machine_obj_index_replace_memory_range(lua_State *L) {
     lua_settop(L, 2);
     auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
-    const char *range_config = clua_check_json_string(L, 2);
+    const char *range_config = clua_tojson(L, 2);
     if (cm_replace_memory_range(m.get(), range_config) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
@@ -1023,11 +1095,13 @@ static int machine_obj_index_receive_cmio_request(lua_State *L) {
 /// \param L Lua state.
 static int machine_obj_index_send_cmio_response(lua_State *L) {
     auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
-    const auto reason = static_cast<uint16_t>(luaL_checkinteger(L, 2));
+    cm_hash revert_root_hash{};
+    clua_check_cm_hash(L, 2, &revert_root_hash);
+    const auto reason = static_cast<uint16_t>(luaL_checkinteger(L, 3));
     size_t length{0};
     // NOLINTNEXTLINE(cppcoreguidelines-pro-type-reinterpret-cast)
-    const auto *data = reinterpret_cast<const unsigned char *>(luaL_checklstring(L, 3, &length));
-    if (cm_send_cmio_response(m.get(), reason, data, length) != 0) {
+    const auto *data = reinterpret_cast<const unsigned char *>(luaL_checklstring(L, 4, &length));
+    if (cm_send_cmio_response(m.get(), &revert_root_hash, reason, data, length) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
     return 0;
@@ -1037,16 +1111,18 @@ static int machine_obj_index_send_cmio_response(lua_State *L) {
 /// \param L Lua state.
 static int machine_obj_index_log_send_cmio_response(lua_State *L) {
     auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
-    const auto reason = static_cast<uint16_t>(luaL_checkinteger(L, 2));
-    const int log_type = static_cast<int>(luaL_optinteger(L, 4, 0));
+    cm_hash revert_root_hash{};
+    clua_check_cm_hash(L, 2, &revert_root_hash);
+    const auto reason = static_cast<uint16_t>(luaL_checkinteger(L, 3));
+    const int log_type = static_cast<int>(luaL_optinteger(L, 5, 0));
     size_t length{0};
     // NOLINTNEXTLINE(cppcoreguidelines-pro-type-reinterpret-cast)
-    const auto *data = reinterpret_cast<const unsigned char *>(luaL_checklstring(L, 3, &length));
+    const auto *data = reinterpret_cast<const unsigned char *>(luaL_checklstring(L, 4, &length));
     const char *log = nullptr;
-    if (cm_log_send_cmio_response(m.get(), reason, data, length, log_type, &log) != 0) {
+    if (cm_log_send_cmio_response(m.get(), &revert_root_hash, reason, data, length, log_type, &log) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_schemed_json_table(L, log, "AccessLog");
+    clua_fromjson(L, log, "AccessLog");
     return 1;
 }
 
@@ -1067,10 +1143,10 @@ static int machine_obj_index_is_empty(lua_State *L) {
 static int machine_obj_index_create(lua_State *L) {
     lua_settop(L, 4);
     auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
-    const char *runtime_config = !lua_isnil(L, 3) ? clua_check_json_string(L, 3) : nullptr;
+    const char *runtime_config = !lua_isnil(L, 3) ? clua_tojson(L, 3) : nullptr;
     const char *dir = luaL_optstring(L, 4, nullptr);
     // Create or load a machine depending on the type of the first argument
-    const char *config = clua_check_json_string(L, 2);
+    const char *config = clua_tojson(L, 2);
     if (cm_create(m.get(), config, runtime_config, dir) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
@@ -1087,29 +1163,30 @@ static int machine_obj_index_collect_mcycle_root_hashes(lua_State *L) {
     const uint64_t mcycle_period = luaL_checkinteger(L, 3);
     const uint64_t mcycle_phase = luaL_optinteger(L, 4, 0);
     const auto log2_bundle_uarch_cycle_count = static_cast<int32_t>(luaL_optinteger(L, 5, 0));
-    const char *previous_back_tree =
-        !lua_isnil(L, 6) ? clua_check_schemed_json_string(L, 6, "BackMerkleTree") : nullptr;
+    const char *previous_back_tree = !lua_isnil(L, 6) ? clua_tojson(L, 6, -1, "BackMerkleTree") : nullptr;
     const char *result = nullptr;
     if (cm_collect_mcycle_root_hashes(m.get(), mcycle_end, mcycle_period, mcycle_phase, log2_bundle_uarch_cycle_count,
             previous_back_tree, &result) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_schemed_json_table(L, result, "McycleRootHashes");
+    clua_fromjson(L, result, "McycleRootHashes");
     return 1;
 }
 
 /// \brief This is the machine:collect_uarch_cycle_root_hashes() method implementation.
 /// \param L Lua state.
 static int machine_obj_index_collect_uarch_cycle_root_hashes(lua_State *L) {
-    lua_settop(L, 3);
+    lua_settop(L, 4);
     auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
     const uint64_t mcycle_end = luaL_checkinteger(L, 2);
     const auto log2_bundle_uarch_cycle_count = static_cast<int32_t>(luaL_optinteger(L, 3, 0));
+    const char *revert_uarch_tail = !lua_isnil(L, 4) ? clua_tojson(L, 4, -1, "Base64Array") : nullptr;
     const char *result = nullptr;
-    if (cm_collect_uarch_cycle_root_hashes(m.get(), mcycle_end, log2_bundle_uarch_cycle_count, &result) != 0) {
+    if (cm_collect_uarch_cycle_root_hashes(m.get(), mcycle_end, log2_bundle_uarch_cycle_count, revert_uarch_tail,
+            &result) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_schemed_json_table(L, result, "UarchCycleRootHashes");
+    clua_fromjson(L, result, "UarchCycleRootHashes");
     return 1;
 }
 
@@ -1118,7 +1195,7 @@ static int machine_obj_index_collect_uarch_cycle_root_hashes(lua_State *L) {
 static int machine_obj_index_load(lua_State *L) {
     lua_settop(L, 4);
     auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
-    const char *runtime_config = !lua_isnil(L, 3) ? clua_check_json_string(L, 3) : nullptr;
+    const char *runtime_config = !lua_isnil(L, 3) ? clua_tojson(L, 3) : nullptr;
     const char *dir = luaL_checkstring(L, 2);
     const auto sharing = static_cast<cm_sharing_mode>(luaL_optinteger(L, 4, CM_SHARING_NONE));
     if (cm_load(m.get(), dir, runtime_config, sharing) != 0) {
@@ -1136,7 +1213,7 @@ static int machine_obj_index_get_default_config(lua_State *L) {
     if (cm_get_default_config(m.get(), &config) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    clua_push_json_table(L, config);
+    clua_fromjson(L, config);
     return 1;
 }
 
@@ -1188,7 +1265,7 @@ static int machine_obj_index_verify_step_uarch(lua_State *L) {
     auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
     cm_hash root_hash{};
     clua_check_cm_hash(L, 2, &root_hash);
-    const char *log = clua_check_schemed_json_string(L, 3, "AccessLog");
+    const char *log = clua_tojson(L, 3, -1, "AccessLog");
     cm_hash target_hash{};
     clua_check_cm_hash(L, 4, &target_hash);
     if (cm_verify_step_uarch(m.get(), &root_hash, log, &target_hash) != 0) {
@@ -1204,7 +1281,7 @@ static int machine_obj_index_verify_reset_uarch(lua_State *L) {
     auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
     cm_hash root_hash{};
     clua_check_cm_hash(L, 2, &root_hash);
-    const char *log = clua_check_schemed_json_string(L, 3, "AccessLog");
+    const char *log = clua_tojson(L, 3, -1, "AccessLog");
     cm_hash target_hash{};
     clua_check_cm_hash(L, 4, &target_hash);
     if (cm_verify_reset_uarch(m.get(), &root_hash, log, &target_hash) != 0) {
@@ -1216,18 +1293,21 @@ static int machine_obj_index_verify_reset_uarch(lua_State *L) {
 /// \brief This is the machine:verify_send_cmio_response() method implementation.
 /// \param L Lua state.
 static int machine_obj_index_verify_send_cmio_response(lua_State *L) {
-    lua_settop(L, 6);
+    lua_settop(L, 7);
     auto &m = clua_check<clua_managed_cm_ptr<cm_machine>>(L, 1);
-    const auto reason = static_cast<uint16_t>(luaL_checkinteger(L, 2));
+    cm_hash revert_root_hash{};
+    clua_check_cm_hash(L, 2, &revert_root_hash);
+    const auto reason = static_cast<uint16_t>(luaL_checkinteger(L, 3));
     size_t length{0};
     // NOLINTNEXTLINE(cppcoreguidelines-pro-type-reinterpret-cast)
-    const auto *data = reinterpret_cast<const unsigned char *>(luaL_checklstring(L, 3, &length));
+    const auto *data = reinterpret_cast<const unsigned char *>(luaL_checklstring(L, 4, &length));
     cm_hash root_hash{};
-    clua_check_cm_hash(L, 4, &root_hash);
-    const char *log = clua_check_schemed_json_string(L, 5, "AccessLog");
+    clua_check_cm_hash(L, 5, &root_hash);
+    const char *log = clua_tojson(L, 6, -1, "AccessLog");
     cm_hash target_hash{};
-    clua_check_cm_hash(L, 6, &target_hash);
-    if (cm_verify_send_cmio_response(m.get(), reason, data, length, &root_hash, log, &target_hash) != 0) {
+    clua_check_cm_hash(L, 7, &target_hash);
+    if (cm_verify_send_cmio_response(m.get(), &revert_root_hash, reason, data, length, &root_hash, log, &target_hash) !=
+        0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
     return 0;
@@ -1256,6 +1336,8 @@ static const auto machine_obj_index = cartesi::clua_make_luaL_Reg_array({
     {"get_hash_tree_stats", machine_obj_index_get_hash_tree_stats},
     {"get_reg_address", machine_obj_index_get_reg_address},
     {"get_root_hash", machine_obj_index_get_root_hash},
+    {"read_revert_root_hash", machine_obj_index_read_revert_root_hash},
+    {"write_revert_root_hash", machine_obj_index_write_revert_root_hash},
     {"get_node_hash", machine_obj_index_get_node_hash},
     {"get_runtime_config", machine_obj_index_get_runtime_config},
     {"is_empty", machine_obj_index_is_empty},
@@ -1307,10 +1389,10 @@ static int machine_meta_call(lua_State *L) {
     if (cm_clone_empty(m.get(), &new_m.get()) != 0) {
         return luaL_error(L, "%s", cm_get_last_error_message());
     }
-    const char *runtime_config = !lua_isnil(L, 3) ? clua_check_json_string(L, 3) : nullptr;
+    const char *runtime_config = !lua_isnil(L, 3) ? clua_tojson(L, 3) : nullptr;
     // Create or load a machine depending on the type of the first argument
     if (lua_isstring(L, 2) == 0) {
-        const char *config = clua_check_json_string(L, 2);
+        const char *config = clua_tojson(L, 2);
         const char *dir = luaL_optstring(L, 4, nullptr);
         if (cm_create(new_m.get(), config, runtime_config, dir) != 0) {
             return luaL_error(L, "%s", cm_get_last_error_message());
diff --git a/src/clua-i-machine.hpp b/src/clua-i-machine.hpp
index cc03f2867..8f00b2245 100644
--- a/src/clua-i-machine.hpp
+++ b/src/clua-i-machine.hpp
@@ -153,44 +153,39 @@ void clua_push_cm_hash(lua_State *L, const cm_hash *hash);
 /// \param c_hash Receives hash
 void clua_check_cm_hash(lua_State *L, int idx, cm_hash *c_hash);
 
-/// \brief Replaces a Lua table with its JSON string representation and returns the string
+/// \brief Converts a Lua schema-dictionary table to JSON, once at the Lua boundary
 /// \param L Lua state
-/// \param idx Lua table stack index which will be converted to a Lua string
+/// \param idx Stack index of the Lua schema-dictionary table
+/// \param ctxidx Index (or pseudo-index) of clua context
+/// \returns Reference to the schema dictionary as a JSON object (a shared empty object when idx is nil or none)
+/// \details The returned reference stays valid while, and only while, the slot it pushes onto the stack
+/// remains there.
+const nlohmann::json &clua_tojsonschemadict(lua_State *L, int idx, int ctxidx = lua_upvalueindex(1));
+
+/// \brief Replaces a Lua value with its JSON string representation and returns the string
+/// \param L Lua state
+/// \param idx Stack index of the Lua value which will be converted to a Lua string
 /// \param indent JSON indentation when converting it to a string
+/// \param schema_name Name of the root type, resolved in user_schema_dict then the machine dictionary
+/// (nullptr means no schema)
+/// \param user_schema_dict User-supplied schema dictionary (empty object means none)
 /// \param ctxidx Index (or pseudo-index) of clua context
-/// \param schema Schema for the table
-/// \param schema_dict Dictionary containing schema for all types
 /// \returns It traverses the Lua value while converting to a JSON object
-/// \details In case the Lua valua is already a string, it just returns it
-const char *clua_check_json_string(lua_State *L, int idx, int indent = -1, int ctxidx = lua_upvalueindex(1),
-    const nlohmann::json &schema = nlohmann::json(), const nlohmann::json &schema_dict = nlohmann::json());
+/// \details The value may be a table, string, number, boolean or nil, allowing a bare hash or scalar to
+/// be serialized (e.g. a binary string under the "Base64" schema), not only a table
+const char *clua_tojson(lua_State *L, int idx, int indent = -1, const char *schema_name = nullptr,
+    const nlohmann::json &user_schema_dict = nlohmann::json(), int ctxidx = lua_upvalueindex(1));
 
 /// \brief Parses a JSON from a string and pushes it as a Lua table
 /// \param L Lua state
 /// \param s JSON string
+/// \param schema_name Name of the root type, resolved in user_schema_dict then the machine dictionary
+/// (nullptr means no schema)
+/// \param user_schema_dict User-supplied schema dictionary (empty object means none)
 /// \param ctxidx Index (or pseudo-index) of clua context
-/// \param schema Schema for the table
-/// \param schema_dict Dictionary containing schema for all types
 /// \returns It traverses the JSON object while converting to a Lua object
-void clua_push_json_table(lua_State *L, const char *s, int ctxidx = lua_upvalueindex(1),
-    const nlohmann::json &schema = nlohmann::json(), const nlohmann::json &schema_dict = nlohmann::json());
-
-/// \brief Replaces a Lua table with its JSON string representation and returns the string (schemed version)
-/// \param L Lua state
-/// \param idx Lua table stack index which will be converted to a Lua string
-/// \param schema_name Schema name to be used while converting the table
-/// \param ctxidx Index (or pseudo-index) of clua context
-const char *clua_check_schemed_json_string(lua_State *L, int idx, const std::string &schema_name,
-    int ctxidx = lua_upvalueindex(1));
-
-/// \brief Parses a JSON from a string and pushes it as a Lua table (schemed version)
-/// \param L Lua state
-/// \param s JSON string
-/// \param idx Lua table stack index which will be converted to a Lua string
-/// \param schema_name Schema name to be used while converting the table
-/// \param ctxidx Index (or pseudo-index) of clua context
-void clua_push_schemed_json_table(lua_State *L, const char *s, const std::string &schema_name,
-    int ctxidx = lua_upvalueindex(1));
+void clua_fromjson(lua_State *L, const char *s, const char *schema_name = nullptr,
+    const nlohmann::json &user_schema_dict = nlohmann::json(), int ctxidx = lua_upvalueindex(1));
 
 } // namespace cartesi
 
diff --git a/src/cm.cpp b/src/cm.cpp
index 29af542c6..3fa4087fd 100644
--- a/src/cm.cpp
+++ b/src/cm.cpp
@@ -57,7 +57,10 @@
 #include "machine-runtime-config.hpp"
 #include "machine.hpp"
 #include "os-features.hpp"
+#include "pmas-defines.h"
 #include "ranges.hpp"
+#include "rtc-defines.h"
+#include "send-cmio-response.hpp"
 #include "sha-256-hasher.hpp"
 #include "uarch-defines.h"
 
@@ -69,6 +72,7 @@ static std::string &get_last_err_msg_storage() {
 static_assert(static_cast<int>(cartesi::FLASH_DRIVE_MAX) == CM_FLASH_DRIVE_MAX);
 static_assert(static_cast<int>(cartesi::NVRAM_MAX) == CM_NVRAM_MAX);
 static_assert(static_cast<int>(cartesi::MEMORY_RANGE_LABEL_MAX) == CM_MEMORY_RANGE_LABEL_MAX);
+static_assert(static_cast<int>(cartesi::CMIO_LOG2_MAX_OUTPUT_COUNT) == CM_CMIO_LOG2_MAX_OUTPUT_COUNT);
 
 static_assert(AR_CMIO_RX_BUFFER_START_DEF == CM_AR_CMIO_RX_BUFFER_START);
 static_assert(AR_CMIO_RX_BUFFER_LOG2_SIZE_DEF == CM_AR_CMIO_RX_BUFFER_LOG2_SIZE);
@@ -80,6 +84,18 @@ static_assert(AR_SHADOW_STATE_START_DEF == CM_AR_SHADOW_STATE_START);
 static_assert(AR_SHADOW_STATE_LENGTH_DEF == CM_AR_SHADOW_STATE_LENGTH);
 static_assert(AR_PMAS_START_DEF == CM_AR_PMAS_START);
 static_assert(AR_PMAS_LENGTH_DEF == CM_AR_PMAS_LENGTH);
+static_assert(PMA_EMPTY_DID_DEF == CM_PMA_EMPTY_DID);
+static_assert(PMA_MEMORY_DID_DEF == CM_PMA_MEMORY_DID);
+static_assert(PMA_SHADOW_STATE_DID_DEF == CM_PMA_SHADOW_STATE_DID);
+static_assert(PMA_FLASH_DRIVE_DID_DEF == CM_PMA_FLASH_DRIVE_DID);
+static_assert(PMA_CLINT_DID_DEF == CM_PMA_CLINT_DID);
+static_assert(PMA_HTIF_DID_DEF == CM_PMA_HTIF_DID);
+static_assert(PMA_PLIC_DID_DEF == CM_PMA_PLIC_DID);
+static_assert(PMA_CMIO_RX_BUFFER_DID_DEF == CM_PMA_CMIO_RX_BUFFER_DID);
+static_assert(PMA_CMIO_TX_BUFFER_DID_DEF == CM_PMA_CMIO_TX_BUFFER_DID);
+static_assert(PMA_SHADOW_UARCH_STATE_DID_DEF == CM_PMA_SHADOW_UARCH_STATE_DID);
+static_assert(PMA_VIRTIO_DID_DEF == CM_PMA_VIRTIO_DID);
+static_assert(PMA_NVRAM_DID_DEF == CM_PMA_NVRAM_DID);
 static_assert(AR_CLINT_START_DEF == CM_AR_CLINT_START);
 static_assert(AR_CLINT_LENGTH_DEF == CM_AR_CLINT_LENGTH);
 static_assert(AR_HTIF_START_DEF == CM_AR_HTIF_START);
@@ -92,23 +108,40 @@ static_assert((UINT64_C(1) << AR_CMIO_RX_BUFFER_LOG2_SIZE_DEF) == CM_AR_CMIO_RX_
 static_assert((UINT64_C(1) << AR_CMIO_TX_BUFFER_LOG2_SIZE_DEF) == CM_AR_CMIO_TX_BUFFER_LENGTH);
 static_assert(AR_DTB_START_DEF == CM_AR_DTB_START);
 static_assert(AR_DTB_LENGTH_DEF == CM_AR_DTB_LENGTH);
-static_assert(AR_DRIVE_START_DEF == CM_AR_DRIVE_START);
-static_assert(AR_DRIVE_OFFSET_DEF == CM_AR_DRIVE_OFFSET);
-static_assert(std::string_view{DTB_BOOTARGS_CONSOLE} == std::string_view{CM_DTB_BOOTARGS_CONSOLE});
-static_assert(std::string_view{DTB_BOOTARGS_UIO} == std::string_view{CM_DTB_BOOTARGS_UIO});
-static_assert(std::string_view{DTB_BOOTARGS_ROOT} == std::string_view{CM_DTB_BOOTARGS_ROOT});
+static_assert(std::string_view{DTB_BOOTARGS_CONSOLE_PART} == std::string_view{CM_DTB_BOOTARGS_CONSOLE_PART});
+static_assert(std::string_view{DTB_BOOTARGS_UIO_PART} == std::string_view{CM_DTB_BOOTARGS_UIO_PART});
+static_assert(std::string_view{DTB_BOOTARGS_ROOT_PART} == std::string_view{CM_DTB_BOOTARGS_ROOT_PART});
+static_assert(std::string_view{DTB_BOOTARGS_INIT_PART} == std::string_view{CM_DTB_BOOTARGS_INIT_PART});
 static_assert(std::string_view{DTB_BOOTARGS_INIT} == std::string_view{CM_DTB_BOOTARGS_INIT});
 
 static_assert(UARCH_CYCLE_MAX_DEF == CM_UARCH_CYCLE_MAX);
-
-static_assert(HTIF_YIELD_AUTOMATIC_REASON_PROGRESS_DEF == CM_CMIO_YIELD_AUTOMATIC_REASON_PROGRESS);
-static_assert(HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT_DEF == CM_CMIO_YIELD_AUTOMATIC_REASON_TX_OUTPUT);
-static_assert(HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT_DEF == CM_CMIO_YIELD_AUTOMATIC_REASON_TX_REPORT);
-static_assert(HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED_DEF == CM_CMIO_YIELD_MANUAL_REASON_RX_ACCEPTED);
-static_assert(HTIF_YIELD_MANUAL_REASON_RX_REJECTED_DEF == CM_CMIO_YIELD_MANUAL_REASON_RX_REJECTED);
-static_assert(HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION_DEF == CM_CMIO_YIELD_MANUAL_REASON_TX_EXCEPTION);
-static_assert(HTIF_YIELD_REASON_ADVANCE_STATE_DEF == CM_CMIO_YIELD_REASON_ADVANCE_STATE);
-static_assert(HTIF_YIELD_REASON_INSPECT_STATE_DEF == CM_CMIO_YIELD_REASON_INSPECT_STATE);
+static_assert(RTC_FREQ_DIV_DEF == CM_RTC_FREQ_DIV);
+
+static_assert(HTIF_DEV_SHIFT_DEF == CM_HTIF_DEV_SHIFT);
+static_assert(HTIF_CMD_SHIFT_DEF == CM_HTIF_CMD_SHIFT);
+static_assert(HTIF_REASON_SHIFT_DEF == CM_HTIF_REASON_SHIFT);
+static_assert(HTIF_DATA_SHIFT_DEF == CM_HTIF_DATA_SHIFT);
+static_assert(HTIF_DEV_MASK_DEF == CM_HTIF_DEV_MASK);
+static_assert(HTIF_CMD_MASK_DEF == CM_HTIF_CMD_MASK);
+static_assert(HTIF_REASON_MASK_DEF == CM_HTIF_REASON_MASK);
+static_assert(HTIF_DATA_MASK_DEF == CM_HTIF_DATA_MASK);
+static_assert(HTIF_DEV_HALT_DEF == CM_HTIF_DEV_HALT);
+static_assert(HTIF_DEV_CONSOLE_DEF == CM_HTIF_DEV_CONSOLE);
+static_assert(HTIF_DEV_YIELD_DEF == CM_HTIF_DEV_YIELD);
+static_assert(HTIF_HALT_CMD_HALT_DEF == CM_HTIF_HALT_CMD_HALT);
+static_assert(HTIF_CONSOLE_CMD_GETCHAR_DEF == CM_HTIF_CONSOLE_CMD_GETCHAR);
+static_assert(HTIF_CONSOLE_CMD_PUTCHAR_DEF == CM_HTIF_CONSOLE_CMD_PUTCHAR);
+static_assert(HTIF_YIELD_CMD_AUTOMATIC_DEF == CM_HTIF_YIELD_CMD_AUTOMATIC);
+static_assert(HTIF_YIELD_CMD_MANUAL_DEF == CM_HTIF_YIELD_CMD_MANUAL);
+
+static_assert(HTIF_YIELD_AUTOMATIC_REASON_PROGRESS_DEF == CM_HTIF_YIELD_AUTOMATIC_REASON_PROGRESS);
+static_assert(HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT_DEF == CM_HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT);
+static_assert(HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT_DEF == CM_HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT);
+static_assert(HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED_DEF == CM_HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED);
+static_assert(HTIF_YIELD_MANUAL_REASON_RX_REJECTED_DEF == CM_HTIF_YIELD_MANUAL_REASON_RX_REJECTED);
+static_assert(HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION_DEF == CM_HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION);
+static_assert(HTIF_YIELD_REASON_ADVANCE_STATE_DEF == CM_HTIF_YIELD_REASON_ADVANCE_STATE);
+static_assert(HTIF_YIELD_REASON_INSPECT_STATE_DEF == CM_HTIF_YIELD_REASON_INSPECT_STATE);
 
 uint64_t cm_get_version() {
     return CM_VERSION_NUM;
@@ -665,12 +698,15 @@ cm_error cm_collect_mcycle_root_hashes(cm_machine *m, uint64_t mcycle_end, uint6
 }
 
 cm_error cm_collect_uarch_cycle_root_hashes(cm_machine *m, uint64_t mcycle_end, int32_t log2_bundle_uarch_cycle_count,
-    const char **result) try {
+    const char *revert_uarch_tail, const char **result) try {
     if (result == nullptr) {
         throw std::invalid_argument("invalid result output");
     }
     auto *cpp_m = convert_from_c(m);
-    const auto cpp_res = cpp_m->collect_uarch_cycle_root_hashes(mcycle_end, log2_bundle_uarch_cycle_count);
+    const auto cpp_revert_uarch_tail =
+        cartesi::from_json<cartesi::machine_hashes>(revert_uarch_tail, "revert_uarch_tail");
+    const auto cpp_res =
+        cpp_m->collect_uarch_cycle_root_hashes(mcycle_end, log2_bundle_uarch_cycle_count, cpp_revert_uarch_tail);
     *result = cm_set_temp_string(cartesi::to_json(cpp_res).dump());
     return cm_result_success();
 } catch (...) {
@@ -851,6 +887,24 @@ cm_error cm_get_root_hash(const cm_machine *m, cm_hash *hash) try {
     return cm_result_failure();
 }
 
+cm_error cm_read_revert_root_hash(const cm_machine *m, cm_hash *hash) try {
+    const auto *cpp_m = convert_from_c(m);
+    const cartesi::machine_hash cpp_hash = cpp_m->read_revert_root_hash();
+    convert_to_c(cpp_hash, hash);
+    return cm_result_success();
+} catch (...) {
+    return cm_result_failure();
+}
+
+cm_error cm_write_revert_root_hash(cm_machine *m, const cm_hash *hash) try {
+    auto *cpp_m = convert_from_c(m);
+    const cartesi::machine_hash cpp_hash = convert_from_c(hash);
+    cpp_m->write_revert_root_hash(cpp_hash);
+    return cm_result_success();
+} catch (...) {
+    return cm_result_failure();
+}
+
 cm_error cm_get_node_hash(const cm_machine *m, uint64_t address, int log2_size, cm_hash *hash) try {
     const auto *cpp_m = convert_from_c(m);
     const cartesi::machine_hash cpp_hash = cpp_m->get_node_hash(address, log2_size);
@@ -1190,22 +1244,26 @@ cm_error cm_receive_cmio_request(const cm_machine *m, uint8_t *cmd, uint16_t *re
     return cm_result_failure();
 }
 
-cm_error cm_send_cmio_response(cm_machine *m, uint16_t reason, const uint8_t *data, uint64_t length) try {
+cm_error cm_send_cmio_response(cm_machine *m, const cm_hash *revert_root_hash, uint16_t reason, const uint8_t *data,
+    uint64_t length) try {
     auto *cpp_m = convert_from_c(m);
-    cpp_m->send_cmio_response(reason, data, length);
+    const cartesi::machine_hash cpp_revert_root_hash = convert_from_c(revert_root_hash);
+    cpp_m->send_cmio_response(cpp_revert_root_hash, reason, data, length);
     return cm_result_success();
 } catch (...) {
     return cm_result_failure();
 }
 
-cm_error cm_log_send_cmio_response(cm_machine *m, uint16_t reason, const uint8_t *data, uint64_t length,
-    int32_t log_type, const char **log) try {
+cm_error cm_log_send_cmio_response(cm_machine *m, const cm_hash *revert_root_hash, uint16_t reason, const uint8_t *data,
+    uint64_t length, int32_t log_type, const char **log) try {
     if (log == nullptr) {
         throw std::invalid_argument("invalid access log output");
     }
     auto *cpp_m = convert_from_c(m);
+    const cartesi::machine_hash cpp_revert_root_hash = convert_from_c(revert_root_hash);
     const cartesi::access_log::type cpp_log_type(log_type);
-    const cartesi::access_log cpp_log = cpp_m->log_send_cmio_response(reason, data, length, cpp_log_type);
+    const cartesi::access_log cpp_log =
+        cpp_m->log_send_cmio_response(cpp_revert_root_hash, reason, data, length, cpp_log_type);
     *log = cm_set_temp_string(cartesi::to_json(cpp_log).dump());
     return cm_result_success();
 } catch (...) {
@@ -1215,21 +1273,24 @@ cm_error cm_log_send_cmio_response(cm_machine *m, uint16_t reason, const uint8_t
     return cm_result_failure();
 }
 
-cm_error cm_verify_send_cmio_response(const cm_machine *m, uint16_t reason, const uint8_t *data, uint64_t length,
-    const cm_hash *root_hash_before, const char *log, const cm_hash *root_hash_after) try {
+cm_error cm_verify_send_cmio_response(const cm_machine *m, const cm_hash *revert_root_hash, uint16_t reason,
+    const uint8_t *data, uint64_t length, const cm_hash *root_hash_before, const char *log,
+    const cm_hash *root_hash_after) try {
     if (log == nullptr) {
         throw std::invalid_argument("invalid access log");
     }
     const auto cpp_log = // NOLINTNEXTLINE(bugprone-unchecked-optional-access)
         cartesi::from_json<cartesi::not_default_constructible<cartesi::access_log>>(log, "log").value();
+    const cartesi::machine_hash cpp_revert_root_hash = convert_from_c(revert_root_hash);
     const cartesi::machine_hash cpp_root_hash_before = convert_from_c(root_hash_before);
     const cartesi::machine_hash cpp_root_hash_after = convert_from_c(root_hash_after);
     if (m != nullptr) {
         const auto *cpp_m = convert_from_c(m);
-        cpp_m->verify_send_cmio_response(reason, data, length, cpp_root_hash_before, cpp_log, cpp_root_hash_after);
-    } else {
-        cartesi::machine::verify_send_cmio_response(reason, data, length, cpp_root_hash_before, cpp_log,
+        cpp_m->verify_send_cmio_response(cpp_revert_root_hash, reason, data, length, cpp_root_hash_before, cpp_log,
             cpp_root_hash_after);
+    } else {
+        cartesi::machine::verify_send_cmio_response(cpp_revert_root_hash, reason, data, length, cpp_root_hash_before,
+            cpp_log, cpp_root_hash_after);
     }
     return cm_result_success();
 } catch (...) {
diff --git a/src/cm.h b/src/cm.h
index 57bc7f95d..0179461e3 100644
--- a/src/cm.h
+++ b/src/cm.h
@@ -39,13 +39,12 @@ extern "C" {
 static const uint64_t CM_MCYCLE_MAX = -1ULL;
 static const uint64_t CM_UARCH_CYCLE_MAX = 1ULL << 20;
 
-static const uint64_t CM_AR_DRIVE_START = 0x80000000000000ULL;  ///< Start PMA for flash drives and NVRAMs
-static const uint64_t CM_AR_DRIVE_OFFSET = 0x10000000000000ULL; ///< PMA slot stride for flash drives and NVRAMs
-
-#define CM_DTB_BOOTARGS_CONSOLE "quiet earlycon=sbi console=hvc0 "
-#define CM_DTB_BOOTARGS_UIO "uio_pdrv_genirq.of_id=generic-uio "
-#define CM_DTB_BOOTARGS_ROOT "root=/dev/pmem0 rw init=/usr/sbin/cartesi-init"
-#define CM_DTB_BOOTARGS_INIT (CM_DTB_BOOTARGS_CONSOLE CM_DTB_BOOTARGS_UIO CM_DTB_BOOTARGS_ROOT)
+#define CM_DTB_BOOTARGS_CONSOLE_PART "quiet earlycon=sbi console=hvc0 "
+#define CM_DTB_BOOTARGS_UIO_PART "uio_pdrv_genirq.of_id=generic-uio "
+#define CM_DTB_BOOTARGS_ROOT_PART "root=/dev/pmem0 rw "
+#define CM_DTB_BOOTARGS_INIT_PART "init=/usr/sbin/cartesi-init"
+#define CM_DTB_BOOTARGS_INIT                                                                                           \
+    (CM_DTB_BOOTARGS_CONSOLE_PART CM_DTB_BOOTARGS_UIO_PART CM_DTB_BOOTARGS_ROOT_PART CM_DTB_BOOTARGS_INIT_PART)
 
 // -----------------------------------------------------------------------------
 // API enums and structures
@@ -57,9 +56,11 @@ typedef enum cm_constant {
     CM_HASH_TREE_LOG2_WORD_SIZE = 5,
     CM_HASH_TREE_LOG2_PAGE_SIZE = 12,
     CM_HASH_TREE_LOG2_ROOT_SIZE = 64,
-    CM_FLASH_DRIVE_MAX = 8,         ///< Maximum number of flash drives
-    CM_NVRAM_MAX = 8,               ///< Maximum number of NVRAMs
-    CM_MEMORY_RANGE_LABEL_MAX = 31, ///< Maximum length of a memory range user label (DT alias constraint)
+    CM_CMIO_LOG2_MAX_OUTPUT_COUNT = 63, ///< Height of the cmio outputs Merkle tree (capacity 2^63 outputs)
+    CM_FLASH_DRIVE_MAX = 8,             ///< Maximum number of flash drives
+    CM_NVRAM_MAX = 8,                   ///< Maximum number of NVRAMs
+    CM_MEMORY_RANGE_LABEL_MAX = 31,     ///< Maximum length of a memory range user label (DT alias constraint)
+    CM_RTC_FREQ_DIV = 8192,             ///< mtime increments once per this many mcycle increments
 } cm_constant;
 
 /// \brief Physical memory addresses (only the most useful are exposed in the API).
@@ -90,6 +91,22 @@ typedef enum cm_pmas_constant {
     CM_AR_DTB_LENGTH = 0x100000,
 } cm_pmas_constant;
 
+/// \brief Driver IDs for PMA entries.
+typedef enum cm_pma_did {
+    CM_PMA_EMPTY_DID = 0,              ///< Driver ID for empty range
+    CM_PMA_MEMORY_DID = 1,             ///< Driver ID for memory
+    CM_PMA_SHADOW_STATE_DID = 2,       ///< Driver ID for shadow state device
+    CM_PMA_FLASH_DRIVE_DID = 3,        ///< Driver ID for flash drive device
+    CM_PMA_CLINT_DID = 4,              ///< Driver ID for CLINT device
+    CM_PMA_HTIF_DID = 5,               ///< Driver ID for HTIF device
+    CM_PMA_PLIC_DID = 6,               ///< Driver ID for PLIC device
+    CM_PMA_CMIO_RX_BUFFER_DID = 7,     ///< Driver ID for CMIO RX buffer
+    CM_PMA_CMIO_TX_BUFFER_DID = 8,     ///< Driver ID for CMIO TX buffer
+    CM_PMA_SHADOW_UARCH_STATE_DID = 9, ///< Driver ID for uarch shadow state device
+    CM_PMA_VIRTIO_DID = 10,            ///< Driver ID for VirtIO devices
+    CM_PMA_NVRAM_DID = 11,             ///< Driver ID for NVRAM
+} cm_pma_did;
+
 /// \brief Error codes returned from the C API.
 typedef enum cm_error {
     CM_ERROR_OK = 0,
@@ -142,24 +159,6 @@ typedef enum cm_access_log_type {
     CM_ACCESS_LOG_TYPE_LARGE_DATA = 2,  ///< Includes data larger than 8 bytes
 } cm_access_log_type;
 
-/// \brief Yield device commands.
-typedef enum cm_cmio_yield_command {
-    CM_CMIO_YIELD_COMMAND_AUTOMATIC,
-    CM_CMIO_YIELD_COMMAND_MANUAL,
-} cm_cmio_yield_command;
-
-/// \brief Yield reasons.
-typedef enum cm_cmio_yield_reason {
-    CM_CMIO_YIELD_AUTOMATIC_REASON_PROGRESS = 1,  ///< Progress is available
-    CM_CMIO_YIELD_AUTOMATIC_REASON_TX_OUTPUT = 2, ///< Output is available in tx buffer
-    CM_CMIO_YIELD_AUTOMATIC_REASON_TX_REPORT = 4, ///< Report is available in tx buffer
-    CM_CMIO_YIELD_MANUAL_REASON_RX_ACCEPTED = 1,  ///< Input in rx buffer was accepted
-    CM_CMIO_YIELD_MANUAL_REASON_RX_REJECTED = 2,  ///< Input in rx buffer was rejected
-    CM_CMIO_YIELD_MANUAL_REASON_TX_EXCEPTION = 4, ///< Exception happened
-    CM_CMIO_YIELD_REASON_ADVANCE_STATE = 0,       ///< Input in rx buffer is an advance state
-    CM_CMIO_YIELD_REASON_INSPECT_STATE = 1,       ///< Input in rx buffer is an inspect state
-} cm_cmio_yield_reason;
-
 /// \brief Sharing modes.
 typedef enum cm_sharing_mode {
     CM_SHARING_NONE = 0,   ///< No sharing, all machine changes will be in-memory
@@ -167,6 +166,48 @@ typedef enum cm_sharing_mode {
     CM_SHARING_ALL = 2,    ///< Share all backing stores, all machine changes will be on-disk
 } cm_sharing_mode;
 
+/// \brief HTIF tohost/fromhost register field shifts.
+typedef enum cm_htif_shift {
+    CM_HTIF_DEV_SHIFT = 56,
+    CM_HTIF_CMD_SHIFT = 48,
+    CM_HTIF_REASON_SHIFT = 32,
+    CM_HTIF_DATA_SHIFT = 0,
+} cm_htif_shift;
+
+/// \brief HTIF tohost/fromhost register field masks.
+static const uint64_t CM_HTIF_DEV_MASK = 0xFF00000000000000ULL;
+static const uint64_t CM_HTIF_CMD_MASK = 0x00FF000000000000ULL;
+static const uint64_t CM_HTIF_REASON_MASK = 0x0000FFFF00000000ULL;
+static const uint64_t CM_HTIF_DATA_MASK = 0x00000000FFFFFFFFULL;
+
+/// \brief HTIF device identifiers (DEV field of tohost/fromhost).
+typedef enum cm_htif_device {
+    CM_HTIF_DEV_HALT = 0,    ///< Halts the machine
+    CM_HTIF_DEV_CONSOLE = 1, ///< Console input and output
+    CM_HTIF_DEV_YIELD = 2,   ///< Yield control back to the host
+} cm_htif_device;
+
+/// \brief HTIF device commands (CMD field of tohost/fromhost).
+typedef enum cm_htif_command {
+    CM_HTIF_HALT_CMD_HALT = 0,
+    CM_HTIF_CONSOLE_CMD_GETCHAR = 0,
+    CM_HTIF_CONSOLE_CMD_PUTCHAR = 1,
+    CM_HTIF_YIELD_CMD_AUTOMATIC = 0,
+    CM_HTIF_YIELD_CMD_MANUAL = 1,
+} cm_htif_command;
+
+/// \brief HTIF yield reasons (REASON field of tohost/fromhost).
+typedef enum cm_htif_yield_reason {
+    CM_HTIF_YIELD_AUTOMATIC_REASON_PROGRESS = 1,
+    CM_HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT = 2,
+    CM_HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT = 4,
+    CM_HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED = 1,
+    CM_HTIF_YIELD_MANUAL_REASON_RX_REJECTED = 2,
+    CM_HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION = 4,
+    CM_HTIF_YIELD_REASON_ADVANCE_STATE = 0,
+    CM_HTIF_YIELD_REASON_INSPECT_STATE = 1,
+} cm_htif_yield_reason;
+
 /// \brief Machine x, f, and control and status registers.
 typedef enum cm_reg {
     // Machine x registers
@@ -592,6 +633,18 @@ CM_API cm_error cm_get_address_ranges(const cm_machine *m, const char **ranges);
 /// \returns 0 for success, non zero code for error.
 CM_API cm_error cm_get_root_hash(const cm_machine *m, cm_hash *hash);
 
+/// \brief Obtains the revert root hash from the shadow state.
+/// \param m Pointer to a non-empty machine object (holds a machine instance).
+/// \param hash Valid pointer to cm_hash structure that receives the hash.
+/// \returns 0 for success, non zero code for error.
+CM_API cm_error cm_read_revert_root_hash(const cm_machine *m, cm_hash *hash);
+
+/// \brief Writes the revert root hash to the shadow state.
+/// \param m Pointer to a non-empty machine object (holds a machine instance).
+/// \param hash Valid pointer to cm_hash structure with hash to store.
+/// \returns 0 for success, non zero code for error.
+CM_API cm_error cm_write_revert_root_hash(cm_machine *m, const cm_hash *hash);
+
 /// \brief Obtains the hash of a node in the hash tree.
 /// \param m Pointer to a non-empty machine object (holds a machine instance).
 /// \param address Address of node.
@@ -766,6 +819,10 @@ CM_API cm_error cm_run(cm_machine *m, uint64_t mcycle_end, cm_break_reason *brea
 /// If "break_reason" is "yielded_manually", "halted", or if mcycle reaches CM_MCYCLE_MAX (maximum mcycle value),
 /// this means that execution stopped at a fixed point.
 ///
+/// If execution stopped on a manual yield whose reason is rx-rejected, the root hash collected at the yield
+/// and the padding that follows are substituted by the recorded revert root hash, which is the root hash
+/// verifiers accept for these state transitions.
+///
 /// When \p log2_bundle_mcycle_count is greater than 0 and execution stops at a fixed point, then
 /// the next-to-last hash in "hashes" represents a bundle that is completed by padding with repetitions of the final
 /// root hash, and the last hash in "hashes" represents a bundle consisting entirely of repetitions of that same final
@@ -795,6 +852,12 @@ CM_API cm_error cm_run_uarch(cm_machine *m, uint64_t uarch_cycle_end, cm_uarch_b
 /// \param mcycle_end End machine cycle value to execute, uarch cycle by uarch cycle.
 /// \param log2_bundle_uarch_cycle_count Log base 2 of the amount of uarch cycle root hashes to bundle.
 /// If greater than 0, it collects subtree root hashes for 2^log2_bundle_uarch_cycle_count root hashes.
+/// \param revert_uarch_tail Optional JSON array (of hashes as base64-encoded strings) with the root hashes
+/// after each uarch cycle of the period of the machine the recorded revert root hash reverts to, the last
+/// entry being the revert root hash itself (can be NULL).
+/// It is obtained by calling this function with no bundling on that machine, while it waits for a response.
+/// Required unless the machine starts at a fixed point other than a rejected manual yield, in which case
+/// the call cannot consume it and ignores it.
 /// \param result Receives an JSON object as a string, guaranteed to remain valid only until
 /// the next CM_API function is called from the same thread.
 /// The field "hashes" is an array (of hashes as base64-encoded strings) with the root hashes after each uarch cycle.
@@ -826,8 +889,13 @@ CM_API cm_error cm_run_uarch(cm_machine *m, uint64_t uarch_cycle_end, cm_uarch_b
 /// In these cases, the function will attempt to execute one additional mcycle at this fixed point,
 /// and collect the resulting root hashes as well. As a result, all root hashes collected after the next-to-last
 /// reset index correspond to this fixed point.
+///
+/// The rejected manual yield is the exception to the paragraph above. When execution stops on a manual yield
+/// whose reason is rx-rejected, the root hash after the final uarch reset is substituted by the recorded
+/// revert root hash, and instead of executing one additional mcycle, the function collects one extra period,
+/// that of the reverted machine, as given by \p revert_uarch_tail.
 CM_API cm_error cm_collect_uarch_cycle_root_hashes(cm_machine *m, uint64_t mcycle_end,
-    int32_t log2_bundle_uarch_cycle_count, const char **result);
+    int32_t log2_bundle_uarch_cycle_count, const char *revert_uarch_tail, const char **result);
 
 /// \brief Resets the entire microarchitecture state to pristine values.
 /// \param m Pointer to a non-empty machine object (holds a machine instance).
@@ -852,13 +920,18 @@ CM_API cm_error cm_receive_cmio_request(const cm_machine *m, uint8_t *cmd, uint1
 
 /// \brief Sends a cmio response.
 /// \param m Pointer to a non-empty machine object (holds a machine instance).
+/// \param revert_root_hash Machine root hash to revert to in case the response is eventually rejected.
+/// For advance-state responses, it must be the root hash of the machine itself, and the machine must be
+/// waiting on an rx-accepted manual yield, both checked before any state changes. Other responses
+/// (inspect-state queries and GIO responses) are not checked.
 /// \param reason Reason for sending the response.
 /// \param data Response data to send.
 /// \param length Length of response data.
 /// \returns 0 for success, non zero code for error.
 /// \details This method should only be called as a response to cmio requests with manual yield command,
 /// where the reason is either accepted or a GIO request, may fail otherwise.
-CM_API cm_error cm_send_cmio_response(cm_machine *m, uint16_t reason, const uint8_t *data, uint64_t length);
+CM_API cm_error cm_send_cmio_response(cm_machine *m, const cm_hash *revert_root_hash, uint16_t reason,
+    const uint8_t *data, uint64_t length);
 
 // ------------------------------------
 // Logging
@@ -870,6 +943,9 @@ CM_API cm_error cm_send_cmio_response(cm_machine *m, uint16_t reason, const uint
 /// \param log_filename Name of the log file to be generated.
 /// \param break_reason Receives reason for returning (can be NULL). Set to CM_BREAK_REASON_FAILED on failure.
 /// \returns 0 for success, non zero code for error.
+/// \details When the machine ends the step having rejected an input (a manual yield with reason rx-rejected is
+/// pending), the root hash after the step recorded in the log header is the recorded revert root hash instead of
+/// the machine root hash.
 CM_API cm_error cm_log_step(cm_machine *m, uint64_t mcycle_count, const char *log_filename,
     cm_break_reason *break_reason);
 
@@ -887,10 +963,15 @@ CM_API cm_error cm_log_step_uarch(cm_machine *m, int32_t log_type, const char **
 /// \param log Receives the state access log as a JSON object in a string,
 /// guaranteed to remain valid only until the next CM_API function is called from the same thread.
 /// \returns 0 for success, non zero code for error.
+/// \details When the machine has rejected an input (a manual yield with reason rx-rejected is pending), the
+/// canonical state after the logged operation is the one recorded in the revert root hash, even though the
+/// physical machine only has its uarch reset.
 CM_API cm_error cm_log_reset_uarch(cm_machine *m, int32_t log_type, const char **log);
 
 /// \brief Sends a cmio response logging all accesses to the state.
 /// \param m Pointer to a non-empty machine object (holds a machine instance).
+/// \param revert_root_hash Machine root hash to revert to in case the response is eventually rejected.
+/// Unlike cm_send_cmio_response, it is not checked against the machine root hash.
 /// \param reason Reason for sending the response.
 /// \param data Response data to send.
 /// \param length Length of response data.
@@ -898,8 +979,13 @@ CM_API cm_error cm_log_reset_uarch(cm_machine *m, int32_t log_type, const char *
 /// \param log Receives the state access log as a JSON object in a string,
 /// guaranteed to remain valid only until the next CM_API function is called from the same thread.
 /// \returns 0 for success, non zero code for error.
-CM_API cm_error cm_log_send_cmio_response(cm_machine *m, uint16_t reason, const uint8_t *data, uint64_t length,
-    int32_t log_type, const char **log);
+/// \details The logged operation cannot fail, so the honest party can always prove the resulting
+/// state transition. It is a no-op that leaves the state unchanged when the machine is not waiting
+/// on a manual yield, when an advance-state response finds the machine yielded with a reason other
+/// than rx-accepted (e.g., it rejected an input or threw an exception), or when the response data
+/// does not fit in the rx buffer.
+CM_API cm_error cm_log_send_cmio_response(cm_machine *m, const cm_hash *revert_root_hash, uint16_t reason,
+    const uint8_t *data, uint64_t length, int32_t log_type, const char **log);
 
 // ------------------------------------
 // Verifying
@@ -935,6 +1021,7 @@ CM_API cm_error cm_verify_reset_uarch(const cm_machine *m, const cm_hash *root_h
 
 /// \brief Checks the validity of a state transition produced by cm_log_send_cmio_response.
 /// \param m Pointer to a machine object. Can be NULL (for local machines).
+/// \param revert_root_hash The revert root hash recorded when the log was generated.
 /// \param reason Reason for sending the response.
 /// \param data The response sent when the log was generated.
 /// \param length Length of response.
@@ -942,8 +1029,9 @@ CM_API cm_error cm_verify_reset_uarch(const cm_machine *m, const cm_hash *root_h
 /// \param log State access log to be verified as a JSON object in a string.
 /// \param root_hash_after State hash after response.
 /// \returns 0 for success, non zero code for error.
-CM_API cm_error cm_verify_send_cmio_response(const cm_machine *m, uint16_t reason, const uint8_t *data, uint64_t length,
-    const cm_hash *root_hash_before, const char *log, const cm_hash *root_hash_after);
+CM_API cm_error cm_verify_send_cmio_response(const cm_machine *m, const cm_hash *revert_root_hash, uint16_t reason,
+    const uint8_t *data, uint64_t length, const cm_hash *root_hash_before, const char *log,
+    const cm_hash *root_hash_after);
 
 // ------------------------------------
 // Integrity checking
diff --git a/src/collect-mcycle-hashes-state-access.hpp b/src/collect-mcycle-hashes-state-access.hpp
index a4f546709..c928bc459 100644
--- a/src/collect-mcycle-hashes-state-access.hpp
+++ b/src/collect-mcycle-hashes-state-access.hpp
@@ -496,8 +496,6 @@ class collect_mcycle_hashes_state_access :
         return m_m.get_host_addr(paddr, pma_index);
     }
 
-    void do_mark_dirty_page(host_addr /* haddr */, uint64_t /* pma_index */) const {}
-
     bool do_putchar(uint8_t c) const { // NOLINT(readability-convert-member-functions-to-static)
         return m_m.putchar(c);
     }
diff --git a/src/collect-uarch-cycle-hashes-state-access.hpp b/src/collect-uarch-cycle-hashes-state-access.hpp
index c418259c0..34e9bac67 100644
--- a/src/collect-uarch-cycle-hashes-state-access.hpp
+++ b/src/collect-uarch-cycle-hashes-state-access.hpp
@@ -122,12 +122,6 @@ class collect_uarch_cycle_hashes_state_access :
         return false;
     }
 
-    // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
-    void do_mark_dirty_page(uint64_t paddr, uint64_t pma_index) const {
-        (void) paddr;
-        (void) pma_index;
-    }
-
     // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
     constexpr const char *do_get_name() const {
         return "collect_uarch_cycle_hashes_state_access";
diff --git a/src/dtb.cpp b/src/dtb.cpp
index c31423129..7a8b5799e 100644
--- a/src/dtb.cpp
+++ b/src/dtb.cpp
@@ -106,6 +106,7 @@ void dtb_init(const machine_config &c, unsigned char *dtb_start, uint64_t dtb_le
                 fdt.prop_u32("clock-frequency", RTC_CLOCK_FREQ);
                 { // interrupt-controller
                     fdt.begin_node("interrupt-controller");
+                    fdt.prop_u32("#address-cells", 0);
                     fdt.prop_u32("#interrupt-cells", 1);
                     fdt.prop_empty("interrupt-controller");
                     fdt.prop_string("compatible", "riscv,cpu-intc");
diff --git a/src/hash-tree-hash.cpp b/src/hash-tree-hash.cpp
index 52c190678..23870097b 100644
--- a/src/hash-tree-hash.cpp
+++ b/src/hash-tree-hash.cpp
@@ -27,6 +27,7 @@
 
 #include "assert-printf.hpp"
 #include "back-merkle-tree.hpp"
+#include "hash-tree-constants.hpp"
 #include "i-hasher.hpp"
 #include "machine-hash.hpp"
 #include "unique-c-ptr.hpp"
@@ -171,7 +172,7 @@ The hash function used is Keccak-256.
   --input=<filename>                    default: reads from standard input
   Gives the input filename.
 
-  --log2-word-size=<integer>            default: 3
+  --log2-word-size=<integer>            default: %d
   (> 0 and <= 64)
   Number of bytes subintended by each word, i.e., the number of bytes in the
   input data from which each hash is computed.
@@ -186,14 +187,14 @@ The hash function used is Keccak-256.
   --help
   Prints this message and returns.
 )",
-        name);
+        name, cartesi::HASH_TREE_LOG2_WORD_SIZE);
     exit(0);
 }
 
 int main(int argc, char *argv[]) try {
     const char *input_name = nullptr;
     const char *hash_function_name = "keccak256";
-    int log2_word_size = 3;
+    int log2_word_size = cartesi::HASH_TREE_LOG2_WORD_SIZE;
     int log2_leaf_size = 12;
     int log2_root_size = 0;
     // Process command line arguments
diff --git a/src/i-accept-dirty-pages.hpp b/src/i-accept-dirty-pages.hpp
new file mode 100644
index 000000000..09ed14323
--- /dev/null
+++ b/src/i-accept-dirty-pages.hpp
@@ -0,0 +1,76 @@
+// Copyright Cartesi and individual authors (see AUTHORS)
+// SPDX-License-Identifier: LGPL-3.0-or-later
+//
+// This program is free software: you can redistribute it and/or modify it under
+// the terms of the GNU Lesser General Public License as published by the Free
+// Software Foundation, either version 3 of the License, or (at your option) any
+// later version.
+//
+// This program is distributed in the hope that it will be useful, but WITHOUT ANY
+// WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A
+// PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details.
+//
+// You should have received a copy of the GNU Lesser General Public License along
+// with this program (see COPYING). If not, see <https://www.gnu.org/licenses/>.
+//
+
+#ifndef I_ACCEPT_DIRTY_PAGES_HPP
+#define I_ACCEPT_DIRTY_PAGES_HPP
+
+/// \file
+/// \brief Accept dirty pages interface
+
+#include <cstdint>
+#include <type_traits>
+
+#include "meta.hpp"
+
+namespace cartesi {
+
+/// \class i_accept_dirty_pages
+/// \brief Interface for state access classes that must mark pages dirty explicitly.
+/// \tparam DERIVED Derived class implementing the interface. (An example of CRTP.)
+/// \details Only a state access with a deferred store needs this. The native
+/// state_access writes straight through the host pointer in do_write_memory_word
+/// without marking the page, so it relies on this explicit call (and the eviction
+/// marking in the machine) to keep the dirty page tree complete; record_step_state_access
+/// records that same deferral. Every other context marks or hashes each page at the
+/// moment of the write: native write_word marks dirty, and the microarchitecture
+/// record path hashes on the spot. This is why the microarchitecture does not accept
+/// dirty pages. If a batched microarchitecture write path were ever added, that
+/// assumption would no longer hold and this reasoning would need to be revisited.
+template <typename DERIVED>
+class i_accept_dirty_pages { // CRTP
+    i_accept_dirty_pages() = default; // private: only the befriended DERIVED can construct this base
+    friend DERIVED;
+
+    /// \brief Returns this object cast to the derived class
+    DERIVED &derived() {
+        return *static_cast<DERIVED *>(this);
+    }
+
+    /// \brief Returns this object cast to the derived class (const overload)
+    const DERIVED &derived() const {
+        return *static_cast<const DERIVED *>(this);
+    }
+
+public:
+    /// \brief Marks a page as dirty by forwarding to DERIVED::do_mark_dirty_page()
+    /// \param paddr Target physical address within page
+    /// \param pma_index Index of PMA where page falls
+    void mark_dirty_page(uint64_t paddr, uint64_t pma_index) const {
+        derived().do_mark_dirty_page(paddr, pma_index);
+    }
+};
+
+/// \brief SFINAE test implementation of the i_accept_dirty_pages interface
+template <typename DERIVED>
+using is_an_i_accept_dirty_pages =
+    std::integral_constant<bool, is_template_base_of_v<i_accept_dirty_pages, std::remove_cvref_t<DERIVED>>>;
+
+template <typename DERIVED>
+constexpr bool is_an_i_accept_dirty_pages_v = is_an_i_accept_dirty_pages<DERIVED>::value;
+
+} // namespace cartesi
+
+#endif
diff --git a/src/i-machine.hpp b/src/i-machine.hpp
index bf47875ec..fb8ffd9d3 100644
--- a/src/i-machine.hpp
+++ b/src/i-machine.hpp
@@ -139,6 +139,16 @@ class i_machine {
         return do_get_root_hash();
     }
 
+    /// \brief Reads the revert root hash from the shadow state.
+    machine_hash read_revert_root_hash() const {
+        return do_read_revert_root_hash();
+    }
+
+    /// \brief Writes the revert root hash to the shadow state.
+    void write_revert_root_hash(const_machine_hash_view hash) {
+        do_write_revert_root_hash(hash);
+    }
+
     /// \brief Obtains the root hash of the hash tree.
     machine_hash get_node_hash(uint64_t address, int log2_size) const {
         return do_get_node_hash(address, log2_size);
@@ -266,9 +276,12 @@ class i_machine {
 
     /// \brief Collects the root hashes after every \p uarch_cycle until \p mcycle_end machine cycle, implicitly
     /// resetting the uarch between mcycles.
-    uarch_cycle_root_hashes collect_uarch_cycle_root_hashes(uint64_t mcycle_end,
-        int32_t log2_bundle_uarch_cycle_count) {
-        return do_collect_uarch_cycle_root_hashes(mcycle_end, log2_bundle_uarch_cycle_count);
+    /// \details The \p revert_uarch_tail holds the root hashes after each uarch cycle of the period of the
+    /// machine the recorded revert root hash reverts to, the last entry being the revert root hash itself.
+    /// It is required unless the machine starts at a fixed point other than a rejected manual yield.
+    uarch_cycle_root_hashes collect_uarch_cycle_root_hashes(uint64_t mcycle_end, int32_t log2_bundle_uarch_cycle_count,
+        const machine_hashes &revert_uarch_tail = {}) {
+        return do_collect_uarch_cycle_root_hashes(mcycle_end, log2_bundle_uarch_cycle_count, revert_uarch_tail);
     }
 
     /// \brief Returns a list of descriptions for all PMA entries registered in the machine, sorted by start
@@ -277,14 +290,15 @@ class i_machine {
     }
 
     /// \brief Sends cmio response.
-    void send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length) {
-        do_send_cmio_response(reason, data, length);
+    void send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason, const unsigned char *data,
+        uint64_t length) {
+        do_send_cmio_response(revert_root_hash, reason, data, length);
     }
 
     /// \brief Sends cmio response and returns an access log
-    access_log log_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-        const access_log::type &log_type) {
-        return do_log_send_cmio_response(reason, data, length, log_type);
+    access_log log_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+        const unsigned char *data, uint64_t length, const access_log::type &log_type) {
+        return do_log_send_cmio_response(revert_root_hash, reason, data, length, log_type);
     }
 
     /// \brief Gets the address of any register
@@ -321,9 +335,10 @@ class i_machine {
     }
 
     /// \brief Checks the validity of state transitions caused by log_send_cmio_response.
-    void verify_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-        const machine_hash &root_hash_before, const access_log &log, const machine_hash &root_hash_after) const {
-        do_verify_send_cmio_response(reason, data, length, root_hash_before, log, root_hash_after);
+    void verify_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason, const unsigned char *data,
+        uint64_t length, const machine_hash &root_hash_before, const access_log &log,
+        const machine_hash &root_hash_after) const {
+        do_verify_send_cmio_response(revert_root_hash, reason, data, length, root_hash_before, log, root_hash_after);
     }
 
     /// \brief Checks if implementation is jsorpc-machine
@@ -348,6 +363,8 @@ class i_machine {
     virtual access_log do_log_step_uarch(const access_log::type &log_type) = 0;
     virtual hash_tree_proof do_get_proof(uint64_t address, int log2_target_size, int log2_root_size) const = 0;
     virtual machine_hash do_get_root_hash() const = 0;
+    virtual machine_hash do_read_revert_root_hash() const = 0;
+    virtual void do_write_revert_root_hash(const_machine_hash_view hash) = 0;
     virtual machine_hash do_get_node_hash(uint64_t address, int log2_size) const = 0;
     virtual uint64_t do_read_reg(reg r) const = 0;
     virtual void do_write_reg(reg w, uint64_t val) = 0;
@@ -370,11 +387,12 @@ class i_machine {
     virtual access_log do_log_reset_uarch(const access_log::type &log_type) = 0;
     virtual uarch_interpreter_break_reason do_run_uarch(uint64_t uarch_cycle_end) = 0;
     virtual uarch_cycle_root_hashes do_collect_uarch_cycle_root_hashes(uint64_t mcycle_end,
-        int32_t log2_bundle_uarch_cycle_count) = 0;
+        int32_t log2_bundle_uarch_cycle_count, const machine_hashes &revert_uarch_tail) = 0;
     virtual address_range_descriptions do_get_address_ranges() const = 0;
-    virtual void do_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length) = 0;
-    virtual access_log do_log_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-        const access_log::type &log_type) = 0;
+    virtual void do_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+        const unsigned char *data, uint64_t length) = 0;
+    virtual access_log do_log_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+        const unsigned char *data, uint64_t length, const access_log::type &log_type) = 0;
     virtual uint64_t do_get_reg_address(reg r) const = 0;
     virtual machine_config do_get_default_config() const = 0;
     virtual std::string do_get_address_name(uint64_t paddr) const = 0;
@@ -384,8 +402,9 @@ class i_machine {
         const machine_hash &root_hash_after) const = 0;
     virtual void do_verify_reset_uarch(const machine_hash &root_hash_before, const access_log &log,
         const machine_hash &root_hash_after) const = 0;
-    virtual void do_verify_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-        const machine_hash &root_hash_before, const access_log &log, const machine_hash &root_hash_after) const = 0;
+    virtual void do_verify_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+        const unsigned char *data, uint64_t length, const machine_hash &root_hash_before, const access_log &log,
+        const machine_hash &root_hash_after) const = 0;
     virtual bool do_verify_hash_tree() const = 0;
     virtual bool do_is_jsonrpc_machine() const {
         return false;
diff --git a/src/i-state-access.hpp b/src/i-state-access.hpp
index 104564356..ccbee878e 100644
--- a/src/i-state-access.hpp
+++ b/src/i-state-access.hpp
@@ -28,6 +28,7 @@
 #include "address-range.hpp"
 #include "assert-printf.hpp"
 #include "i-prefer-shadow-state.hpp"
+#include "machine-hash.hpp"
 #include "meta.hpp"
 #include "poor-type-name.hpp"
 #include "riscv-warl.hpp"
@@ -354,6 +355,18 @@ class i_state_access { // CRTP
         derived().do_write_memory_with_padding(paddr, data, data_length, write_length_log2_size);
     }
 
+    /// \brief Reads the revert root hash from the shadow state.
+    /// \returns The hash.
+    machine_hash read_revert_root_hash() const {
+        return derived().do_read_revert_root_hash();
+    }
+
+    /// \brief Writes the revert root hash to the shadow state.
+    /// \param hash View of hash data, one full hash tree leaf in size.
+    void write_revert_root_hash(const_machine_hash_view hash) const {
+        derived().do_write_revert_root_hash(hash);
+    }
+
     /// \brief Reads a word from memory.
     /// \tparam T Type of word to read, potentially unaligned.
     /// \tparam A Type to which \p paddr and \p faddr are known to be aligned.
@@ -465,18 +478,6 @@ class i_state_access { // CRTP
         return val;
     }
 
-    /// \brief Marks a page as dirty
-    /// \param faddr Implementation-defined fast address.
-    /// \param pma_index Index of PMA where page falls
-    /// \details When there is a host machine, the hash tree only updates the hashes for pages that
-    /// have been modified. Pages can only be written to if they appear in the write TLB. Therefore,
-    /// the hash tree only considers the pages that are currently in the write TLB and those that
-    /// have been marked dirty. When a page leaves the write TLB, it is marked dirty.
-    /// If the state belongs to a host machine, then this call MUST be forwarded to machine::mark_dirty_page();
-    void mark_dirty_page(fast_addr faddr, uint64_t pma_index) const {
-        derived().do_mark_dirty_page(faddr, pma_index);
-    }
-
     /// \brief Writes a character to the console
     /// \param c Character to output
     /// \returns True if console output should be flushed.
diff --git a/src/i-uarch-state-access.hpp b/src/i-uarch-state-access.hpp
index b22955b9e..a8df09b7d 100644
--- a/src/i-uarch-state-access.hpp
+++ b/src/i-uarch-state-access.hpp
@@ -136,6 +136,14 @@ class i_uarch_state_access { // CRTP
         return val;
     }
 
+    /// \brief Reverts the canonical machine state to the one whose root hash is recorded
+    /// in the revert root hash leaf of the shadow state.
+    /// \details Implementations that track a root hash read the leaf and replace it. The
+    /// others do nothing: the physical machine state does not revert.
+    void revert_state() const {
+        derived().do_revert_state();
+    }
+
     void write_word(uint64_t paddr, uint64_t val) const {
         derived().do_write_word(paddr, val);
         dusa_printf("%s::write_word(phys_addr{0x%" PRIx64 "}, %" PRIu64 "(0x%" PRIx64 "))\n", get_name(), paddr, val,
@@ -151,10 +159,6 @@ class i_uarch_state_access { // CRTP
         return derived().do_putchar(c);
     }
 
-    void mark_dirty_page(uint64_t paddr, uint64_t pma_index) const {
-        return derived().do_mark_dirty_page(paddr, pma_index);
-    }
-
     void write_tlb(TLB_set_index set_index, uint64_t slot_index, uint64_t vaddr_page, uint64_t vp_offset,
         uint64_t pma_index) const {
         derived().do_write_tlb(set_index, slot_index, vaddr_page, vp_offset, pma_index);
diff --git a/src/interpret.cpp b/src/interpret.cpp
index bf18d2791..97d7bae76 100644
--- a/src/interpret.cpp
+++ b/src/interpret.cpp
@@ -872,22 +872,9 @@ static FORCE_INLINE int32_t insn_get_C_SWSP_imm(uint32_t insn) {
 /// \param slot_index Slot index
 template <TLB_set_index SET, typename STATE_ACCESS>
 static void flush_tlb_slot(const STATE_ACCESS a, uint64_t slot_index) {
-    // Make sure a valid page leaving the write TLB is marked as dirty
-    // We must do this BEFORE we modify the TLB entries themselves
-    // (Otherwise, we could stop uarch before it marks the page dirty but after
-    // the entry is no longer in the TLB, which would cause the hash tree to
-    // miss a dirty page.)
-    if constexpr (SET == TLB_WRITE) {
-        auto old_vaddr_page = a.template read_tlb_vaddr_page<TLB_WRITE>(slot_index);
-        if (old_vaddr_page == TLB_UNVERIFIED_PAGE) {
-            old_vaddr_page = a.template init_hot_tlb_slot<TLB_WRITE>(slot_index);
-        }
-        if (old_vaddr_page != TLB_INVALID_PAGE) {
-            auto old_pma_index = a.template read_tlb_pma_index<TLB_WRITE>(slot_index);
-            const auto old_faddr_page = old_vaddr_page + a.template read_tlb_vf_offset<TLB_WRITE>(slot_index);
-            a.mark_dirty_page(old_faddr_page, old_pma_index);
-        }
-    }
+    // A valid page leaving the write TLB is marked dirty by the machine itself,
+    // inside write_verified_tlb/write_unverified_tlb, before the outgoing slot is
+    // overwritten. The interpreter no longer marks it here.
     // We do not leave garbage behind in empty slots
     // (It would make state access classes trickier to implement)
     const auto vaddr_page = TLB_INVALID_PAGE;
diff --git a/src/json-util.cpp b/src/json-util.cpp
index ad02fa279..b32df7b4f 100644
--- a/src/json-util.cpp
+++ b/src/json-util.cpp
@@ -1158,6 +1158,17 @@ template void ju_get_opt_field<uint64_t>(const nlohmann::json &j, const uint64_t
 template void ju_get_opt_field<std::string>(const nlohmann::json &j, const std::string &key, machine_hash &value,
     const std::string &path);
 
+template <typename K>
+void ju_get_opt_field(const nlohmann::json &j, const K &key, machine_hashes &value, const std::string &path) {
+    ju_get_opt_vector_like_field(j, key, value, path);
+}
+
+template void ju_get_opt_field<uint64_t>(const nlohmann::json &j, const uint64_t &key, machine_hashes &value,
+    const std::string &path);
+
+template void ju_get_opt_field<std::string>(const nlohmann::json &j, const std::string &key, machine_hashes &value,
+    const std::string &path);
+
 template <typename K>
 void ju_get_opt_field(const nlohmann::json &j, const K &key, not_default_constructible<hash_tree_proof> &value,
     const std::string &path) {
@@ -2050,6 +2061,14 @@ void ju_get_opt_field(const nlohmann::json &j, const K &key, address_range_descr
     ju_get_opt_field(jconfig, "length"s, value.length, new_path);
     ju_get_opt_field(jconfig, "start"s, value.start, new_path);
     ju_get_opt_field(jconfig, "description"s, value.description, new_path);
+    ju_get_opt_field(jconfig, "is_memory"s, value.is_memory, new_path);
+    ju_get_opt_field(jconfig, "is_device"s, value.is_device, new_path);
+    ju_get_opt_field(jconfig, "is_readable"s, value.is_readable, new_path);
+    ju_get_opt_field(jconfig, "is_writeable"s, value.is_writeable, new_path);
+    ju_get_opt_field(jconfig, "is_executable"s, value.is_executable, new_path);
+    ju_get_opt_field(jconfig, "is_read_idempotent"s, value.is_read_idempotent, new_path);
+    ju_get_opt_field(jconfig, "is_write_idempotent"s, value.is_write_idempotent, new_path);
+    ju_get_opt_field(jconfig, "driver_id"s, value.driver_id, new_path);
 }
 
 template void ju_get_opt_field<uint64_t>(const nlohmann::json &j, const uint64_t &key, address_range_description &value,
@@ -2512,7 +2531,11 @@ void to_json(nlohmann::json &j, const machine_runtime_config &runtime) {
 }
 
 void to_json(nlohmann::json &j, const address_range_description &mrd) {
-    j = nlohmann::json{{"length", mrd.length}, {"start", mrd.start}, {"description", mrd.description}};
+    j = nlohmann::json{{"length", mrd.length}, {"start", mrd.start}, {"description", mrd.description},
+        {"is_memory", mrd.is_memory}, {"is_device", mrd.is_device}, {"is_readable", mrd.is_readable},
+        {"is_writeable", mrd.is_writeable}, {"is_executable", mrd.is_executable},
+        {"is_read_idempotent", mrd.is_read_idempotent}, {"is_write_idempotent", mrd.is_write_idempotent},
+        {"driver_id", mrd.driver_id}};
 }
 
 void to_json(nlohmann::json &j, const address_range_descriptions &mrds) {
diff --git a/src/json-util.hpp b/src/json-util.hpp
index c8d4874bf..23a93ebc5 100644
--- a/src/json-util.hpp
+++ b/src/json-util.hpp
@@ -303,6 +303,16 @@ template <typename K>
 void ju_get_opt_field(const nlohmann::json &j, const K &key, std::optional<machine_hash> &optional,
     const std::string &path = "params/");
 
+/// \brief Attempts to load an array of hashes from a field in a JSON object
+/// \tparam K Key type (explicit extern declarations for uint64_t and std::string are provided)
+/// \param j JSON object to load from
+/// \param key Key to load value from
+/// \param value Object to store value
+/// \param path Path to j
+template <typename K>
+void ju_get_opt_field(const nlohmann::json &j, const K &key, machine_hashes &value,
+    const std::string &path = "params/");
+
 /// \brief Attempts to load a hash-tree proof object from a field in a JSON object
 /// \tparam K Key type (explicit extern declarations for uint64_t and std::string are provided)
 /// \param j JSON object to load from
@@ -879,6 +889,10 @@ extern template void ju_get_opt_field(const nlohmann::json &j, const uint64_t &k
     const std::string &base = "params/");
 extern template void ju_get_opt_field(const nlohmann::json &j, const std::string &key, machine_hash &value,
     const std::string &base = "params/");
+extern template void ju_get_opt_field(const nlohmann::json &j, const uint64_t &key, machine_hashes &value,
+    const std::string &base = "params/");
+extern template void ju_get_opt_field(const nlohmann::json &j, const std::string &key, machine_hashes &value,
+    const std::string &base = "params/");
 extern template void ju_get_opt_field(const nlohmann::json &j, const uint64_t &key,
     not_default_constructible<hash_tree_proof> &value, const std::string &base = "params/");
 extern template void ju_get_opt_field(const nlohmann::json &j, const std::string &key,
diff --git a/src/jsonrpc-discover.json b/src/jsonrpc-discover.json
index 72d4e63ff..cae89ff13 100644
--- a/src/jsonrpc-discover.json
+++ b/src/jsonrpc-discover.json
@@ -498,6 +498,39 @@
         }
       }
     },
+    {
+      "name": "machine.read_revert_root_hash",
+      "summary": "Reads the revert root hash from the shadow state",
+      "params": [],
+      "result": {
+        "name": "hash",
+        "description": "Revert root hash",
+        "schema": {
+          "$ref": "#/components/schemas/Base64Hash"
+        }
+      }
+    },
+    {
+      "name": "machine.write_revert_root_hash",
+      "summary": "Writes the revert root hash to the shadow state",
+      "params": [
+        {
+          "name": "hash",
+          "description": "Revert root hash to store",
+          "required": true,
+          "schema": {
+            "$ref": "#/components/schemas/Base64Hash"
+          }
+        }
+      ],
+      "result": {
+        "name": "result",
+        "description": "True on success",
+        "schema": {
+          "type": "boolean"
+        }
+      }
+    },
     {
       "name": "machine.get_proof",
       "summary": "Obtains a hash-tree proof for a range in the machine state",
@@ -1005,6 +1038,14 @@
       "name": "machine.send_cmio_response",
       "summary": "Sends cmio response.",
       "params": [
+        {
+          "name": "revert_root_hash",
+          "description": "Machine root hash to revert to in case the response is eventually rejected",
+          "required": true,
+          "schema": {
+            "$ref": "#/components/schemas/Base64Hash"
+          }
+        },
         {
           "name": "reason",
           "description": "Reason for sending response",
@@ -1034,6 +1075,14 @@
       "name": "machine.log_send_cmio_response",
       "summary": "Sends cmio response and returns an access log",
       "params": [
+        {
+          "name": "revert_root_hash",
+          "description": "Machine root hash to revert to in case the response is eventually rejected",
+          "required": true,
+          "schema": {
+            "$ref": "#/components/schemas/Base64Hash"
+          }
+        },
         {
           "name": "reason",
           "description": "Reason for sending response",
@@ -1071,6 +1120,14 @@
       "name": "machine.verify_send_cmio_response",
       "summary": "Verifies a state transition caused by log_send_cmio_response",
       "params": [
+        {
+          "name": "revert_root_hash",
+          "description": "The revert root hash recorded when the log was generated",
+          "required": true,
+          "schema": {
+            "$ref": "#/components/schemas/Base64Hash"
+          }
+        },
         {
           "name": "reason",
           "description": "Reason for sending response",
@@ -2478,6 +2535,30 @@
           },
           "description": {
             "type": "string"
+          },
+          "is_memory": {
+            "type": "boolean"
+          },
+          "is_device": {
+            "type": "boolean"
+          },
+          "is_readable": {
+            "type": "boolean"
+          },
+          "is_writeable": {
+            "type": "boolean"
+          },
+          "is_executable": {
+            "type": "boolean"
+          },
+          "is_read_idempotent": {
+            "type": "boolean"
+          },
+          "is_write_idempotent": {
+            "type": "boolean"
+          },
+          "driver_id": {
+            "$ref": "#/components/schemas/UnsignedInteger"
           }
         }
       },
diff --git a/src/jsonrpc-machine.cpp b/src/jsonrpc-machine.cpp
index 5da071068..9ed870ef2 100644
--- a/src/jsonrpc-machine.cpp
+++ b/src/jsonrpc-machine.cpp
@@ -807,6 +807,18 @@ machine_hash jsonrpc_machine::do_get_root_hash() const {
     return hash;
 }
 
+machine_hash jsonrpc_machine::do_read_revert_root_hash() const {
+    machine_hash hash;
+    request("machine.read_revert_root_hash", std::tie(), hash);
+    return hash;
+}
+
+void jsonrpc_machine::do_write_revert_root_hash(const_machine_hash_view hash) {
+    bool result{};
+    auto b64 = encode_base64(hash);
+    request("machine.write_revert_root_hash", std::tie(b64), result);
+}
+
 machine_hash jsonrpc_machine::do_get_node_hash(uint64_t address, int log2_size) const {
     machine_hash hash;
     request("machine.get_node_hash", std::tie(address, log2_size), hash);
@@ -871,9 +883,11 @@ uarch_interpreter_break_reason jsonrpc_machine::do_run_uarch(uint64_t uarch_cycl
 }
 
 uarch_cycle_root_hashes jsonrpc_machine::do_collect_uarch_cycle_root_hashes(uint64_t mcycle_end,
-    int32_t log2_bundle_uarch_cycle_count) {
+    int32_t log2_bundle_uarch_cycle_count, const machine_hashes &revert_uarch_tail) {
     uarch_cycle_root_hashes result;
-    request("machine.collect_uarch_cycle_root_hashes", std::tie(mcycle_end, log2_bundle_uarch_cycle_count), result);
+    const base64_machine_hashes b64_revert_uarch_tail(revert_uarch_tail);
+    request("machine.collect_uarch_cycle_root_hashes",
+        std::tie(mcycle_end, log2_bundle_uarch_cycle_count, b64_revert_uarch_tail), result);
     return result;
 }
 
@@ -883,17 +897,20 @@ address_range_descriptions jsonrpc_machine::do_get_address_ranges() const {
     return result;
 }
 
-void jsonrpc_machine::do_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length) {
+void jsonrpc_machine::do_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+    const unsigned char *data, uint64_t length) {
     bool result = false;
+    auto b64_revert_root_hash = encode_base64(revert_root_hash);
     std::string b64 = cartesi::encode_base64(std::span<const unsigned char>{data, length});
-    request("machine.send_cmio_response", std::tie(reason, b64), result);
+    request("machine.send_cmio_response", std::tie(b64_revert_root_hash, reason, b64), result);
 }
 
-access_log jsonrpc_machine::do_log_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-    const access_log::type &log_type) {
+access_log jsonrpc_machine::do_log_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+    const unsigned char *data, uint64_t length, const access_log::type &log_type) {
     not_default_constructible<access_log> result;
+    auto b64_revert_root_hash = encode_base64(revert_root_hash);
     std::string b64 = cartesi::encode_base64(std::span<const unsigned char>{data, length});
-    request("machine.log_send_cmio_response", std::tie(reason, b64, log_type), result);
+    request("machine.log_send_cmio_response", std::tie(b64_revert_root_hash, reason, b64, log_type), result);
     if (!result.has_value()) {
         throw std::runtime_error("jsonrpc server error: missing result");
     }
@@ -944,14 +961,16 @@ void jsonrpc_machine::do_verify_reset_uarch(const machine_hash &root_hash_before
     request("machine.verify_reset_uarch", std::tie(b64_root_hash_before, log, b64_root_hash_after), result);
 }
 
-void jsonrpc_machine::do_verify_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-    const machine_hash &root_hash_before, const access_log &log, const machine_hash &root_hash_after) const {
+void jsonrpc_machine::do_verify_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+    const unsigned char *data, uint64_t length, const machine_hash &root_hash_before, const access_log &log,
+    const machine_hash &root_hash_after) const {
     bool result = false;
+    auto b64_revert_root_hash = encode_base64(revert_root_hash);
     std::string b64_data = cartesi::encode_base64(std::span<const unsigned char>{data, length});
     auto b64_root_hash_before = encode_base64(root_hash_before);
     auto b64_root_hash_after = encode_base64(root_hash_after);
     request("machine.verify_send_cmio_response",
-        std::tie(reason, b64_data, b64_root_hash_before, log, b64_root_hash_after), result);
+        std::tie(b64_revert_root_hash, reason, b64_data, b64_root_hash_before, log, b64_root_hash_after), result);
 }
 
 bool jsonrpc_machine::do_is_jsonrpc_machine() const {
diff --git a/src/jsonrpc-machine.hpp b/src/jsonrpc-machine.hpp
index 2721ab790..408b5eabd 100644
--- a/src/jsonrpc-machine.hpp
+++ b/src/jsonrpc-machine.hpp
@@ -134,6 +134,8 @@ class jsonrpc_machine final : public i_machine {
     void do_reset_uarch() override;
     access_log do_log_reset_uarch(const access_log::type &log_type) override;
     machine_hash do_get_root_hash() const override;
+    machine_hash do_read_revert_root_hash() const override;
+    void do_write_revert_root_hash(const_machine_hash_view hash) override;
     machine_hash do_get_node_hash(uint64_t address, int log2_size) const override;
     hash_tree_proof do_get_proof(uint64_t address, int log2_target_size, int log2_root_size) const override;
     void do_replace_memory_range(const memory_range_config &new_range) override;
@@ -148,11 +150,12 @@ class jsonrpc_machine final : public i_machine {
     bool do_verify_hash_tree() const override;
     uarch_interpreter_break_reason do_run_uarch(uint64_t uarch_cycle_end) override;
     uarch_cycle_root_hashes do_collect_uarch_cycle_root_hashes(uint64_t mcycle_end,
-        int32_t log2_bundle_uarch_cycle_count) override;
+        int32_t log2_bundle_uarch_cycle_count, const machine_hashes &revert_uarch_tail) override;
     address_range_descriptions do_get_address_ranges() const override;
-    void do_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length) override;
-    access_log do_log_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-        const access_log::type &log_type) override;
+    void do_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason, const unsigned char *data,
+        uint64_t length) override;
+    access_log do_log_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+        const unsigned char *data, uint64_t length, const access_log::type &log_type) override;
     uint64_t do_get_reg_address(reg r) const override;
     machine_config do_get_default_config() const override;
     std::string do_get_address_name(uint64_t paddr) const override;
@@ -162,8 +165,8 @@ class jsonrpc_machine final : public i_machine {
         const machine_hash &root_hash_after) const override;
     void do_verify_reset_uarch(const machine_hash &root_hash_before, const access_log &log,
         const machine_hash &root_hash_after) const override;
-    void do_verify_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-        const machine_hash &root_hash_before, const access_log &log,
+    void do_verify_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+        const unsigned char *data, uint64_t length, const machine_hash &root_hash_before, const access_log &log,
         const machine_hash &root_hash_after) const override;
     bool do_is_jsonrpc_machine() const override;
 
diff --git a/src/jsonrpc-remote-machine.cpp b/src/jsonrpc-remote-machine.cpp
index 67b759fcc..d855c7fa5 100644
--- a/src/jsonrpc-remote-machine.cpp
+++ b/src/jsonrpc-remote-machine.cpp
@@ -121,6 +121,15 @@ static std::ostream &operator<<(std::ostream &out, log_prefix prefix) {
 using namespace std::string_literals;
 using json = nlohmann::json;
 
+/// \brief Formats a beast::error_code for log messages.
+/// \param ec Error code to format
+/// \returns ec.what() when the log level is debug or more verbose, ec.message() otherwise
+static std::string format_ec(const beast::error_code &ec) {
+    const bool verbose = slog::log_level(slog::level_operation::get) <= slog::severity_level::debug;
+    // what() carries Boost's source_location suffix, which is only useful when debugging
+    return verbose ? ec.what() : ec.message();
+}
+
 /// \brief Checks if uint64_t value can be converted to integer
 static int check_int(uint64_t val, const char *what) {
     if (val > INT_MAX) {
@@ -206,7 +215,7 @@ struct http_session : std::enable_shared_from_this<http_session> {
             return;
         }
         if (ec) { // Unexpected error
-            SLOG(error) << "read request error:" << ec.what();
+            SLOG(error) << "read request error: " << format_ec(ec);
             return;
         }
 
@@ -241,7 +250,7 @@ struct http_session : std::enable_shared_from_this<http_session> {
             return;
         }
         if (ec) { // Unexpected error
-            SLOG(error) << "send response error:" << ec.what();
+            SLOG(error) << "send response error: " << format_ec(ec);
             shutdown();
             return;
         }
@@ -368,7 +377,7 @@ struct http_handler : std::enable_shared_from_this<http_handler> {
             return;
         }
         if (ec) {
-            SLOG(error) << local_endpoint << " accept error: " << ec.what();
+            SLOG(error) << local_endpoint << " accept error: " << format_ec(ec);
             // If we can't accept, the listening socket is probably in a broken state,
             // close the acceptor so the client abort new connection attempts.
             // This may happen when amount of open files is reached.
@@ -971,12 +980,13 @@ static json jsonrpc_machine_collect_uarch_cycle_root_hashes(const json &j,
     if (!session->handler->machine) {
         return jsonrpc_response_invalid_request(j, "no machine");
     }
-    static const char *const param_name[] = {"mcycle_end", "log2_bundle_uarch_cycle_count"};
-    auto args = parse_args<uint64_t, uint64_t>(j, param_name);
+    static const char *const param_name[] = {"mcycle_end", "log2_bundle_uarch_cycle_count", "revert_uarch_tail"};
+    auto args = parse_args<uint64_t, uint64_t, cartesi::optional_param<cartesi::machine_hashes>>(j, param_name);
     auto mcycle_end = std::get<0>(args);
     auto log2_bundle_uarch_cycle_count = std::get<1>(args);
+    const auto revert_uarch_tail = std::get<2>(args).value_or(cartesi::machine_hashes{});
     const auto result = session->handler->machine->collect_uarch_cycle_root_hashes(mcycle_end,
-        static_cast<int>(log2_bundle_uarch_cycle_count));
+        static_cast<int>(log2_bundle_uarch_cycle_count), revert_uarch_tail);
     return jsonrpc_response_ok(j, result);
 }
 
@@ -1235,6 +1245,34 @@ static json jsonrpc_machine_get_root_hash_handler(const json &j, const std::shar
     return jsonrpc_response_ok(j, cartesi::base64_machine_hash(hash));
 }
 
+/// \brief JSONRPC handler for the machine.read_revert_root_hash method
+/// \param j JSON request object (validated by jsonrpc_check_no_params)
+/// \param session HTTP session whose handler holds the machine to query
+/// \returns JSON response with the base64 revert root hash, or an invalid-request response when no machine exists
+static json jsonrpc_machine_read_revert_root_hash_handler(const json &j, const std::shared_ptr<http_session> &session) {
+    if (!session->handler->machine) {
+        return jsonrpc_response_invalid_request(j, "no machine");
+    }
+    jsonrpc_check_no_params(j);
+    auto hash = session->handler->machine->read_revert_root_hash();
+    return jsonrpc_response_ok(j, cartesi::base64_machine_hash(hash));
+}
+
+/// \brief JSONRPC handler for the machine.write_revert_root_hash method
+/// \param j JSON request object, whose single parameter "hash" is parsed as a machine hash
+/// \param session HTTP session whose handler holds the machine to update
+/// \returns JSON ok response, or an invalid-request response when no machine exists
+static json jsonrpc_machine_write_revert_root_hash_handler(const json &j,
+    const std::shared_ptr<http_session> &session) {
+    if (!session->handler->machine) {
+        return jsonrpc_response_invalid_request(j, "no machine");
+    }
+    static const char *const param_name[] = {"hash"};
+    auto args = parse_args<cartesi::machine_hash>(j, param_name);
+    session->handler->machine->write_revert_root_hash(std::get<0>(args));
+    return jsonrpc_response_ok(j);
+}
+
 /// \brief JSONRPC handler for the machine.get_node_hash method
 /// \param j JSON request object
 /// \param session HTTP session
@@ -1571,12 +1609,13 @@ static json jsonrpc_machine_send_cmio_response_handler(const json &j, const std:
     if (!session->handler->machine) {
         return jsonrpc_response_invalid_request(j, "no machine");
     }
-    static const char *const param_name[] = {"reason", "data"};
-    auto args = parse_args<uint16_t, std::string>(j, param_name);
-    auto bin = cartesi::decode_base64(std::get<1>(args));
-    // NOLINTNEXTLINE(cppcoreguidelines-pro-type-reinterpret-cast)
-    session->handler->machine->send_cmio_response(std::get<0>(args), reinterpret_cast<unsigned char *>(bin.data()),
-        bin.size());
+    static const char *const param_name[] = {"revert_root_hash", "reason", "data"};
+    auto args = parse_args<cartesi::machine_hash, uint16_t, std::string>(j, param_name);
+    auto bin = cartesi::decode_base64(std::get<2>(args));
+    // NOLINTBEGIN(cppcoreguidelines-pro-type-reinterpret-cast)
+    session->handler->machine->send_cmio_response(std::get<0>(args), std::get<1>(args),
+        reinterpret_cast<unsigned char *>(bin.data()), bin.size());
+    // NOLINTEND(cppcoreguidelines-pro-type-reinterpret-cast)
     return jsonrpc_response_ok(j);
 }
 
@@ -1585,15 +1624,15 @@ static json jsonrpc_machine_log_send_cmio_response_handler(const json &j,
     if (!session->handler->machine) {
         return jsonrpc_response_invalid_request(j, "no machine");
     }
-    static const char *const param_name[] = {"reason", "data", "log_type"};
-    auto args =
-        parse_args<uint16_t, std::string, cartesi::not_default_constructible<cartesi::access_log::type>>(j, param_name);
-    auto bin = cartesi::decode_base64(std::get<1>(args));
+    static const char *const param_name[] = {"revert_root_hash", "reason", "data", "log_type"};
+    auto args = parse_args<cartesi::machine_hash, uint16_t, std::string,
+        cartesi::not_default_constructible<cartesi::access_log::type>>(j, param_name);
+    auto bin = cartesi::decode_base64(std::get<2>(args));
     // NOLINTBEGIN(bugprone-unchecked-optional-access)
     // NOLINTBEGIN(cppcoreguidelines-pro-type-reinterpret-cast)
     return jsonrpc_response_ok(j,
-        session->handler->machine->log_send_cmio_response(std::get<0>(args),
-            reinterpret_cast<unsigned char *>(bin.data()), bin.size(), std::get<2>(args).value()));
+        session->handler->machine->log_send_cmio_response(std::get<0>(args), std::get<1>(args),
+            reinterpret_cast<unsigned char *>(bin.data()), bin.size(), std::get<3>(args).value()));
     // NOLINTEND(cppcoreguidelines-pro-type-reinterpret-cast)
     // NOLINTEND(bugprone-unchecked-optional-access)
 }
@@ -1604,15 +1643,17 @@ static json jsonrpc_machine_log_send_cmio_response_handler(const json &j,
 /// \returns JSON response object
 static json jsonrpc_machine_verify_send_cmio_response_handler(const json &j,
     const std::shared_ptr<http_session> & /*session*/) {
-    static const char *const param_name[] = {"reason", "data", "root_hash_before", "log", "root_hash_after"};
-    auto args = parse_args<uint16_t, std::string, cartesi::machine_hash,
+    static const char *const param_name[] = {"revert_root_hash", "reason", "data", "root_hash_before", "log",
+        "root_hash_after"};
+    auto args = parse_args<cartesi::machine_hash, uint16_t, std::string, cartesi::machine_hash,
         cartesi::not_default_constructible<cartesi::access_log>, cartesi::machine_hash>(j, param_name);
 
-    auto bin = cartesi::decode_base64(std::get<1>(args));
+    auto bin = cartesi::decode_base64(std::get<2>(args));
     // NOLINTBEGIN(bugprone-unchecked-optional-access)
     // NOLINTBEGIN(cppcoreguidelines-pro-type-reinterpret-cast)
-    cartesi::machine::verify_send_cmio_response(std::get<0>(args), reinterpret_cast<unsigned char *>(bin.data()),
-        bin.size(), std::get<2>(args), std::get<3>(args).value(), std::get<4>(args));
+    cartesi::machine::verify_send_cmio_response(std::get<0>(args), std::get<1>(args),
+        reinterpret_cast<unsigned char *>(bin.data()), bin.size(), std::get<3>(args), std::get<4>(args).value(),
+        std::get<5>(args));
     // NOLINTEND(cppcoreguidelines-pro-type-reinterpret-cast)
     // NOLINTEND(bugprone-unchecked-optional-access)
     return jsonrpc_response_ok(j);
@@ -1689,6 +1730,8 @@ static json jsonrpc_dispatch_method(const json &j, const std::shared_ptr<http_se
         {"machine.get_node_hash", jsonrpc_machine_get_node_hash_handler},
         {"machine.get_proof", jsonrpc_machine_get_proof_handler},
         {"machine.get_root_hash", jsonrpc_machine_get_root_hash_handler},
+        {"machine.read_revert_root_hash", jsonrpc_machine_read_revert_root_hash_handler},
+        {"machine.write_revert_root_hash", jsonrpc_machine_write_revert_root_hash_handler},
         {"machine.read_word", jsonrpc_machine_read_word_handler},
         {"machine.write_word", jsonrpc_machine_write_word_handler},
         {"machine.read_memory", jsonrpc_machine_read_memory_handler},
diff --git a/src/local-machine.cpp b/src/local-machine.cpp
index efc2f9028..3147d4506 100644
--- a/src/local-machine.cpp
+++ b/src/local-machine.cpp
@@ -112,6 +112,14 @@ machine_hash local_machine::do_get_root_hash() const {
     return get_machine()->get_root_hash();
 }
 
+machine_hash local_machine::do_read_revert_root_hash() const {
+    return get_machine()->read_revert_root_hash();
+}
+
+void local_machine::do_write_revert_root_hash(const_machine_hash_view hash) {
+    get_machine()->write_revert_root_hash(hash);
+}
+
 machine_hash local_machine::do_get_node_hash(uint64_t address, int log2_size) const {
     return get_machine()->get_node_hash(address, log2_size);
 }
@@ -202,21 +210,22 @@ uarch_interpreter_break_reason local_machine::do_run_uarch(uint64_t uarch_cycle_
 }
 
 uarch_cycle_root_hashes local_machine::do_collect_uarch_cycle_root_hashes(uint64_t mcycle_end,
-    int32_t log2_bundle_uarch_cycle_count) {
-    return get_machine()->collect_uarch_cycle_root_hashes(mcycle_end, log2_bundle_uarch_cycle_count);
+    int32_t log2_bundle_uarch_cycle_count, const machine_hashes &revert_uarch_tail) {
+    return get_machine()->collect_uarch_cycle_root_hashes(mcycle_end, log2_bundle_uarch_cycle_count, revert_uarch_tail);
 }
 
 address_range_descriptions local_machine::do_get_address_ranges() const {
     return get_machine()->get_address_ranges();
 }
 
-void local_machine::do_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length) {
-    get_machine()->send_cmio_response(reason, data, length);
+void local_machine::do_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+    const unsigned char *data, uint64_t length) {
+    get_machine()->send_cmio_response(revert_root_hash, reason, data, length);
 }
 
-access_log local_machine::do_log_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-    const access_log::type &log_type) {
-    return get_machine()->log_send_cmio_response(reason, data, length, log_type);
+access_log local_machine::do_log_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+    const unsigned char *data, uint64_t length, const access_log::type &log_type) {
+    return get_machine()->log_send_cmio_response(revert_root_hash, reason, data, length, log_type);
 }
 
 uint64_t local_machine::do_get_reg_address(reg r) const {
@@ -246,9 +255,10 @@ void local_machine::do_verify_reset_uarch(const machine_hash &root_hash_before,
     machine::verify_reset_uarch(root_hash_before, log, root_hash_after);
 }
 
-void local_machine::do_verify_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-    const machine_hash &root_hash_before, const access_log &log, const machine_hash &root_hash_after) const {
-    machine::verify_send_cmio_response(reason, data, length, root_hash_before, log, root_hash_after);
+void local_machine::do_verify_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+    const unsigned char *data, uint64_t length, const machine_hash &root_hash_before, const access_log &log,
+    const machine_hash &root_hash_after) const {
+    machine::verify_send_cmio_response(revert_root_hash, reason, data, length, root_hash_before, log, root_hash_after);
 }
 
 } // namespace cartesi
diff --git a/src/local-machine.hpp b/src/local-machine.hpp
index 2476427c8..6f80a6aee 100644
--- a/src/local-machine.hpp
+++ b/src/local-machine.hpp
@@ -65,6 +65,8 @@ class local_machine final : public i_machine {
     access_log do_log_step_uarch(const access_log::type &log_type) override;
     hash_tree_proof do_get_proof(uint64_t address, int log2_target_size, int log2_root_size) const override;
     machine_hash do_get_root_hash() const override;
+    machine_hash do_read_revert_root_hash() const override;
+    void do_write_revert_root_hash(const_machine_hash_view hash) override;
     machine_hash do_get_node_hash(uint64_t address, int log2_size) const override;
     bool do_verify_hash_tree() const override;
     uint64_t do_read_reg(reg r) const override;
@@ -88,11 +90,12 @@ class local_machine final : public i_machine {
     access_log do_log_reset_uarch(const access_log::type &log_type) override;
     uarch_interpreter_break_reason do_run_uarch(uint64_t uarch_cycle_end) override;
     uarch_cycle_root_hashes do_collect_uarch_cycle_root_hashes(uint64_t mcycle_end,
-        int32_t log2_bundle_uarch_cycle_count) override;
+        int32_t log2_bundle_uarch_cycle_count, const machine_hashes &revert_uarch_tail) override;
     address_range_descriptions do_get_address_ranges() const override;
-    void do_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length) override;
-    access_log do_log_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-        const access_log::type &log_type) override;
+    void do_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason, const unsigned char *data,
+        uint64_t length) override;
+    access_log do_log_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+        const unsigned char *data, uint64_t length, const access_log::type &log_type) override;
     uint64_t do_get_reg_address(reg r) const override;
     machine_config do_get_default_config() const override;
     std::string do_get_address_name(uint64_t paddr) const override;
@@ -102,8 +105,8 @@ class local_machine final : public i_machine {
         const machine_hash &root_hash_after) const override;
     void do_verify_reset_uarch(const machine_hash &root_hash_before, const access_log &log,
         const machine_hash &root_hash_after) const override;
-    void do_verify_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-        const machine_hash &root_hash_before, const access_log &log,
+    void do_verify_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+        const unsigned char *data, uint64_t length, const machine_hash &root_hash_before, const access_log &log,
         const machine_hash &root_hash_after) const override;
 
     machine *get_machine();
diff --git a/src/machine-address-ranges.cpp b/src/machine-address-ranges.cpp
index d84111a35..bfaa037f8 100644
--- a/src/machine-address-ranges.cpp
+++ b/src/machine-address-ranges.cpp
@@ -331,7 +331,15 @@ machine_address_ranges::machine_address_ranges(const machine_config &config,
         m_all | std::views::filter([](auto &ar) { return !ar->is_empty(); }) | std::views::transform([](auto &ar) {
             return address_range_description{.start = ar->get_start(),
                 .length = ar->get_length(),
-                .description = ar->get_description()};
+                .description = ar->get_description(),
+                .is_memory = ar->is_memory(),
+                .is_device = ar->is_device(),
+                .is_readable = ar->is_readable(),
+                .is_writeable = ar->is_writeable(),
+                .is_executable = ar->is_executable(),
+                .is_read_idempotent = ar->is_read_idempotent(),
+                .is_write_idempotent = ar->is_write_idempotent(),
+                .driver_id = static_cast<uint64_t>(ar->get_driver_id())};
         });
     std::ranges::copy(src, std::back_inserter(m_descrs));
     std::ranges::sort(m_descrs, [](auto &a, auto &b) { return a.start < b.start; });
diff --git a/src/machine-config.cpp b/src/machine-config.cpp
index f9e274ba2..7d63af7c2 100644
--- a/src/machine-config.cpp
+++ b/src/machine-config.cpp
@@ -177,6 +177,44 @@ std::string machine_config::store(const std::string &dir, sharing_mode sharing)
     return name;
 }
 
+/// \brief Resolves every auto-detect length (all ones) in mrs to the size of the range's backing image file.
+/// Throws std::runtime_error, naming the range as what followed by its index, when that file name is empty.
+static void adjust_lengths(memory_range_configs &mrs, const std::string &what) {
+    for (int index = 0; auto &mr : mrs) {
+        const auto &image_filename = mr.backing_store.data_filename;
+        if (mr.length == UINT64_C(-1) && image_filename.empty()) {
+            throw std::runtime_error{
+                "unable to auto-detect length of "s + what + std::to_string(index) + " with empty image file"};
+        }
+        mr.length = (mr.length == UINT64_C(-1)) ? os::file_size(image_filename) : mr.length;
+        ++index;
+    }
+}
+
+/// \brief Places each range of mrs whose start is auto-detect (all ones) at the first address at or after start
+/// aligned to its length rounded up to a power of two. \returns start advanced past the ranges it placed.
+static uint64_t adjust_starts(uint64_t start, memory_range_configs &mrs, const std::string &what) {
+    for (int i = 0; auto &mr : mrs) {
+        if (mr.start == UINT64_C(-1)) {
+            // Round length to next power of two (std::bit_ceil is undefined if that needs more than 64 bits)
+            bool overflow = mr.length > (UINT64_C(1) << 63);
+            const uint64_t length_po2 = overflow ? UINT64_C(1) : std::bit_ceil(mr.length);
+            if (start % length_po2 != 0) { // Advance start to align it to rounded length
+                overflow = __builtin_add_overflow(start - (start % length_po2), length_po2, &start);
+            }
+            // The range takes the aligned start; the next candidate start lies just past its rounded length
+            const auto aligned_start = start;
+            if (overflow || __builtin_add_overflow(start, length_po2, &start)) {
+                throw std::runtime_error{
+                    "no address space to auto-detect start of "s.append(what).append(std::to_string(i))};
+            }
+            mr.start = aligned_start;
+        }
+        ++i;
+    }
+    return start;
+}
+
 machine_config &machine_config::adjust_defaults() {
     // Fill version registers
     if (processor.registers.marchid == UINT64_C(-1)) {
@@ -188,41 +226,12 @@ machine_config &machine_config::adjust_defaults() {
     if (processor.registers.mimpid == UINT64_C(-1)) {
         processor.registers.mimpid = MIMPID_INIT;
     }
-    // Auto detect flash drives and nvram start address and length
-    int i = 0; // NOLINT(misc-const-correctness)
-    int j = 0; // NOLINT(misc-const-correctness)
-    for (auto &f : flash_drive) {
-        const std::string flash_description = "flash drive "s + std::to_string(i);
-        // Auto detect flash drive start address
-        if (f.start == UINT64_C(-1)) {
-            f.start = AR_DRIVE_START + (AR_DRIVE_OFFSET * j);
-            ++j;
-        }
-        // Auto detect flash drive image length
-        if (f.length == UINT64_C(-1)) {
-            if (f.backing_store.data_filename.empty()) {
-                throw std::runtime_error{
-                    "unable to auto-detect length of "s.append(flash_description).append(" with empty image file")};
-            }
-            f.length = os::file_size(f.backing_store.data_filename);
-        }
-        ++i;
-    }
-    i = 0;
-    for (auto &n : nvram) {
-        const std::string nvram_description = "nvram "s + std::to_string(i);
-        if (n.start == UINT64_C(-1)) {
-            n.start = AR_DRIVE_START + (AR_DRIVE_OFFSET * j);
-            ++j;
-        }
-        if (n.length == UINT64_C(-1)) {
-            if (n.backing_store.data_filename.empty()) {
-                throw std::runtime_error{nvram_description + " has no length"s};
-            }
-            n.length = os::file_size(n.backing_store.data_filename);
-        }
-        ++i;
-    }
+    // Auto detect flash drives and nvram lengths
+    adjust_lengths(flash_drive, "flash drive ");
+    adjust_lengths(nvram, "nvram ");
+    // Auto detect starts
+    auto ram_length_po2 = std::bit_ceil(ram.length);
+    adjust_starts(adjust_starts(AR_RAM_START + ram_length_po2, flash_drive, "flash drive "), nvram, "nvram ");
     return *this;
 }
 
diff --git a/src/machine-config.hpp b/src/machine-config.hpp
index 0274ff1df..e8f084e26 100644
--- a/src/machine-config.hpp
+++ b/src/machine-config.hpp
@@ -79,10 +79,12 @@ struct ram_config final {
 };
 
 /// \brief Build default DTB bootargs from its parts
-#define DTB_BOOTARGS_CONSOLE "quiet earlycon=sbi console=hvc0 "
-#define DTB_BOOTARGS_UIO "uio_pdrv_genirq.of_id=generic-uio "
-#define DTB_BOOTARGS_ROOT "root=/dev/pmem0 rw init=/usr/sbin/cartesi-init"
-#define DTB_BOOTARGS_INIT (DTB_BOOTARGS_CONSOLE DTB_BOOTARGS_UIO DTB_BOOTARGS_ROOT)
+#define DTB_BOOTARGS_CONSOLE_PART "quiet earlycon=sbi console=hvc0 "
+#define DTB_BOOTARGS_UIO_PART "uio_pdrv_genirq.of_id=generic-uio "
+#define DTB_BOOTARGS_ROOT_PART "root=/dev/pmem0 rw "
+#define DTB_BOOTARGS_INIT_PART "init=/usr/sbin/cartesi-init"
+#define DTB_BOOTARGS_INIT                                                                                              \
+    (DTB_BOOTARGS_CONSOLE_PART DTB_BOOTARGS_UIO_PART DTB_BOOTARGS_ROOT_PART DTB_BOOTARGS_INIT_PART)
 
 /// \brief DTB state config
 struct dtb_config final {
diff --git a/src/machine-hash.hpp b/src/machine-hash.hpp
index c539040ba..4b19b2a5a 100644
--- a/src/machine-hash.hpp
+++ b/src/machine-hash.hpp
@@ -23,7 +23,8 @@
 #include <array>
 #include <cstddef>
 #include <span>
-#ifndef ZKARCHITECTURE
+// std::vector is not available in freestanding builds
+#if !defined(NO_STD_VECTOR)
 #include <vector>
 #endif
 
@@ -33,7 +34,7 @@ static constexpr size_t MACHINE_HASH_SIZE = 32;
 using machine_hash = std::array<unsigned char, MACHINE_HASH_SIZE>;
 using machine_hash_view = std::span<unsigned char, MACHINE_HASH_SIZE>;
 using const_machine_hash_view = std::span<const unsigned char, MACHINE_HASH_SIZE>;
-#ifndef ZKARCHITECTURE
+#if !defined(NO_STD_VECTOR)
 using machine_hashes = std::vector<machine_hash>;
 #endif
 
diff --git a/src/machine.cpp b/src/machine.cpp
index 06e69af74..1a26a26e3 100644
--- a/src/machine.cpp
+++ b/src/machine.cpp
@@ -65,6 +65,7 @@
 #include "processor-state.hpp"
 #include "record-send-cmio-state-access.hpp"
 #include "record-step-state-access.hpp"
+#include "rejected-manual-yield.hpp"
 #include "replay-send-cmio-state-access.hpp"
 #include "replay-step-state-access.hpp"
 #include "riscv-constants.hpp"
@@ -1462,25 +1463,29 @@ uint64_t machine::get_reg_address(reg r) {
     throw std::domain_error{"invalid register"};
 }
 
-void machine::mark_write_tlb_dirty_pages() const {
-    for (uint64_t slot_index = 0; slot_index < TLB_SET_SIZE; ++slot_index) {
-        auto vaddr_page = m_s->penumbra.tlb[TLB_WRITE][slot_index].vaddr_page;
-        if (vaddr_page == TLB_UNVERIFIED_PAGE) {
-            vaddr_page = init_hot_tlb_slot(TLB_WRITE, slot_index);
+void machine::mark_write_tlb_dirty_page(uint64_t slot_index) const {
+    auto vaddr_page = m_s->penumbra.tlb[TLB_WRITE][slot_index].vaddr_page;
+    if (vaddr_page == TLB_UNVERIFIED_PAGE) {
+        vaddr_page = init_hot_tlb_slot(TLB_WRITE, slot_index);
+    }
+    if (vaddr_page != TLB_INVALID_PAGE) {
+        const auto &shadow_slot = m_s->shadow.tlb[TLB_WRITE][slot_index];
+        // NOLINTNEXTLINE(cppcoreguidelines-pro-type-const-cast)
+        auto &ar = const_cast<address_range &>(read_pma(shadow_slot.pma_index));
+        if (!ar.is_memory()) {
+            throw std::runtime_error{"could not mark dirty page for a TLB entry: TLB is corrupt"};
         }
-        if (vaddr_page != TLB_INVALID_PAGE) {
-            const auto &shadow_slot = m_s->shadow.tlb[TLB_WRITE][slot_index];
-            // NOLINTNEXTLINE(cppcoreguidelines-pro-type-const-cast)
-            auto &ar = const_cast<address_range &>(read_pma(shadow_slot.pma_index));
-            if (!ar.is_memory()) {
-                throw std::runtime_error{"could not mark dirty page for a TLB entry: TLB is corrupt"};
-            }
-            auto paddr_page = vaddr_page + shadow_slot.vp_offset;
-            if (!ar.contains_absolute(paddr_page, AR_PAGE_SIZE)) {
-                throw std::runtime_error{"could not mark dirty page for a TLB entry: TLB is corrupt"};
-            }
-            ar.get_dirty_page_tree().mark_dirty_page_and_up(paddr_page - ar.get_start());
+        auto paddr_page = vaddr_page + shadow_slot.vp_offset;
+        if (!ar.contains_absolute(paddr_page, AR_PAGE_SIZE)) {
+            throw std::runtime_error{"could not mark dirty page for a TLB entry: TLB is corrupt"};
         }
+        ar.get_dirty_page_tree().mark_dirty_page_and_up(paddr_page - ar.get_start());
+    }
+}
+
+void machine::mark_write_tlb_dirty_pages() const {
+    for (uint64_t slot_index = 0; slot_index < TLB_SET_SIZE; ++slot_index) {
+        mark_write_tlb_dirty_page(slot_index);
     }
 }
 
@@ -1497,6 +1502,14 @@ machine_hash machine::get_root_hash() const {
     return m_ht.get_root_hash();
 }
 
+machine_hash machine::read_revert_root_hash() const {
+    return m_s->shadow.revert_root_hash;
+}
+
+void machine::write_revert_root_hash(const_machine_hash_view hash) {
+    std::ranges::copy(hash, m_s->shadow.revert_root_hash.begin());
+}
+
 std::string machine::get_address_name(uint64_t paddr) {
     if (paddr >= AR_UARCH_RAM_START && paddr - AR_UARCH_RAM_START < AR_UARCH_RAM_LENGTH) {
         return "uarch.ram";
@@ -1681,6 +1694,9 @@ void machine::write_memory(uint64_t paddr, const unsigned char *data, uint64_t l
         // Overwrite the processor shadow state with the provided data
         static_assert(AR_SHADOW_STATE_LENGTH == sizeof(m_s->shadow));
         // NOLINTNEXTLINE(cppcoreguidelines-pro-type-reinterpret-cast)
+        // Make sure we marked as dirty whatever pages were in the write TLB
+        mark_write_tlb_dirty_pages();
+        // Overwrite shadow
         memcpy(reinterpret_cast<unsigned char *>(&m_s->shadow), data, sizeof(m_s->shadow));
         // Reinitialize the hot TLB to reflect changes in the shadow TLB
         init_hot_tlb_contents();
@@ -1875,13 +1891,45 @@ void machine::write_word(uint64_t paddr, uint64_t val) {
     ar.get_dirty_page_tree().mark_dirty_page_and_up(offset);
 }
 
-void machine::send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length) {
+void machine::check_pending_cmio_request(const_machine_hash_view revert_root_hash, uint16_t reason,
+    uint64_t length) const {
+    // Host-facing precondition check: throws std::invalid_argument when the response must be refused.
+    // The core send_cmio_response cannot fail. It turns detected failures into no-ops, so the
+    // honest party can always log and prove the resulting state transition. This check runs
+    // before any state changes, so a failed call leaves the machine unchanged.
+    if (read_reg(reg::iflags_Y) == 0) {
+        throw std::invalid_argument{"iflags.Y is not set"};
+    }
+    if (length > AR_CMIO_RX_BUFFER_LENGTH) {
+        throw std::invalid_argument{"CMIO response data is too large"};
+    }
+    // Only advance-state responses are checked further. They are the input boundary of the
+    // rollups flow, whose revert-on-reject scheme depends on the preconditions below.
+    // Inspect-state queries and GIO responses get no further checks.
+    if (reason != HTIF_YIELD_REASON_ADVANCE_STATE) {
+        return;
+    }
+    // The machine must be waiting for an input on an rx-accepted manual yield.
+    if (read_reg(reg::htif_tohost_dev) != HTIF_DEV_YIELD || read_reg(reg::htif_tohost_cmd) != HTIF_YIELD_CMD_MANUAL ||
+        read_reg(reg::htif_tohost_reason) != HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED) {
+        throw std::invalid_argument{"machine is not waiting on an rx-accepted manual yield"};
+    }
+    // The revert root hash supplied by the caller must equal the current root hash of the machine
+    // about to receive the input, i.e. the state a rejection later reverts to.
+    if (!std::ranges::equal(revert_root_hash, get_root_hash())) {
+        throw std::invalid_argument{"revert root hash does not match the machine root hash"};
+    }
+}
+
+void machine::send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason, const unsigned char *data,
+    uint64_t length) {
+    check_pending_cmio_request(revert_root_hash, reason, length);
     const state_access a(*this);
-    cartesi::send_cmio_response(a, reason, data, length);
+    cartesi::send_cmio_response(a, revert_root_hash, reason, data, length);
 }
 
-access_log machine::log_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-    const access_log::type &log_type) {
+access_log machine::log_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+    const unsigned char *data, uint64_t length, const access_log::type &log_type) {
     if (m_c.hash_tree.hash_function != hash_function_type::keccak256) {
         throw std::runtime_error{
             "access logs can only be used with hash tree configured with Keccak-256 hash function"};
@@ -1892,23 +1940,24 @@ access_log machine::log_send_cmio_response(uint16_t reason, const unsigned char
     const record_send_cmio_state_access a(*this, log);
     {
         [[maybe_unused]] auto note = a.make_scoped_note("send_cmio_response");
-        cartesi::send_cmio_response(a, reason, data, length);
+        cartesi::send_cmio_response(a, revert_root_hash, reason, data, length);
     }
     auto root_hash_after = get_root_hash();
-    verify_send_cmio_response(reason, data, length, root_hash_before, log, root_hash_after);
+    verify_send_cmio_response(revert_root_hash, reason, data, length, root_hash_before, log, root_hash_after);
     return log;
 }
 
-void machine::verify_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-    const machine_hash &root_hash_before, const access_log &log, const machine_hash &root_hash_after) {
+void machine::verify_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+    const unsigned char *data, uint64_t length, const_machine_hash_view root_hash_before, const access_log &log,
+    const_machine_hash_view root_hash_after) {
     replay_send_cmio_state_access::context context{log, root_hash_before, hash_function_type::keccak256};
     // Verify all intermediate state transitions
     replay_send_cmio_state_access a(context);
-    cartesi::send_cmio_response(a, reason, data, length);
+    cartesi::send_cmio_response(a, revert_root_hash, reason, data, length); // replayed on the log-backed access
     a.finish();
     // Make sure the access log ends at the same root hash as the state
     auto obtained_root_hash = a.get_root_hash();
-    if (obtained_root_hash != root_hash_after) {
+    if (!std::ranges::equal(obtained_root_hash, root_hash_after)) {
         throw std::invalid_argument{"mismatch in root hash after replay"};
     }
 }
@@ -1940,18 +1989,19 @@ access_log machine::log_reset_uarch(const access_log::type &log_type) {
     const machine_hash root_hash_before = get_root_hash();
     // Call uarch_reset_state with a uarch_record_state_access object
     access_log log(log_type);
-    uarch_record_state_access a(*this, log);
+    uarch_record_state_access::context context;
+    uarch_record_state_access a(context, *this, log);
     {
         [[maybe_unused]] auto note = a.make_scoped_note("reset_uarch_state");
         uarch_reset_state(a);
     }
-    const auto root_hash_after = get_root_hash();
-    verify_reset_uarch(root_hash_before, log, root_hash_after);
+    // context.root_hash_after holds the revert root hash when the reset reverted the state
+    verify_reset_uarch(root_hash_before, log, context.root_hash_after);
     return log;
 }
 
-void machine::verify_reset_uarch(const machine_hash &root_hash_before, const access_log &log,
-    const machine_hash &root_hash_after) {
+void machine::verify_reset_uarch(const_machine_hash_view root_hash_before, const access_log &log,
+    const_machine_hash_view root_hash_after) {
     // Verify all intermediate state transitions
     uarch_replay_state_access::context context{log, root_hash_before};
     uarch_replay_state_access a(context);
@@ -1959,7 +2009,7 @@ void machine::verify_reset_uarch(const machine_hash &root_hash_before, const acc
     a.finish();
     // Make sure the access log ends at the same root hash as the state
     const machine_hash obtained_root_hash = a.get_root_hash();
-    if (obtained_root_hash != root_hash_after) {
+    if (!std::ranges::equal(obtained_root_hash, root_hash_after)) {
         throw std::invalid_argument{"mismatch in root hash after replay"};
     }
 }
@@ -1978,7 +2028,8 @@ access_log machine::log_step_uarch(const access_log::type &log_type) {
     auto root_hash_before = get_root_hash();
     access_log log(log_type);
     // Call interpret with a logged state access object
-    const uarch_record_state_access a(*this, log);
+    uarch_record_state_access::context context;
+    const uarch_record_state_access a(context, *this, log);
     {
         [[maybe_unused]] auto note = a.make_scoped_note("step");
         uarch_step(a);
@@ -1992,8 +2043,8 @@ access_log machine::log_step_uarch(const access_log::type &log_type) {
 // Declaration of explicit instantiation in module uarch-step.cpp
 extern template UArchStepStatus uarch_step(uarch_replay_state_access &a);
 
-void machine::verify_step_uarch(const machine_hash &root_hash_before, const access_log &log,
-    const machine_hash &root_hash_after) {
+void machine::verify_step_uarch(const_machine_hash_view root_hash_before, const access_log &log,
+    const_machine_hash_view root_hash_after) {
     // Verify all intermediate state transitions
     uarch_replay_state_access::context context{log, root_hash_before};
     uarch_replay_state_access a(context);
@@ -2001,7 +2052,7 @@ void machine::verify_step_uarch(const machine_hash &root_hash_before, const acce
     a.finish();
     // Make sure the access log ends at the same root hash as the state
     auto obtained_root_hash = a.get_root_hash();
-    if (obtained_root_hash != root_hash_after) {
+    if (!std::ranges::equal(obtained_root_hash, root_hash_after)) {
         throw std::invalid_argument{"mismatch in root hash after replay"};
     }
 }
@@ -2057,21 +2108,24 @@ interpreter_break_reason machine::log_step(uint64_t mcycle_count, const std::str
     record_step_state_access a(context, *this);
     const uint64_t mcycle_end = saturating_add(a.read_mcycle(), mcycle_count);
     auto break_reason = interpret(a, mcycle_end);
-    auto root_hash_after = get_root_hash();
+    // When the machine has rejected an input, the canonical root hash after the step is
+    // the recorded revert root hash
+    const state_access sa(*this);
+    const auto root_hash_after = is_rejected_manual_yield(sa) ? read_revert_root_hash() : get_root_hash();
     a.finish(root_hash_before, mcycle_count, root_hash_after);
     verify_step(root_hash_before, filename, mcycle_count, root_hash_after);
     return break_reason;
 }
 
-interpreter_break_reason machine::verify_step(const machine_hash &root_hash_before, const std::string &filename,
-    uint64_t mcycle_count, const machine_hash &root_hash_after) {
+interpreter_break_reason machine::verify_step(const_machine_hash_view root_hash_before, const std::string &filename,
+    uint64_t mcycle_count, const_machine_hash_view root_hash_after) {
     auto data_length = os::file_size(filename);
     auto mapped_data = os::mapped_memory(data_length, os::mapped_memory_flags{}, filename);
     replay_step_state_access::context context;
     // Constructor reads log header, validates computed initial hash == logged initial hash
     replay_step_state_access a(context, mapped_data.get_ptr(), data_length);
     // logged initial hash matches computed initial hash
-    if (context.logged_root_hash_before != root_hash_before) {
+    if (!std::ranges::equal(context.logged_root_hash_before, root_hash_before)) {
         throw std::runtime_error("root hash before mismatch: argument does not match step log header");
     }
     if (context.logged_mcycle_count != mcycle_count) {
@@ -2080,7 +2134,7 @@ interpreter_break_reason machine::verify_step(const machine_hash &root_hash_befo
     const uint64_t mcycle_end = saturating_add(a.read_mcycle(), context.logged_mcycle_count);
     auto break_reason = interpret(a, mcycle_end);
     a.finish(); // validates computed final hash == logged final hash
-    if (context.logged_root_hash_after != root_hash_after) {
+    if (!std::ranges::equal(context.logged_root_hash_after, root_hash_after)) {
         throw std::runtime_error("root hash after mismatch: argument does not match step log header");
     }
     return break_reason;
@@ -2244,6 +2298,7 @@ mcycle_root_hashes machine::collect_mcycle_root_hashes(uint64_t mcycle_end, uint
     uint64_t mcycle_target = saturating_add(mcycle_start, mcycle_period - mcycle_phase, mcycle_end);
     uint64_t mcycle_reached = read_reg(reg::mcycle);
     bool at_fixed_point = false;
+    machine_hash root_hash{};
 
     // Run until reaching next mcycle target
     while (mcycle_reached < mcycle_target) {
@@ -2291,8 +2346,13 @@ mcycle_root_hashes machine::collect_mcycle_root_hashes(uint64_t mcycle_end, uint
         // Add the current root hash to the back tree whenever we reach a period boundary or a fixed point
         // This ensures we only append at the correct intervals, even when mcycle_end does not align with the period
         if (result.mcycle_phase == 0 || at_fixed_point) {
+            // When the machine has rejected an input, the canonical root hash from the yield onward
+            // is the recorded revert root hash
+            const state_access sa(*this);
+            root_hash = is_rejected_manual_yield(sa) ? read_revert_root_hash() : m_ht.get_root_hash();
+
             // Append root hash relative to this period to the result
-            back_tree.push_back(m_ht.get_root_hash());
+            back_tree.push_back(root_hash);
 
             // When back tree is full, we can append the bundled root hash and reset it
             if (back_tree.full()) {
@@ -2313,9 +2373,9 @@ mcycle_root_hashes machine::collect_mcycle_root_hashes(uint64_t mcycle_end, uint
 
     // If the machine yielded manually or halted, then append bundled root hashes with padding
     if (at_fixed_point && log2_bundle_mcycle_count > 0) {
-        // Construct pad tree containing repetitions of the current root hash
-        const auto pad_hashes = back_merkle_tree::make_pad_hashes(m_ht.get_root_hash(), log2_bundle_mcycle_count,
-            m_c.hash_tree.hash_function);
+        // Construct pad tree containing repetitions of the last collected root hash
+        const auto pad_hashes =
+            back_merkle_tree::make_pad_hashes(root_hash, log2_bundle_mcycle_count, m_c.hash_tree.hash_function);
 
         // Pad back tree when partially filled and append its bundled root hash
         if (!back_tree.empty()) {
@@ -2337,8 +2397,78 @@ mcycle_root_hashes machine::collect_mcycle_root_hashes(uint64_t mcycle_end, uint
     return result;
 }
 
+/// \brief Pushes the root hash after one uarch cycle into the back tree, flushing the bundle once it is full.
+/// \param result Collection result whose hashes receive the bundled root hash of each full back tree.
+/// \param back_tree Back tree accumulating the root hashes of the current bundle.
+/// \param cycle_root_hash Root hash after the uarch cycle.
+static void append_uarch_cycle_root_hash(uarch_cycle_root_hashes &result, back_merkle_tree &back_tree,
+    const machine_hash &cycle_root_hash) {
+    back_tree.push_back(cycle_root_hash);
+
+    // When back tree is full, we can append the bundled root hash and reset it
+    if (back_tree.full()) {
+        result.hashes.emplace_back(back_tree.get_root_hash());
+        back_tree.clear();
+    }
+}
+
+/// \brief Appends the root hash after the uarch reset that ends one mcycle and records its index in the result.
+/// \param result Collection result receiving hashes and bundled root hashes.
+/// \param back_tree Back tree bundling the root hashes.
+/// \param log2_bundle_uarch_cycle_count Log base 2 of the amount of uarch cycle root hashes to bundle.
+/// \param halt_root_hash Root hash after the uarch halted, padding the bundles up to the reset entry.
+/// \param reset_root_hash Root hash after the uarch reset.
+static void append_uarch_reset_root_hash(uarch_cycle_root_hashes &result, back_merkle_tree &back_tree,
+    int32_t log2_bundle_uarch_cycle_count, const machine_hash &halt_root_hash, const machine_hash &reset_root_hash) {
+    if (log2_bundle_uarch_cycle_count > 0) {
+        const auto halt_pad_hashes = back_merkle_tree::make_pad_hashes(halt_root_hash, log2_bundle_uarch_cycle_count,
+            back_tree.get_hash_function());
+
+        // Pad back tree when partially filled and then append its bundled root hash
+        if (!back_tree.empty()) {
+            assert(!back_tree.full());
+            back_tree.pad_back(back_tree.get_remaining_leaf_count(), halt_pad_hashes);
+            result.hashes.emplace_back(back_tree.get_root_hash());
+            back_tree.clear();
+        }
+
+        // Append bundled root hash containing only repetitions of the halt root hash
+        result.hashes.emplace_back(halt_pad_hashes[log2_bundle_uarch_cycle_count]);
+
+        // Append bundled root hash containing repetitions of the halt root hash on the left and one reset
+        // root hash on the right (the leaf count is computed in 64 bits so large bundles cannot overflow int)
+        assert(back_tree.empty());
+        back_tree.pad_back((UINT64_C(1) << log2_bundle_uarch_cycle_count) - 1, halt_pad_hashes);
+        back_tree.push_back(reset_root_hash);
+        assert(back_tree.full());
+        result.hashes.emplace_back(back_tree.get_root_hash());
+        back_tree.clear();
+    } else {
+        result.hashes.push_back(reset_root_hash);
+    }
+
+    // Add the index where reset happened
+    result.reset_indices.emplace_back(result.hashes.size() - 1);
+}
+
+/// \brief Appends the period of the reverted machine to the collection result.
+/// \param result Collection result receiving hashes and bundled root hashes.
+/// \param back_tree Back tree bundling the root hashes.
+/// \param log2_bundle_uarch_cycle_count Log base 2 of the amount of uarch cycle root hashes to bundle.
+/// \param revert_uarch_tail Root hashes after each uarch cycle of the reverted machine period, the last
+/// being the revert root hash itself, which is the reset entry of the period. Needs at least two entries.
+static void append_revert_uarch_tail_period(uarch_cycle_root_hashes &result, back_merkle_tree &back_tree,
+    int32_t log2_bundle_uarch_cycle_count, const machine_hashes &revert_uarch_tail) {
+    assert(revert_uarch_tail.size() >= 2); // needs a halt entry and a reset entry
+    for (size_t i = 0; i + 1 < revert_uarch_tail.size(); ++i) { // every entry but the last is a cycle hash
+        append_uarch_cycle_root_hash(result, back_tree, revert_uarch_tail[i]);
+    }
+    append_uarch_reset_root_hash(result, back_tree, log2_bundle_uarch_cycle_count,
+        revert_uarch_tail[revert_uarch_tail.size() - 2], revert_uarch_tail.back());
+}
+
 uarch_cycle_root_hashes machine::collect_uarch_cycle_root_hashes(uint64_t mcycle_end,
-    int32_t log2_bundle_uarch_cycle_count) {
+    int32_t log2_bundle_uarch_cycle_count, const machine_hashes &revert_uarch_tail) {
     const uint64_t mcycle_start = read_reg(reg::mcycle);
 
     // Check preconditions
@@ -2362,6 +2492,28 @@ uarch_cycle_root_hashes machine::collect_uarch_cycle_root_hashes(uint64_t mcycle
         throw std::runtime_error{"microarchitecture is not reset"};
     }
 
+    // A call that can execute instructions may end in a rejected manual yield, and a call on a
+    // machine already in that state must emit the period of the reverted machine. Both need the
+    // revert uarch tail, which is checked here, before anything executes, so a failed call
+    // leaves the machine unchanged and can be retried with the tail in hand. A call starting at
+    // any other fixed point can only perform a no-op mcycle that cannot reject, so it never
+    // consumes the tail.
+    const state_access sa(*this);
+    const bool start_rejected = is_rejected_manual_yield(sa);
+    const bool start_at_fixed_point =
+        read_reg(reg::iflags_H) != 0 || read_reg(reg::iflags_Y) != 0 || mcycle_start == UINT64_MAX;
+    if (start_rejected || !start_at_fixed_point) {
+        if (revert_uarch_tail.empty()) {
+            throw std::runtime_error{"revert uarch tail is required"};
+        }
+        if (revert_uarch_tail.size() < 2) {
+            throw std::runtime_error{"revert uarch tail is too short"};
+        }
+        if (revert_uarch_tail.back() != read_revert_root_hash()) {
+            throw std::runtime_error{"revert uarch tail does not end with the revert root hash"};
+        }
+    }
+
     // If the collection loop does not advance mcycle, set the break reason to indicate the target mcycle was reached
     uarch_cycle_root_hashes result;
     result.break_reason = interpreter_break_reason::reached_target_mcycle;
@@ -2369,15 +2521,26 @@ uarch_cycle_root_hashes machine::collect_uarch_cycle_root_hashes(uint64_t mcycle
     // Initialize back tree
     back_merkle_tree back_tree(log2_bundle_uarch_cycle_count, m_c.hash_tree.hash_function);
 
+    // When the machine has already rejected an input, the canonical timeline continues from the
+    // reverted machine, so the result is its period, taken from the revert uarch tail, and the
+    // machine is left untouched
+    if (start_rejected) {
+        append_revert_uarch_tail_period(result, back_tree, log2_bundle_uarch_cycle_count, revert_uarch_tail);
+        result.break_reason = interpreter_break_reason::yielded_manually;
+        assert(back_tree.empty());
+        return result;
+    }
+
     hash_tree::dirty_words_type reset_dirty_words;
     collect_uarch_cycle_hashes_state_access::context context{};
     const collect_uarch_cycle_hashes_state_access a(context, *this);
 
     // Reserve space before entering the loop to minimize dynamic memory allocations,
-    // the reserved sizes below are based on empirical benchmarks to balance performance and memory usage
+    // the reserved sizes below are based on empirical benchmarks to balance performance and memory usage,
+    // and are clamped to avoid over-allocation
     const uint64_t mcycle_count = mcycle_end - mcycle_start;
-    result.hashes.reserve(mcycle_count * 512);
-    result.reset_indices.reserve(mcycle_count);
+    result.hashes.reserve(std::clamp<uint64_t>(mcycle_count * 512, 1, 16384));
+    result.reset_indices.reserve(std::clamp<uint64_t>(mcycle_count, 1, 16384));
     context.dirty_words.reserve(8);
     reset_dirty_words.reserve(64);
 
@@ -2386,8 +2549,8 @@ uarch_cycle_root_hashes machine::collect_uarch_cycle_root_hashes(uint64_t mcycle
     uint64_t mcycle_target = saturating_add(mcycle_start, UINT64_C(1), mcycle_end);
     uint64_t mcycle_reached = read_reg(reg::mcycle);
 
-    // In case we start at fixed point, we will attempt to execute one extra mcycle which
-    bool at_fixed_point = read_reg(reg::iflags_H) != 0 || read_reg(reg::iflags_Y) != 0 || mcycle_start == UINT64_MAX;
+    // In case we start at fixed point, we will attempt to execute one extra mcycle
+    bool at_fixed_point = start_at_fixed_point;
     if (at_fixed_point) {
         mcycle_target = mcycle_reached;
     }
@@ -2434,13 +2597,7 @@ uarch_cycle_root_hashes machine::collect_uarch_cycle_root_hashes(uint64_t mcycle
             assert(uarch_break_reason == uarch_interpreter_break_reason::reached_target_cycle);
 
             // Append root hash to the result
-            back_tree.push_back(m_ht.get_root_hash());
-
-            // When back tree is full, we can append the bundled root hash and reset it
-            if (back_tree.full()) {
-                result.hashes.emplace_back(back_tree.get_root_hash());
-                back_tree.clear();
-            }
+            append_uarch_cycle_root_hash(result, back_tree, m_ht.get_root_hash());
         }
 
         // Sanity check to ensure the loop is working correctly, this should always be true
@@ -2476,41 +2633,14 @@ uarch_cycle_root_hashes machine::collect_uarch_cycle_root_hashes(uint64_t mcycle
             throw std::runtime_error{"update hash tree failed"};
         }
         reset_dirty_words.clear();
-        const auto reset_root_hash = m_ht.get_root_hash();
-
-        // Add one hash after the uarch reset
-        if (log2_bundle_uarch_cycle_count > 0) {
-            const auto halt_pad_hashes = back_merkle_tree::make_pad_hashes(halt_root_hash,
-                log2_bundle_uarch_cycle_count, m_c.hash_tree.hash_function);
-
-            // Pad back tree when partially filled and then append its bundled root hash
-            if (!back_tree.empty()) {
-                assert(!back_tree.full());
-                back_tree.pad_back(back_tree.get_remaining_leaf_count(), halt_pad_hashes);
-                result.hashes.emplace_back(back_tree.get_root_hash());
-                back_tree.clear();
-            }
 
-            // Append bundled root hash containing only repetitions of the halt root hash
-            result.hashes.emplace_back(halt_pad_hashes[log2_bundle_uarch_cycle_count]);
+        // When the machine has rejected an input, the reset folds in a revert, and the canonical
+        // root hash after it is the recorded revert root hash
+        const bool rejected = is_rejected_manual_yield(sa);
+        const auto reset_root_hash = rejected ? read_revert_root_hash() : m_ht.get_root_hash();
 
-            // Append bundled root hash containing repetitions of the halt root hash on the left
-            // and one reset root hash on the right
-            assert(back_tree.empty());
-            back_tree.pad_back((1 << log2_bundle_uarch_cycle_count) - 1, halt_pad_hashes);
-            back_tree.push_back(reset_root_hash);
-            assert(back_tree.full());
-            result.hashes.emplace_back(back_tree.get_root_hash());
-            back_tree.clear();
-
-            // Add the index where reset happened
-            result.reset_indices.emplace_back(result.hashes.size() - 1);
-        } else {
-            result.hashes.push_back(reset_root_hash);
-
-            // Add the index where reset happened
-            result.reset_indices.emplace_back(result.hashes.size() - 1);
-        }
+        // Add one hash after the uarch reset
+        append_uarch_reset_root_hash(result, back_tree, log2_bundle_uarch_cycle_count, halt_root_hash, reset_root_hash);
 
         mcycle_reached = read_reg(reg::mcycle);
 
@@ -2527,6 +2657,14 @@ uarch_cycle_root_hashes machine::collect_uarch_cycle_root_hashes(uint64_t mcycle
             break;
         }
 
+        // When the machine has rejected an input, the canonical timeline continues from the
+        // reverted machine, so the period that follows comes from the revert uarch tail
+        // instead of the machine itself
+        if (rejected) {
+            append_revert_uarch_tail_period(result, back_tree, log2_bundle_uarch_cycle_count, revert_uarch_tail);
+            break;
+        }
+
         // If we already attempted to advance one mcycle over a fixed point, we are done
         if (at_fixed_point) {
             break;
diff --git a/src/machine.hpp b/src/machine.hpp
index 9c616a002..9783e302f 100644
--- a/src/machine.hpp
+++ b/src/machine.hpp
@@ -126,6 +126,16 @@ class machine final {
     /// \details The counter is key is the concatenation of \p domain with \p name.
     static std::string get_counter_key(const char *name, const char *domain = nullptr);
 
+    /// \brief Checks that the machine can receive a cmio response with the given revert root hash.
+    /// \param revert_root_hash Machine root hash to revert to in case the response is eventually rejected.
+    /// \param reason Reason for sending the response.
+    /// \param length Length of response data.
+    /// \details Throws when the machine is not waiting on a manual yield or when the response data
+    /// does not fit in the rx buffer. For advance-state responses, also throws when the machine is
+    /// not waiting on an rx-accepted manual yield or when \p revert_root_hash differs from the
+    /// machine root hash. Called by send_cmio_response before any state changes.
+    void check_pending_cmio_request(const_machine_hash_view revert_root_hash, uint16_t reason, uint64_t length) const;
+
     /// \brief Checks if the machine has VirtIO devices.
     /// \returns True if at least one VirtIO device is present.
     bool has_virtio_devices() const;
@@ -231,6 +241,9 @@ class machine final {
     /// Stores into result.back_tree the back tree context to continue collecting bundled root hashes.
     /// \detail The first hash added to \p result.hashes is the root hash after (\p mcycle_period - \p mcycle_phase)
     /// machine cycles (if the function managed to get that far before returning).
+    /// When the machine stops on a manual yield whose reason is rx-rejected, the root hash collected at the
+    /// yield and the padding that follows are substituted by the recorded revert root hash, which is the root
+    /// hash verifiers accept for these state transitions.
     mcycle_root_hashes collect_mcycle_root_hashes(uint64_t mcycle_end, uint64_t mcycle_period, uint64_t mcycle_phase,
         int32_t log2_bundle_mcycle_count, const std::optional<back_merkle_tree> &previous_back_tree = {});
 
@@ -245,8 +258,8 @@ class machine final {
     /// \param log_filename Name of the file containing the log.
     /// \param mcycle_count Number of mcycles the machine was run for.
     /// \param root_hash_after Hash of the state after the step.
-    static interpreter_break_reason verify_step(const machine_hash &root_hash_before, const std::string &log_filename,
-        uint64_t mcycle_count, const machine_hash &root_hash_after);
+    static interpreter_break_reason verify_step(const_machine_hash_view root_hash_before,
+        const std::string &log_filename, uint64_t mcycle_count, const_machine_hash_view root_hash_after);
 
     /// \brief Runs the machine in the microarchitecture until the mcycles advances by one unit or the micro cycle
     /// counter (uarch_cycle) reaches uarch_cycle_end
@@ -257,6 +270,11 @@ class machine final {
     /// the machine yields, or halts. Implicitly resetting the uarch between mcycles.
     /// \param mcycle_end End machine cycle value to execute, uarch cycle by uarch cycle.
     /// \param log2_bundle_uarch_cycle_count Log base 2 of the amount of uarch cycle root hashes to bundle.
+    /// \param revert_uarch_tail Root hashes after each uarch cycle of the period of the machine the recorded
+    /// revert root hash reverts to, the last entry being the revert root hash itself (the reset entry of that
+    /// period). It is obtained by calling this function with no bundling on that machine, while it waits for
+    /// a response. Required unless the machine starts at a fixed point other than a rejected manual yield,
+    /// in which case the call cannot consume it and ignores it.
     /// \returns The collected uarch cycle root hashes.
     /// Stores into result.hashes the root hashes after each uarch cycle.
     /// Stores into result.reset_indices the indices of the root hashes after each implicit uarch reset
@@ -264,7 +282,11 @@ class machine final {
     /// Stores into result.break_reason the reason why the function returned.
     /// \detail The first hash added to \p result.hashes is the root hash after the first uarch cycle, the last is the
     /// root hash at the time function returns (for whatever reason), which always happens right after an uarch reset.
-    uarch_cycle_root_hashes collect_uarch_cycle_root_hashes(uint64_t mcycle_end, int32_t log2_bundle_uarch_cycle_count);
+    /// When the machine ends in a manual yield whose reason is rx-rejected, the root hash after the final uarch
+    /// reset is substituted by the recorded revert root hash, and one extra period, that of the reverted machine
+    /// as given by \p revert_uarch_tail, is collected after it.
+    uarch_cycle_root_hashes collect_uarch_cycle_root_hashes(uint64_t mcycle_end, int32_t log2_bundle_uarch_cycle_count,
+        const machine_hashes &revert_uarch_tail = {});
 
     /// \brief Advances one micro step and returns a state access log.
     /// \param log_type Type of access log to generate.
@@ -278,21 +300,25 @@ class machine final {
     /// \param log_type Type of access log to generate.
     /// \param log_data If true, access data is recorded in the log, otherwise only hashes. The default is false.
     /// \returns The state access log.
+    /// \details When the machine has rejected an input (a manual yield with reason rx-rejected is pending),
+    /// the canonical state after the logged operation is the one recorded in the revert root hash, even
+    /// though the physical machine only has its uarch reset.
     access_log log_reset_uarch(const access_log::type &log_type);
 
     /// \brief Checks the validity of a state transition caused by log_step_uarch.
     /// \param root_hash_before State hash before step.
     /// \param log Step state access log.
     /// \param root_hash_after State hash after step.
-    static void verify_step_uarch(const machine_hash &root_hash_before, const access_log &log,
-        const machine_hash &root_hash_after);
+    static void verify_step_uarch(const_machine_hash_view root_hash_before, const access_log &log,
+        const_machine_hash_view root_hash_after);
 
     /// \brief Checks the validity of a state transition caused by log_reset_uarch.
     /// \param root_hash_before State hash before uarch reset
     /// \param log Step state access log.
-    /// \param root_hash_after State hash after uarch reset.
-    static void verify_reset_uarch(const machine_hash &root_hash_before, const access_log &log,
-        const machine_hash &root_hash_after);
+    /// \param root_hash_after State hash after uarch reset. When the machine has rejected an input,
+    /// this is the recorded revert root hash.
+    static void verify_reset_uarch(const_machine_hash_view root_hash_before, const access_log &log,
+        const_machine_hash_view root_hash_after);
 
     /// \brief Returns copy of default machine config
     static machine_config get_default_config();
@@ -396,6 +422,14 @@ class machine final {
     /// \returns The hash.
     machine_hash get_root_hash() const;
 
+    /// \brief Reads the revert root hash from the shadow state.
+    /// \returns The hash.
+    machine_hash read_revert_root_hash() const;
+
+    /// \brief Writes the revert root hash to the shadow state.
+    /// \param hash Hash to store.
+    void write_revert_root_hash(const_machine_hash_view hash);
+
     /// \brief Obtains the hash of a node in the hash-tree.
     /// \param address Address of target node. Must be aligned to a 2<sup>log2_size</sup> boundary.
     /// \param log2_size log<sub>2</sub> of size subintended by target node.
@@ -516,6 +550,10 @@ class machine final {
         return const_cast<address_range &>(std::as_const(*this).read_pma(index));
     }
 
+    /// \brief Mark as dirty the page currently mapped by a write TLB slot, if any.
+    /// \param slot_index Index of the write TLB slot to inspect.
+    void mark_write_tlb_dirty_page(uint64_t slot_index) const;
+
     /// \brief Go over the write TLB and mark as dirty all pages currently there.
     void mark_write_tlb_dirty_pages() const;
 
@@ -537,10 +575,15 @@ class machine final {
     void replace_memory_range(const memory_range_config &config);
 
     /// \brief Sends cmio response
+    /// \param revert_root_hash Machine root hash to revert to in case the response is eventually rejected.
+    /// For advance-state responses, it must be the root hash of the machine itself, and the machine must be
+    /// waiting on an rx-accepted manual yield, both checked before any state changes. Other responses
+    /// (inspect-state queries and GIO responses) are only checked for a pending manual yield and data length.
     /// \param reason Reason for sending response.
     /// \param data Response data.
     /// \param length Length of response data.
-    void send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length);
+    void send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason, const unsigned char *data,
+        uint64_t length);
 
     /// \brief Converts from machine host address to target physical address
     /// \param haddr Machine host address to convert
@@ -561,15 +604,7 @@ class machine final {
     }
 
     /// \brief Marks a page as dirty
-    /// \param haddr Machine host address within page
-    /// \param pma_index Index of PMA where address falls
-    void mark_dirty_page(host_addr haddr, uint64_t pma_index) {
-        auto paddr = get_paddr(haddr, pma_index);
-        mark_dirty_page(paddr, pma_index);
-    }
-
-    /// \brief Marks a page as dirty
-    /// \param paddr Target phyislcal address within page
+    /// \param paddr Target physical address within page
     /// \param pma_index Index of PMA where address falls
     void mark_dirty_page(uint64_t paddr, uint64_t pma_index) {
         auto &ar = read_pma(pma_index);
@@ -584,6 +619,10 @@ class machine final {
     /// \param pma_index Index of PMA where address falls
     void write_verified_tlb(TLB_set_index set_index, uint64_t slot_index, uint64_t vaddr_page, host_addr vh_offset,
         uint64_t pma_index) {
+        // Mark the page currently mapped here dirty before we overwrite the slot
+        if (set_index == TLB_WRITE) {
+            mark_write_tlb_dirty_page(slot_index);
+        }
         m_s->penumbra.tlb[set_index][slot_index].vaddr_page = vaddr_page;
         m_s->penumbra.tlb[set_index][slot_index].vh_offset = vh_offset;
         m_s->shadow.tlb[set_index][slot_index].vaddr_page = vaddr_page;
@@ -607,6 +646,10 @@ class machine final {
         if (slot_index >= TLB_SET_SIZE) {
             throw std::out_of_range{"TLB slot index out of bounds"};
         }
+        // Mark the page currently mapped here dirty before we overwrite the slot
+        if (set_index == TLB_WRITE) {
+            mark_write_tlb_dirty_page(slot_index);
+        }
         m_s->penumbra.tlb[set_index][slot_index].vaddr_page = TLB_UNVERIFIED_PAGE;
         m_s->penumbra.tlb[set_index][slot_index].vh_offset = host_addr{0};
         m_s->shadow.tlb[set_index][slot_index].vaddr_page = vaddr_page;
@@ -642,23 +685,32 @@ class machine final {
     }
 
     /// \brief Sends cmio response and returns an access log
+    /// \param revert_root_hash Machine root hash to revert to in case the response is eventually rejected.
+    /// Unlike send_cmio_response, it is not checked against the machine root hash.
     /// \param reason Reason for sending response.
     /// \param data Response data.
     /// \param length Length of response data.
     /// \param log_type Type of access log to generate.
     /// \return The state access log.
-    access_log log_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-        const access_log::type &log_type);
+    /// \details The logged operation cannot fail, so the honest party can always prove the resulting
+    /// state transition. It is a no-op that leaves the state unchanged when the machine is not waiting
+    /// on a manual yield, when an advance-state response finds the machine yielded with a reason other
+    /// than rx-accepted (e.g., it rejected an input or threw an exception), or when the response data
+    /// does not fit in the rx buffer.
+    access_log log_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+        const unsigned char *data, uint64_t length, const access_log::type &log_type);
 
     /// \brief Checks the validity of state transitions caused by log_send_cmio_response.
+    /// \param revert_root_hash The revert root hash recorded when the log was generated.
     /// \param reason Reason for sending response.
     /// \param data The response sent when the log was generated.
     /// \param length Length of response
     /// \param root_hash_before State hash before response was sent.
     /// \param log Log containing the state accesses performed by the load operation
     /// \param root_hash_after State hash after response was sent.
-    static void verify_send_cmio_response(uint16_t reason, const unsigned char *data, uint64_t length,
-        const machine_hash &root_hash_before, const access_log &log, const machine_hash &root_hash_after);
+    static void verify_send_cmio_response(const_machine_hash_view revert_root_hash, uint16_t reason,
+        const unsigned char *data, uint64_t length, const_machine_hash_view root_hash_before, const access_log &log,
+        const_machine_hash_view root_hash_after);
 
     /// \brief Returns a description of what is at a given target physical address
     /// \param paddr Target physical address of interest
diff --git a/src/pmas-constants.hpp b/src/pmas-constants.hpp
index 84d208932..a421c2b0b 100644
--- a/src/pmas-constants.hpp
+++ b/src/pmas-constants.hpp
@@ -54,7 +54,7 @@ enum PMA_ISTART_masks : uint64_t {
     PMA_ISTART_START_MASK = UINT64_C(-1) << PMA_ISTART_START_SHIFT ///< Start of range
 };
 
-/// \brief PMA device ids
+/// \brief PMA driver ids
 enum class PMA_ISTART_DID : uint8_t {
     empty = PMA_EMPTY_DID_DEF,                           ///< DID for empty range
     memory = PMA_MEMORY_DID_DEF,                         ///< DID for memory
diff --git a/src/pmas-defines.h b/src/pmas-defines.h
index 11a9fa905..a5caa3561 100644
--- a/src/pmas-defines.h
+++ b/src/pmas-defines.h
@@ -20,18 +20,18 @@
 
 #define PMA_MAX_DEF 32 ///< Maximum number of PMAs
 
-#define PMA_EMPTY_DID_DEF 0              ///< Device ID for empty range
-#define PMA_MEMORY_DID_DEF 1             ///< Device ID for memory
-#define PMA_SHADOW_STATE_DID_DEF 2       ///< Device ID for shadow state device
-#define PMA_FLASH_DRIVE_DID_DEF 3        ///< Device ID for flash drive device
-#define PMA_CLINT_DID_DEF 4              ///< Device ID for CLINT device
-#define PMA_HTIF_DID_DEF 5               ///< Device ID for HTIF device
-#define PMA_PLIC_DID_DEF 6               ///< Device ID for PLIC device
-#define PMA_CMIO_RX_BUFFER_DID_DEF 7     ///< Device ID for cmio RX buffer
-#define PMA_CMIO_TX_BUFFER_DID_DEF 8     ///< Device ID for cmio TX buffer
-#define PMA_SHADOW_UARCH_STATE_DID_DEF 9 ///< Device ID for uarch shadow state device
-#define PMA_VIRTIO_DID_DEF 10            ///< Device ID for VirtIO devices
-#define PMA_NVRAM_DID_DEF 11             ///< Device ID for NVRAM
+#define PMA_EMPTY_DID_DEF 0              ///< Driver ID for empty range
+#define PMA_MEMORY_DID_DEF 1             ///< Driver ID for memory
+#define PMA_SHADOW_STATE_DID_DEF 2       ///< Driver ID for shadow state device
+#define PMA_FLASH_DRIVE_DID_DEF 3        ///< Driver ID for flash drive device
+#define PMA_CLINT_DID_DEF 4              ///< Driver ID for CLINT device
+#define PMA_HTIF_DID_DEF 5               ///< Driver ID for HTIF device
+#define PMA_PLIC_DID_DEF 6               ///< Driver ID for PLIC device
+#define PMA_CMIO_RX_BUFFER_DID_DEF 7     ///< Driver ID for cmio RX buffer
+#define PMA_CMIO_TX_BUFFER_DID_DEF 8     ///< Driver ID for cmio TX buffer
+#define PMA_SHADOW_UARCH_STATE_DID_DEF 9 ///< Driver ID for uarch shadow state device
+#define PMA_VIRTIO_DID_DEF 10            ///< Driver ID for VirtIO devices
+#define PMA_NVRAM_DID_DEF 11             ///< Driver ID for NVRAM
 
 // helper for using UINT64_C with defines
 #ifndef EXPAND_UINT64_C
diff --git a/src/record-send-cmio-state-access.hpp b/src/record-send-cmio-state-access.hpp
index b731a35f8..962b95c42 100644
--- a/src/record-send-cmio-state-access.hpp
+++ b/src/record-send-cmio-state-access.hpp
@@ -26,6 +26,7 @@
 #include <utility>
 
 #include "access-log.hpp"
+#include "address-range-constants.hpp"
 #include "assert-printf.hpp"
 #include "hash-tree-constants.hpp"
 #include "host-addr.hpp"
@@ -182,28 +183,14 @@ class record_send_cmio_state_access :
         update_after_write(paligned);
     }
 
-    // -----
-    // i_state_access interface implementation
-    // -----
-    friend i_state_access<record_send_cmio_state_access>;
-
-    void do_write_iflags_Y(uint64_t val) const {
-        log_before_write_write_and_update(machine_reg_address(machine_reg::iflags_Y),
-            m_m.get_state().shadow.registers.iflags.Y, val, "iflags.Y");
-    }
-
-    uint64_t do_read_iflags_Y() const {
-        log_read(machine_reg_address(machine_reg::iflags_Y), "iflags.Y");
-        return m_m.get_state().shadow.registers.iflags.Y;
-    }
-
-    void do_write_htif_fromhost(uint64_t val) const {
-        log_before_write_write_and_update(machine_reg_address(machine_reg::htif_fromhost),
-            m_m.get_state().shadow.registers.htif.fromhost, val, "htif.fromhost");
-    }
-
-    void do_write_memory_with_padding(uint64_t paddr, const unsigned char *data, uint64_t data_length,
-        int write_length_log2_size) const {
+    /// \brief Logs a zero-padded write of a data buffer to memory, performs the write, and updates the hash tree.
+    /// \param paddr Destination physical address.
+    /// \param data Pointer to source data buffer.
+    /// \param data_length Length of data buffer.
+    /// \param write_length_log2_size Log2 size of the total write length.
+    /// \param text Textual description of the access.
+    void log_write_memory_with_padding(uint64_t paddr, const unsigned char *data, uint64_t data_length,
+        int write_length_log2_size, const char *text) const {
         if ((paddr & (HASH_TREE_WORD_SIZE - 1)) != 0) {
             throw std::invalid_argument("paddr is not aligned to tree leaf size");
         }
@@ -231,9 +218,10 @@ class record_send_cmio_state_access :
         auto proof = m_m.get_proof(paddr, write_length_log2_size);
         // log hash and data before write
         a.set_read_hash(proof.get_target_hash());
+        const auto offset = paddr - ar.get_start();
         if (m_log.get_log_type().has_large_data()) {
-            access_data &data = a.get_read().emplace(write_length);
-            memcpy(data.data(), ar.get_host_memory(), write_length);
+            access_data &read_data = a.get_read().emplace(write_length);
+            memcpy(read_data.data(), ar.get_host_memory() + offset, write_length);
         }
 
         // We just store the sibling hashes in the access because this is the only missing piece of data needed to
@@ -253,16 +241,50 @@ class record_send_cmio_state_access :
         // NOLINTBEGIN(bugprone-unchecked-optional-access)
         a.get_written_hash().emplace();
         variant_hasher h(m_m.get_hash_function());
-        const auto offset = paddr - ar.get_start();
         get_merkle_tree_hash(h,
             std::span<const unsigned char>{ar.get_host_memory() + offset, static_cast<size_t>(write_length)},
             HASH_TREE_WORD_SIZE, a.get_written_hash().value());
         if (m_log.get_log_type().has_large_data()) {
-            access_data &data = a.get_written().emplace(write_length);
-            memcpy(data.data(), ar.get_host_memory() + offset, write_length);
+            access_data &written_data = a.get_written().emplace(write_length);
+            memcpy(written_data.data(), ar.get_host_memory() + offset, write_length);
         }
         // NOLINTEND(bugprone-unchecked-optional-access)
-        m_log.push_access(a, "cmio rx buffer");
+        m_log.push_access(a, text);
+    }
+
+    // -----
+    // i_state_access interface implementation
+    // -----
+    friend i_state_access<record_send_cmio_state_access>;
+
+    void do_write_iflags_Y(uint64_t val) const {
+        log_before_write_write_and_update(machine_reg_address(machine_reg::iflags_Y),
+            m_m.get_state().shadow.registers.iflags.Y, val, "iflags.Y");
+    }
+
+    uint64_t do_read_iflags_Y() const {
+        log_read(machine_reg_address(machine_reg::iflags_Y), "iflags.Y");
+        return m_m.get_state().shadow.registers.iflags.Y;
+    }
+
+    void do_write_htif_fromhost(uint64_t val) const {
+        log_before_write_write_and_update(machine_reg_address(machine_reg::htif_fromhost),
+            m_m.get_state().shadow.registers.htif.fromhost, val, "htif.fromhost");
+    }
+
+    uint64_t do_read_htif_tohost() const {
+        log_read(machine_reg_address(machine_reg::htif_tohost), "htif.tohost");
+        return m_m.get_state().shadow.registers.htif.tohost;
+    }
+
+    void do_write_revert_root_hash(const_machine_hash_view hash) const {
+        log_write_memory_with_padding(AR_SHADOW_REVERT_ROOT_HASH_START, hash.data(), hash.size(),
+            HASH_TREE_LOG2_WORD_SIZE, "revert root hash");
+    }
+
+    void do_write_memory_with_padding(uint64_t paddr, const unsigned char *data, uint64_t data_length,
+        int write_length_log2_size) const {
+        log_write_memory_with_padding(paddr, data, data_length, write_length_log2_size, "cmio rx buffer");
     }
 
     // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
diff --git a/src/record-step-state-access.hpp b/src/record-step-state-access.hpp
index 0b53a129a..d81c52972 100644
--- a/src/record-step-state-access.hpp
+++ b/src/record-step-state-access.hpp
@@ -30,6 +30,7 @@
 #include "hash-tree-constants.hpp"
 #include "hash-tree.hpp"
 #include "host-addr.hpp"
+#include "i-accept-dirty-pages.hpp"
 #include "i-accept-scoped-notes.hpp"
 #include "i-prefer-shadow-state.hpp"
 #include "i-state-access.hpp"
@@ -61,6 +62,7 @@ struct i_state_access_fast_addr<record_step_state_access> {
 class record_step_state_access :
     public i_state_access<record_step_state_access>,
     public i_accept_scoped_notes<record_step_state_access>,
+    public i_accept_dirty_pages<record_step_state_access>,
     public i_prefer_shadow_state<record_step_state_access> {
 
     using page_data_type = std::array<uint8_t, HASH_TREE_PAGE_SIZE>;
@@ -351,11 +353,6 @@ class record_step_state_access :
         return m_m.get_host_addr(paddr, pma_index);
     }
 
-    void do_mark_dirty_page(host_addr haddr, uint64_t pma_index) const {
-        // this is a noop in replay_step_state_access, so we do nothing else
-        m_m.mark_dirty_page(haddr, pma_index);
-    }
-
     bool do_putchar(uint8_t /*c*/) const { // NOLINT(readability-convert-member-functions-to-static)
         return false;
     }
@@ -363,6 +360,15 @@ class record_step_state_access :
     constexpr const char *do_get_name() const { // NOLINT(readability-convert-member-functions-to-static)
         return "record_step_state_access";
     }
+
+    // -----
+    // i_accept_dirty_pages interface implementation
+    // -----
+    friend i_accept_dirty_pages<record_step_state_access>;
+
+    void do_mark_dirty_page(uint64_t paddr, uint64_t pma_index) const {
+        m_m.mark_dirty_page(paddr, pma_index);
+    }
 };
 
 } // namespace cartesi
diff --git a/src/rejected-manual-yield.hpp b/src/rejected-manual-yield.hpp
new file mode 100644
index 000000000..1e656705d
--- /dev/null
+++ b/src/rejected-manual-yield.hpp
@@ -0,0 +1,48 @@
+// Copyright Cartesi and individual authors (see AUTHORS)
+// SPDX-License-Identifier: LGPL-3.0-or-later
+//
+// This program is free software: you can redistribute it and/or modify it under
+// the terms of the GNU Lesser General Public License as published by the Free
+// Software Foundation, either version 3 of the License, or (at your option) any
+// later version.
+//
+// This program is distributed in the hope that it will be useful, but WITHOUT ANY
+// WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A
+// PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details.
+//
+// You should have received a copy of the GNU Lesser General Public License along
+// with this program (see COPYING). If not, see <https://www.gnu.org/licenses/>.
+//
+
+#ifndef REJECTED_MANUAL_YIELD_HPP
+#define REJECTED_MANUAL_YIELD_HPP
+
+/// \file
+/// \brief Predicate for the manual-yield rejected machine state
+
+#include <cstdint>
+
+#include "htif-constants.hpp"
+
+namespace cartesi {
+
+/// \brief Tells if the machine is paused on a manual yield whose reason is rx-rejected.
+/// \tparam STATE_ACCESS State access class.
+/// \param a State accessor.
+/// \returns True when a manual yield with reason rx-rejected is pending.
+/// \details This is the state in which verifiers use the recorded revert root hash
+/// in place of the computed machine root hash. The uarch-dialect equivalent lives in
+/// uarch-reset-state.cpp, where it is translated to Solidity.
+template <typename STATE_ACCESS>
+bool is_rejected_manual_yield(const STATE_ACCESS &a) {
+    if (a.read_iflags_Y() == 0) {
+        return false;
+    }
+    const uint64_t tohost = a.read_htif_tohost();
+    return HTIF_DEV_FIELD(tohost) == HTIF_DEV_YIELD && HTIF_CMD_FIELD(tohost) == HTIF_YIELD_CMD_MANUAL &&
+        HTIF_REASON_FIELD(tohost) == HTIF_YIELD_MANUAL_REASON_RX_REJECTED;
+}
+
+} // namespace cartesi
+
+#endif
diff --git a/src/replay-send-cmio-state-access.hpp b/src/replay-send-cmio-state-access.hpp
index ad3580438..44a57fecf 100644
--- a/src/replay-send-cmio-state-access.hpp
+++ b/src/replay-send-cmio-state-access.hpp
@@ -20,6 +20,7 @@
 /// \file
 /// \brief State access implementation that replays recorded state accesses
 
+#include <algorithm>
 #include <cstdint>
 #include <cstring>
 #include <ios>
@@ -30,6 +31,7 @@
 #include <vector>
 
 #include "access-log.hpp"
+#include "address-range-constants.hpp"
 #include "hash-tree-constants.hpp"
 #include "i-hasher.hpp"
 #include "i-state-access.hpp"
@@ -56,17 +58,16 @@ class replay_send_cmio_state_access final : public i_state_access<replay_send_cm
         /// \brief Constructor replay_send_cmio_state_access context
         /// \param log Access log to be replayed
         /// \param initial_hash Initial root hash
-        context(const access_log &log, const machine_hash &initial_hash, hash_function_type hash_function) :
+        context(const access_log &log, const_machine_hash_view initial_hash, hash_function_type hash_function) :
             accesses(log.get_accesses()),
-            root_hash(initial_hash),
             hash_function(hash_function) {
-            ;
+            std::ranges::copy(initial_hash, root_hash.begin());
         }
         const std::vector<access> &accesses; // NOLINT(cppcoreguidelines-avoid-const-or-ref-data-members)
         ///< Index of next access to ne consumed
         unsigned int next_access{};
         ///< Root hash before next access
-        machine_hash root_hash;
+        machine_hash root_hash{};
         ///< Hash function type used for the log
         hash_function_type hash_function;
     };
@@ -126,30 +127,23 @@ class replay_send_cmio_state_access final : public i_state_access<replay_send_cm
         static_assert(HASH_TREE_LOG2_WORD_SIZE >= log2_size_v<uint64_t>,
             "Hash tree word size must be at least as large as a machine word");
         if ((paligned & (sizeof(uint64_t) - 1)) != 0) {
-            // This is never reached by coverage because replay only uses check_read to check iflags_Y
+            // This is never reached by coverage because replay only uses check_read on word-aligned registers
             // LCOV_EXCL_START
             throw std::invalid_argument{"address not aligned to word size"};
             // LCOV_EXCL_STOP
         }
         if (m_context.next_access >= m_context.accesses.size()) {
-            // This is never reached by coverage because replay checks one read and its the first access
-            // If we truncate before the read, there will be zero accesses and another error triggers first
-            // LCOV_EXCL_START
             throw std::invalid_argument{"too few accesses in log"};
-            // LCOV_EXCL_STOP
         }
         const auto &access = m_context.accesses[m_context.next_access];
         if (access.get_type() != access_type::read) {
             throw std::invalid_argument{"expected " + access_to_report() + " to read " + text};
         }
         if (access.get_address() != paligned) {
-            // This is never reached by coverage because we only use check_read to check iflags_Y
-            // LCOV_EXCL_START
             std::ostringstream err;
             err << "expected " << access_to_report() << " to read " << text << " address 0x" << std::hex << paligned
                 << "(" << std::dec << paligned << ")";
             throw std::invalid_argument{err.str()};
-            // LCOV_EXCL_STOP
         }
         if (access.get_log2_size() != log2_size_v<uint64_t>) {
             throw std::invalid_argument{"expected " + access_to_report() + " to read 2^" +
@@ -276,20 +270,14 @@ class replay_send_cmio_state_access final : public i_state_access<replay_send_cm
         m_context.next_access++;
     }
 
-    void do_write_iflags_Y(uint64_t val) const {
-        check_write(machine_reg_address(machine_reg::iflags_Y), val, "iflags.Y");
-    }
-
-    uint64_t do_read_iflags_Y() const {
-        return check_read(machine_reg_address(machine_reg::iflags_Y), "iflags.Y");
-    }
-
-    void do_write_htif_fromhost(uint64_t val) const {
-        check_write(machine_reg_address(machine_reg::htif_fromhost), val, "htif.fromhost");
-    }
-
-    void do_write_memory_with_padding(uint64_t paddr, const unsigned char *data, uint64_t data_length,
-        int write_length_log2_size) const {
+    /// \brief Checks a logged zero-padded write of a data buffer to memory and advances the log.
+    /// \param paddr Destination physical address.
+    /// \param data Pointer to source data buffer.
+    /// \param data_length Length of data buffer.
+    /// \param write_length_log2_size Log2 size of the total write length.
+    /// \param text Textual description of the access.
+    void check_write_memory_with_padding(uint64_t paddr, const unsigned char *data, uint64_t data_length,
+        int write_length_log2_size, const std::string &text) const {
         variant_hasher h{m_context.hash_function};
         if (data == nullptr) {
             throw std::invalid_argument("data is null");
@@ -298,7 +286,6 @@ class replay_send_cmio_state_access final : public i_state_access<replay_send_cm
         if (write_length < data_length) {
             throw std::invalid_argument{"write length is less than data length"};
         }
-        const auto text = std::string("cmio rx buffer");
         if (m_context.next_access >= m_context.accesses.size()) {
             throw std::invalid_argument{"too few accesses in log"};
         }
@@ -363,6 +350,32 @@ class replay_send_cmio_state_access final : public i_state_access<replay_send_cm
         m_context.next_access++;
     }
 
+    void do_write_iflags_Y(uint64_t val) const {
+        check_write(machine_reg_address(machine_reg::iflags_Y), val, "iflags.Y");
+    }
+
+    uint64_t do_read_iflags_Y() const {
+        return check_read(machine_reg_address(machine_reg::iflags_Y), "iflags.Y");
+    }
+
+    void do_write_htif_fromhost(uint64_t val) const {
+        check_write(machine_reg_address(machine_reg::htif_fromhost), val, "htif.fromhost");
+    }
+
+    uint64_t do_read_htif_tohost() const {
+        return check_read(machine_reg_address(machine_reg::htif_tohost), "htif.tohost");
+    }
+
+    void do_write_revert_root_hash(const_machine_hash_view hash) const {
+        check_write_memory_with_padding(AR_SHADOW_REVERT_ROOT_HASH_START, hash.data(), hash.size(),
+            HASH_TREE_LOG2_WORD_SIZE, "revert root hash");
+    }
+
+    void do_write_memory_with_padding(uint64_t paddr, const unsigned char *data, uint64_t data_length,
+        int write_length_log2_size) const {
+        check_write_memory_with_padding(paddr, data, data_length, write_length_log2_size, "cmio rx buffer");
+    }
+
     // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
     constexpr const char *do_get_name() const {
         return "replay_send_cmio_state_access";
diff --git a/src/replay-step-state-access.hpp b/src/replay-step-state-access.hpp
index bfbdce978..3f2a2a352 100644
--- a/src/replay-step-state-access.hpp
+++ b/src/replay-step-state-access.hpp
@@ -38,6 +38,7 @@
 #include "mock-address-range.hpp"
 #include "pmas-constants.hpp"
 #include "pmas.hpp"
+#include "rejected-manual-yield.hpp"
 #include "riscv-constants.hpp"
 #include "shadow-registers.hpp"
 #include "shadow-tlb.hpp"
@@ -270,10 +271,17 @@ class replay_step_state_access :
 
     // \brief Finish the replay and check the final machine root hash
     // \throw runtime_error if the final root hash does not match
+    // \details When the machine has rejected an input (a manual yield with reason
+    // rx-rejected is pending), the canonical root hash after the step is the recorded
+    // revert root hash. Otherwise it is the computed machine root hash.
     void finish() {
-        // compute and check machine root hash after the replay
-        auto computed_final_root_hash = compute_root_hash();
-        if (computed_final_root_hash != m_context.logged_root_hash_after) {
+        machine_hash expected_root_hash_after{};
+        if (is_rejected_manual_yield(*this)) {
+            expected_root_hash_after = read_revert_root_hash();
+        } else {
+            expected_root_hash_after = compute_root_hash();
+        }
+        if (expected_root_hash_after != m_context.logged_root_hash_after) {
             THROW(std::runtime_error, "final root hash mismatch");
         }
     }
@@ -436,6 +444,14 @@ class replay_step_state_access :
         return check_read_reg(what);
     }
 
+    machine_hash do_read_revert_root_hash() const {
+        constexpr uint64_t paddr = AR_SHADOW_REVERT_ROOT_HASH_START;
+        const auto *page_log = find_page(paddr & ~PAGE_OFFSET_MASK);
+        machine_hash hash{};
+        std::copy_n(page_log->data + (paddr & PAGE_OFFSET_MASK), hash.size(), hash.begin());
+        return hash;
+    }
+
     void do_write_shadow_register(shadow_registers_what what, uint64_t val) const {
         check_write_reg(what, val);
     }
@@ -588,10 +604,6 @@ class replay_step_state_access :
     }
     // LCOV_EXCL_STOP
 
-    void do_mark_dirty_page(host_addr /* haddr */, uint64_t /* pma_index */) const {
-        // this is a noop since we have no host machine
-    }
-
     // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
     constexpr const char *do_get_name() const { // NOLINT(readability-convert-member-functions-to-static)
         return "replay_step_state_access";
diff --git a/src/send-cmio-response.cpp b/src/send-cmio-response.cpp
index 29933bdaa..0c3d54209 100644
--- a/src/send-cmio-response.cpp
+++ b/src/send-cmio-response.cpp
@@ -21,6 +21,7 @@
 
 #include "address-range-constants.hpp"
 #include "hash-tree-constants.hpp"
+#include "htif-constants.hpp"
 #include "record-send-cmio-state-access.hpp" // IWYU pragma: keep
 #include "replay-send-cmio-state-access.hpp" // IWYU pragma: keep
 #include "state-access.hpp"                  // IWYU pragma: keep
@@ -30,23 +31,41 @@
 namespace cartesi {
 
 template <typename STATE_ACCESS>
-void send_cmio_response(STATE_ACCESS a, uint16 reason, bytes data, uint32 dataLength) {
+void send_cmio_response(STATE_ACCESS a, bytes32 revertRootHash, uint16 reason, bytes data, uint32 dataLength) {
+    // This function cannot fail. When a failure is detected, the operation is a no-op instead,
+    // so the honest party can always log and prove the resulting state transition.
+    // A response to a machine that is not waiting on a manual yield is a no-op.
     if (!readIflagsY(a)) {
-        throwRuntimeError(a, "iflags.Y is not set");
+        return;
+    }
+    if (reason == HTIF_YIELD_REASON_ADVANCE_STATE) {
+        // Advance-state responses are the input boundary of the rollups flow. They only apply to a
+        // machine waiting for an input on an rx-accepted manual yield. Sending one to a machine that
+        // yielded manual with any other reason (e.g., rejected an input or threw an exception) is a no-op.
+        uint64 tohost = readHtifTohost(a);
+        if (!isYieldedManualWith(tohost, HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED)) {
+            return;
+        }
     }
     // A zero length data is a valid response. We just skip writing to the rx buffer.
+    uint32 writeLengthLog2Size = 0;
     if (dataLength > 0) {
         // Find the write length: the smallest power of 2 that is >= dataLength and >= tree leaf size
-        uint32 writeLengthLog2Size = uint32Log2(dataLength);
+        writeLengthLog2Size = uint32Log2(dataLength);
         if (writeLengthLog2Size < HASH_TREE_LOG2_WORD_SIZE) {
             writeLengthLog2Size = HASH_TREE_LOG2_WORD_SIZE; // minimum write size is the tree leaf size
         }
         if (uint32ShiftLeft(1, writeLengthLog2Size) < dataLength) {
             writeLengthLog2Size += 1;
         }
+        // A response with data that does not fit in the rx buffer is a no-op
         if (writeLengthLog2Size > AR_CMIO_RX_BUFFER_LOG2_SIZE) {
-            throwRuntimeError(a, "CMIO response data is too large");
+            return;
         }
+    }
+    // Record the machine root hash to revert to in case the response is eventually rejected
+    writeRevertRootHash(a, revertRootHash);
+    if (dataLength > 0) {
         writeMemoryWithPadding(a, AR_CMIO_RX_BUFFER_START, data, dataLength, writeLengthLog2Size);
     }
     // Write data length and reason to fromhost
@@ -59,15 +78,16 @@ void send_cmio_response(STATE_ACCESS a, uint16 reason, bytes data, uint32 dataLe
 }
 
 // Explicit instantiation for state_access
-template void send_cmio_response(state_access a, uint16_t reason, const unsigned char *data, uint32 length);
+template void send_cmio_response(state_access a, bytes32 revertRootHash, uint16_t reason, const unsigned char *data,
+    uint32 length);
 
 // Explicit instantiation for record_state_access
-template void send_cmio_response(record_send_cmio_state_access a, uint16_t reason, const unsigned char *data,
-    uint32 length);
+template void send_cmio_response(record_send_cmio_state_access a, bytes32 revertRootHash, uint16_t reason,
+    const unsigned char *data, uint32 length);
 
 // Explicit instantiation for replay_state_access
-template void send_cmio_response(replay_send_cmio_state_access a, uint16_t reason, const unsigned char *data,
-    uint32 length);
+template void send_cmio_response(replay_send_cmio_state_access a, bytes32 revertRootHash, uint16_t reason,
+    const unsigned char *data, uint32 length);
 
 } // namespace cartesi
 // NOLINTEND(google-readability-casting,misc-const-correctness,modernize-use-auto,hicpp-use-auto,readability-use-std-min-max)
diff --git a/src/send-cmio-response.hpp b/src/send-cmio-response.hpp
index bb5117684..fc62dc666 100644
--- a/src/send-cmio-response.hpp
+++ b/src/send-cmio-response.hpp
@@ -19,32 +19,41 @@
 
 #include <cstdint>
 
+#include "machine-hash.hpp"
+
 namespace cartesi {
 
+/// \brief cmio constants
+enum cmio_constants {
+    CMIO_LOG2_MAX_OUTPUT_COUNT = 63, ///< Height of the cmio outputs Merkle tree (capacity 2^63 outputs)
+};
+
 /// \brief Sends cmio response
 /// \tparam STATE_ACCESS State accessor type
 /// \param a State accessor
+/// \param revertRootHash Machine root hash to revert to in case the response is eventually rejected
 /// \param reason Reason for sending the response
 /// \param data Response data
 /// \param length Response data length
 template <typename STATE_ACCESS>
-void send_cmio_response(STATE_ACCESS a, uint16_t reason, const unsigned char *data, uint32_t dataLength);
+void send_cmio_response(STATE_ACCESS a, const_machine_hash_view revertRootHash, uint16_t reason,
+    const unsigned char *data, uint32_t dataLength);
 
 class state_access;
 class record_state_access;
 class replay_state_access;
 
 // Declaration of explicit instantiation in module send_cmio_response.cpp
-extern template void send_cmio_response(state_access a, uint16_t reason, const unsigned char *data,
-    uint32_t dataLength);
+extern template void send_cmio_response(state_access a, const_machine_hash_view revertRootHash, uint16_t reason,
+    const unsigned char *data, uint32_t dataLength);
 
 // Declaration of explicit instantiation in module uarch-reset-state.cpp
-extern template void send_cmio_response(record_state_access a, uint16_t reason, const unsigned char *data,
-    uint32_t dataLength);
+extern template void send_cmio_response(record_state_access a, const_machine_hash_view revertRootHash, uint16_t reason,
+    const unsigned char *data, uint32_t dataLength);
 
 // Declaration of explicit instantiation in module uarch-reset-state.cpp
-extern template void send_cmio_response(replay_state_access a, uint16_t reason, const unsigned char *data,
-    uint32_t dataLength);
+extern template void send_cmio_response(replay_state_access a, const_machine_hash_view revertRootHash, uint16_t reason,
+    const unsigned char *data, uint32_t dataLength);
 
 } // namespace cartesi
 
diff --git a/src/state-access.hpp b/src/state-access.hpp
index 23d82da87..e3e46f424 100644
--- a/src/state-access.hpp
+++ b/src/state-access.hpp
@@ -20,6 +20,7 @@
 /// \file
 /// \brief Fast state access implementation
 
+#include <algorithm>
 #include <cstdint>
 #include <stdexcept>
 #include <utility>
@@ -29,6 +30,7 @@
 #include "compiler-defines.hpp"
 #include "host-addr.hpp"
 #include "i-accept-counters.hpp"
+#include "i-accept-dirty-pages.hpp"
 #include "i-accept-scoped-notes.hpp"
 #include "i-interactive-state-access.hpp"
 #include "i-state-access.hpp"
@@ -56,7 +58,8 @@ class state_access :
     public i_state_access<state_access>,
     public i_interactive_state_access<state_access>,
     public i_accept_scoped_notes<state_access>,
-    public i_accept_counters<state_access> {
+    public i_accept_counters<state_access>,
+    public i_accept_dirty_pages<state_access> {
 
     // NOLINTBEGIN(cppcoreguidelines-avoid-const-or-ref-data-members)
     //??(edubart): Storing reference to the processor state removes an extra indirection when accessing registers,
@@ -450,6 +453,14 @@ class state_access :
         }
     }
 
+    machine_hash do_read_revert_root_hash() const {
+        return m_s.shadow.revert_root_hash;
+    }
+
+    void do_write_revert_root_hash(const_machine_hash_view hash) const {
+        std::ranges::copy(hash, m_s.shadow.revert_root_hash.begin());
+    }
+
     template <typename T, typename A = T>
     void do_read_memory_word(host_addr haddr, uint64_t /* pma_index */, T *pval) const {
         *pval = aliased_aligned_read<T, A>(haddr);
@@ -494,10 +505,6 @@ class state_access :
         return m_m.get_host_addr(paddr, pma_index);
     }
 
-    void do_mark_dirty_page(host_addr haddr, uint64_t pma_index) const {
-        m_m.mark_dirty_page(haddr, pma_index);
-    }
-
     // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
     bool do_putchar(uint8_t c) const {
         return m_m.putchar(c);
@@ -542,6 +549,15 @@ class state_access :
     void do_write_counter(uint64_t val, const char *name, const char *domain) const {
         m_m.write_counter(val, name, domain);
     }
+
+    // -----
+    // i_accept_dirty_pages interface implementation
+    // -----
+    friend i_accept_dirty_pages<state_access>;
+
+    void do_mark_dirty_page(uint64_t paddr, uint64_t pma_index) const {
+        m_m.mark_dirty_page(paddr, pma_index);
+    }
 };
 
 } // namespace cartesi
diff --git a/src/test-collect-hashes.lua b/src/test-collect-hashes.lua
index 6dadb0bd8..32fd7909a 100755
--- a/src/test-collect-hashes.lua
+++ b/src/test-collect-hashes.lua
@@ -116,7 +116,7 @@ local function get_root_hashes_directly(input_count)
             if hashes then tinsert(inputs, hashes) end
             hashes = {}
             local input = encode_input(index)
-            m:send_cmio_response(cartesi.CMIO_YIELD_REASON_ADVANCE_STATE, input)
+            m:send_cmio_response(m:get_root_hash(), cartesi.HTIF_YIELD_REASON_ADVANCE_STATE, input)
             index = index + 1
             if index >= input_count then break end
         end
@@ -154,7 +154,7 @@ local function get_root_hashes_with_collect(input_count)
             hashes = {}
             mcycle_phase = 0
             local input = encode_input(index)
-            m:send_cmio_response(cartesi.CMIO_YIELD_REASON_ADVANCE_STATE, input)
+            m:send_cmio_response(m:get_root_hash(), cartesi.HTIF_YIELD_REASON_ADVANCE_STATE, input)
             index = index + 1
             if index >= input_count then break end
         end
diff --git a/src/translate-virtual-address.hpp b/src/translate-virtual-address.hpp
index 79c34dd93..b34a2b41c 100644
--- a/src/translate-virtual-address.hpp
+++ b/src/translate-virtual-address.hpp
@@ -47,6 +47,7 @@
 
 #include "compiler-defines.hpp"
 #include "find-pma.hpp"
+#include "i-accept-dirty-pages.hpp"
 #include "riscv-constants.hpp"
 
 namespace cartesi {
@@ -68,7 +69,10 @@ static inline bool write_ram_uint64(STATE_ACCESS a, uint64_t paddr, uint64_t val
     // log writes to memory
     a.write_memory_word(faddr, pma_index, val);
     // mark page as dirty so we know to update the hash tree
-    a.mark_dirty_page(faddr, pma_index);
+    // only state accesses with a deferred store need this, see i_accept_dirty_pages
+    if constexpr (is_an_i_accept_dirty_pages_v<STATE_ACCESS>) {
+        a.mark_dirty_page(paddr, pma_index);
+    }
     return true;
 }
 
diff --git a/src/uarch-constants.hpp b/src/uarch-constants.hpp
index 7d99e71a2..753b08739 100644
--- a/src/uarch-constants.hpp
+++ b/src/uarch-constants.hpp
@@ -22,6 +22,7 @@
 #include "address-range-constants.hpp"
 #include "address-range-defines.h"
 #include "cm.h"
+#include "machine-reg.hpp"
 #include "uarch-defines.h"
 
 namespace cartesi {
@@ -66,12 +67,17 @@ static_assert((UARCH_SHADOW_LENGTH & (AR_PAGE_SIZE - 1)) == 0, "UARCH_SHADOW_LEN
 static_assert((UARCH_RAM_LENGTH & (AR_PAGE_SIZE - 1)) == 0, "UARCH_RAM_LENGTH must be multiple of AR_PAGE_SIZE");
 static_assert(UARCH_CYCLE_MAX == CM_UARCH_CYCLE_MAX, "CM_UARCH_CYCLE_MAX must be equal to UARCH_CYCLE_MAX");
 
+/// \brief Machine state addresses referenced by uarch code that is translated to Solidity
+enum uarch_machine_state_addresses : uint64_t {
+    IFLAGS_Y_ADDRESS = machine_reg_address(machine_reg::iflags_Y),       ///< Address of the iflags.Y register
+    HTIF_TOHOST_ADDRESS = machine_reg_address(machine_reg::htif_tohost), ///< Address of the htif.tohost register
+};
+
 /// \brief ecall function codes
 enum uarch_ecall_functions : uint64_t {
-    UARCH_ECALL_FN_HALT = EXPAND_UINT64_C(UARCH_ECALL_FN_HALT_DEF),                       ///< halt uarch execution
-    UARCH_ECALL_FN_PUTCHAR = EXPAND_UINT64_C(UARCH_ECALL_FN_PUTCHAR_DEF),                 ///< putchar
-    UARCH_ECALL_FN_MARK_DIRTY_PAGE = EXPAND_UINT64_C(UARCH_ECALL_FN_MARK_DIRTY_PAGE_DEF), ///< mark_dirty_page
-    UARCH_ECALL_FN_WRITE_TLB = EXPAND_UINT64_C(UARCH_ECALL_FN_WRITE_TLB_DEF),             ///< write_tlb
+    UARCH_ECALL_FN_HALT = EXPAND_UINT64_C(UARCH_ECALL_FN_HALT_DEF),           ///< halt uarch execution
+    UARCH_ECALL_FN_PUTCHAR = EXPAND_UINT64_C(UARCH_ECALL_FN_PUTCHAR_DEF),     ///< putchar
+    UARCH_ECALL_FN_WRITE_TLB = EXPAND_UINT64_C(UARCH_ECALL_FN_WRITE_TLB_DEF), ///< write_tlb
 };
 
 } // namespace cartesi
diff --git a/src/uarch-defines.h b/src/uarch-defines.h
index 7df833c13..78f8d7b8e 100644
--- a/src/uarch-defines.h
+++ b/src/uarch-defines.h
@@ -32,10 +32,10 @@
 #define UARCH_CYCLE_MAX_DEF (1 << UARCH_LOG2_CYCLE_MAX_DEF)
 
 // microarchitecture ecall function codes
-#define UARCH_ECALL_FN_HALT_DEF 1            // halt uarch
-#define UARCH_ECALL_FN_PUTCHAR_DEF 2         // putchar
-#define UARCH_ECALL_FN_MARK_DIRTY_PAGE_DEF 3 // mark_dirty_page
-#define UARCH_ECALL_FN_WRITE_TLB_DEF 4       // write_tlb
+// function code 3 (formerly mark_dirty_page) was removed; the gap in the numbering is intentional
+#define UARCH_ECALL_FN_HALT_DEF 1      // halt uarch
+#define UARCH_ECALL_FN_PUTCHAR_DEF 2   // putchar
+#define UARCH_ECALL_FN_WRITE_TLB_DEF 4 // write_tlb
 
 // helper for using UINT64_C with defines
 #ifndef EXPAND_UINT64_C
diff --git a/src/uarch-record-state-access.hpp b/src/uarch-record-state-access.hpp
index 9b6b41e07..df9d4e3f6 100644
--- a/src/uarch-record-state-access.hpp
+++ b/src/uarch-record-state-access.hpp
@@ -25,6 +25,7 @@
 #include <utility>
 
 #include "access-log.hpp"
+#include "address-range-constants.hpp"
 #include "hash-tree-constants.hpp"
 #include "i-accept-scoped-notes.hpp"
 #include "i-prefer-shadow-uarch-state.hpp"
@@ -48,26 +49,35 @@ class uarch_record_state_access :
     public i_accept_scoped_notes<uarch_record_state_access>,
     public i_prefer_shadow_uarch_state<uarch_record_state_access> {
 
+public:
+    struct context {
+        /// Root hash after the recorded operation, already reverted when the operation reverted the state
+        machine_hash root_hash_after{};
+    };
+
+private:
     // NOLINTBEGIN(cppcoreguidelines-avoid-const-or-ref-data-members)
-    machine &m_m;      ///< Macro machine
-    access_log &m_log; ///< Access log
+    context &m_context; ///< Context
+    machine &m_m;       ///< Macro machine
+    access_log &m_log;  ///< Access log
     // NOLINTEND(cppcoreguidelines-avoid-const-or-ref-data-members)
 
 public:
     /// \brief Constructor from machine and uarch states.
+    /// \param c Reference to context.
     /// \param m Reference to machine state.
     /// \param log Reference to log.
-    uarch_record_state_access(machine &m, access_log &log) : m_m(m), m_log(log) {
+    uarch_record_state_access(context &c, machine &m, access_log &log) : m_context(c), m_m(m), m_log(log) {
         ;
     }
 
 private:
-    static std::pair<uint64_t, int> adjust_access(uint64_t paddr, int log2_size) {
+    static std::pair<uint64_t, int> adjust_access(uint64_t &paddr, int log2_size) {
         static_assert(cartesi::log2_size_v<uint64_t> <= HASH_TREE_LOG2_WORD_SIZE,
             "Hash tree word size must not be smaller than machine word size");
-        if (((paddr >> log2_size) << log2_size) != paddr) {
-            throw std::invalid_argument{"misaligned access"};
-        }
+        // Align paddr down to a multiple of 2^log2_size in place (the caller's variable is updated too),
+        // so that even a buggy misaligned access can still be logged and verified instead of aborting.
+        paddr = (paddr >> log2_size) << log2_size;
         const auto log2_word_size = HASH_TREE_LOG2_WORD_SIZE;
         const auto log2_access_size = std::max(log2_size, log2_word_size);
         const auto access_paddr = (paddr >> log2_access_size) << log2_access_size;
@@ -209,6 +219,24 @@ class uarch_record_state_access :
         return log_read_word_access(paddr, name.c_str());
     }
 
+    machine_hash log_read_revert_root_hash_access() const {
+        access a;
+        log_access_type(a, access_type::read);
+        log_access_range(a, AR_SHADOW_REVERT_ROOT_HASH_START, HASH_TREE_LOG2_WORD_SIZE);
+        log_access_siblings_and_read_hash(a, AR_SHADOW_REVERT_ROOT_HASH_START, HASH_TREE_LOG2_WORD_SIZE);
+        // the value must always be in the log, the EVM verifier consumes it from there
+        const auto &read_data = log_read_data(a, AR_SHADOW_REVERT_ROOT_HASH_START, HASH_TREE_LOG2_WORD_SIZE);
+        machine_hash hash{};
+        std::ranges::copy(read_data, hash.begin());
+        log_access(std::move(a), "revert root hash");
+        return hash;
+    }
+
+    void do_revert_state() const {
+        // the physical machine state does not revert, only the canonical root hash does
+        m_context.root_hash_after = log_read_revert_root_hash_access();
+    }
+
     void do_write_word(uint64_t paddr, uint64_t val) const {
         const auto name = machine::get_address_name(paddr);
         log_write_access(
@@ -259,6 +287,7 @@ class uarch_record_state_access :
                 }
             },
             "uarch.state");
+        m_context.root_hash_after = m_m.get_root_hash();
     }
 
     // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
@@ -266,11 +295,6 @@ class uarch_record_state_access :
         return false;
     }
 
-    void do_mark_dirty_page(uint64_t paddr, uint64_t pma_index) const {
-        // Forward to machine and no need to log
-        m_m.mark_dirty_page(paddr, pma_index);
-    }
-
     // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
     constexpr const char *do_get_name() const {
         return "uarch_record_state_access";
diff --git a/src/uarch-replay-state-access.hpp b/src/uarch-replay-state-access.hpp
index eac4d16c2..3c636619f 100644
--- a/src/uarch-replay-state-access.hpp
+++ b/src/uarch-replay-state-access.hpp
@@ -31,6 +31,7 @@
 #include <vector>
 
 #include "access-log.hpp"
+#include "address-range-constants.hpp"
 #include "hash-tree-constants.hpp"
 #include "hash-tree.hpp"
 #include "i-accept-scoped-notes.hpp"
@@ -60,16 +61,14 @@ class uarch_replay_state_access :
         /// \brief Constructor replay_send_cmio_state_access context
         /// \param log Access log to be replayed
         /// \param initial_hash Initial root hash
-        context(const access_log &log, const machine_hash &initial_hash) :
-            accesses(log.get_accesses()),
-            root_hash(initial_hash) {
-            ;
+        context(const access_log &log, const_machine_hash_view initial_hash) : accesses(log.get_accesses()) {
+            std::ranges::copy(initial_hash, root_hash.begin());
         }
         const std::vector<access> &accesses; // NOLINT(cppcoreguidelines-avoid-const-or-ref-data-members)
         ///< Index of next access to ne consumed
         unsigned int next_access{};
         ///< Root hash before next access
-        machine_hash root_hash;
+        machine_hash root_hash{};
         ///< Hasher needed to verify proofs
         keccak_256_hasher hasher;
     };
@@ -132,9 +131,12 @@ class uarch_replay_state_access :
         return "unknown_";
     }
 
-    static std::pair<uint64_t, int> adjust_access(uint64_t paddr, int log2_size) {
+    static std::pair<uint64_t, int> adjust_access(uint64_t &paddr, int log2_size) {
         static_assert(cartesi::log2_size_v<uint64_t> <= HASH_TREE_LOG2_WORD_SIZE,
             "Hash tree word size must not be smaller than machine word size");
+        // Align paddr down to a multiple of 2^log2_size in place (the caller's variable is updated too),
+        // so that even a buggy misaligned access can still be logged and verified instead of aborting.
+        paddr = (paddr >> log2_size) << log2_size;
         const auto log2_word_size = HASH_TREE_LOG2_WORD_SIZE;
         const auto log2_access_size = std::max(log2_size, log2_word_size);
         const auto access_paddr = (paddr >> log2_access_size) << log2_access_size;
@@ -335,6 +337,27 @@ class uarch_replay_state_access :
         return check_read_word_access(paddr, name.c_str());
     }
 
+    machine_hash check_read_revert_root_hash_access() const {
+        const auto *text = "revert root hash";
+        const auto &a = check_access(text);
+        check_access_type(a, access_type::read, text);
+        check_access_range(a, access_type::read, AR_SHADOW_REVERT_ROOT_HASH_START, HASH_TREE_LOG2_WORD_SIZE, text);
+        std::ignore = check_access_siblings_and_read_hash(a, text);
+        const auto &read_data = check_read_data(a, text);
+        if (read_data.size() != HASH_TREE_WORD_SIZE) {
+            throw std::invalid_argument{
+                "read data for " + std::string(text) + " has wrong size in " + access_to_report()};
+        }
+        machine_hash hash{};
+        std::ranges::copy(read_data, hash.begin());
+        m_context.next_access++;
+        return hash;
+    }
+
+    void do_revert_state() const {
+        m_context.root_hash = check_read_revert_root_hash_access();
+    }
+
     void do_write_word(uint64_t paddr, uint64_t val) const {
         const auto name = machine::get_address_name(paddr);
         check_write_word_access(paddr, val, name.c_str());
@@ -345,11 +368,6 @@ class uarch_replay_state_access :
         return false;
     }
 
-    // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
-    void do_mark_dirty_page(uint64_t /*paddr*/, uint64_t /*pma_index*/) const {
-        ; // do nothing
-    }
-
     void do_reset_uarch() const {
         check_write_access(UARCH_STATE_START_ADDRESS, UARCH_STATE_LOG2_SIZE, get_uarch_pristine_state_hash(),
             "uarch.state");
diff --git a/src/uarch-reset-state.cpp b/src/uarch-reset-state.cpp
index 3977195f8..0e3178f34 100644
--- a/src/uarch-reset-state.cpp
+++ b/src/uarch-reset-state.cpp
@@ -21,6 +21,8 @@
 
 #include "uarch-reset-state.hpp"
 
+#include "htif-constants.hpp"
+#include "uarch-constants.hpp"
 #include "uarch-record-state-access.hpp" // IWYU pragma: keep
 #include "uarch-replay-state-access.hpp" // IWYU pragma: keep
 #include "uarch-solidity-compat.hpp"
@@ -31,6 +33,15 @@ namespace cartesi {
 template <typename UarchState>
 void uarch_reset_state(UarchState &a) {
     resetState(a);
+    // When the machine has rejected an input, the canonical state after the operation is
+    // the one recorded in the revert root hash (which has a pristine uarch)
+    uint64 iflagsY = readWord(a, IFLAGS_Y_ADDRESS);
+    if (iflagsY != 0) {
+        uint64 tohost = readWord(a, HTIF_TOHOST_ADDRESS);
+        if (isYieldedManualWith(tohost, HTIF_YIELD_MANUAL_REASON_RX_REJECTED)) {
+            revertState(a);
+        }
+    }
 }
 
 // Explicit instantiation for uarch_state_access
diff --git a/src/uarch-solidity-compat.hpp b/src/uarch-solidity-compat.hpp
index 5ade287c3..f2af585a9 100644
--- a/src/uarch-solidity-compat.hpp
+++ b/src/uarch-solidity-compat.hpp
@@ -21,6 +21,8 @@
 #include <stdexcept>
 
 #include "assert-printf.hpp"
+#include "htif-constants.hpp"
+#include "machine-hash.hpp"
 #include "shadow-tlb.hpp"
 
 /// \file
@@ -42,6 +44,7 @@ using uint32 = uint32_t;
 using int64 = int64_t;
 using uint64 = uint64_t;
 using bytes = const unsigned char *;
+using bytes32 = const_machine_hash_view;
 
 // Wrapperfunctions used to access data from the uarch state accessor
 
@@ -100,6 +103,11 @@ static inline void resetState(const UarchState a) {
     a.reset_uarch();
 }
 
+template <typename UarchState>
+static inline void revertState(const UarchState a) {
+    a.revert_state();
+}
+
 template <typename State>
 static inline uint64 readIflagsY(State &a) {
     return a.read_iflags_Y();
@@ -115,6 +123,16 @@ static inline void writeHtifFromhost(State &a, uint64 val) {
     a.write_htif_fromhost(val);
 }
 
+template <typename State>
+static inline uint64 readHtifTohost(State &a) {
+    return a.read_htif_tohost();
+}
+
+template <typename State>
+static inline void writeRevertRootHash(State &a, bytes32 revertRootHash) {
+    a.write_revert_root_hash(revertRootHash);
+}
+
 template <typename State>
 static inline void writeMemoryWithPadding(State &a, uint64 paddr, bytes data, uint64_t data_length,
     int32 write_length_log2_size) {
@@ -131,11 +149,6 @@ static inline void putCharECALL(const UarchState a, uint8 c) {
     a.putchar(c);
 }
 
-template <typename UarchState>
-static inline void markDirtyPageECALL(const UarchState a, uint64 paddr, uint64 pma_index) {
-    a.mark_dirty_page(paddr, pma_index);
-}
-
 template <typename UarchState>
 static inline void writeTlbECALL(const UarchState a, uint64 set_index, uint64 slot_index, uint64 vaddr_page,
     uint64 vp_offset, uint64 pma_index) {
@@ -218,6 +231,13 @@ static inline uint32 uint32Log2(uint32 v) {
     return 31 - __builtin_clz(v);
 }
 
+static inline bool isYieldedManualWith(uint64 tohost, uint64 yieldReason) {
+    const uint64 dev = uint64ShiftRight(tohost & HTIF_DEV_MASK, HTIF_DEV_SHIFT);
+    const uint64 cmd = uint64ShiftRight(tohost & HTIF_CMD_MASK, HTIF_CMD_SHIFT);
+    const uint64 reason = uint64ShiftRight(tohost & HTIF_REASON_MASK, HTIF_REASON_SHIFT);
+    return dev == HTIF_DEV_YIELD && cmd == HTIF_YIELD_CMD_MANUAL && reason == yieldReason;
+}
+
 template <typename T1, typename T2>
 void require([[maybe_unused]] T1 condition, [[maybe_unused]] T2 message) {
     assert((condition) && (message));
diff --git a/src/uarch-state-access.hpp b/src/uarch-state-access.hpp
index 43dd0cb57..15498cbae 100644
--- a/src/uarch-state-access.hpp
+++ b/src/uarch-state-access.hpp
@@ -83,6 +83,11 @@ class uarch_state_access :
         return m_m.read_word(paddr);
     }
 
+    // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
+    void do_revert_state() const {
+        ; // the physical machine state does not revert
+    }
+
     void do_write_word(uint64_t paddr, uint64_t val) const {
         // Forward to machine
         m_m.write_word(paddr, val);
@@ -95,12 +100,6 @@ class uarch_state_access :
         return false;
     }
 
-    // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
-    void do_mark_dirty_page(uint64_t paddr, uint64_t pma_index) const {
-        // Forward to machine
-        m_m.mark_dirty_page(paddr, pma_index);
-    }
-
     void do_write_tlb(TLB_set_index set_index, uint64_t slot_index, uint64_t vaddr_page, uint64_t vp_offset,
         uint64_t pma_index) const {
         // Forward to machine
diff --git a/src/uarch-step.cpp b/src/uarch-step.cpp
index 0c73e7c44..dc4f15000 100644
--- a/src/uarch-step.cpp
+++ b/src/uarch-step.cpp
@@ -880,12 +880,6 @@ static inline void executeECALL(const UarchState a, uint32 insn, uint64 pc) {
         putCharECALL(a, uint8(c)); // Can be a NOOP in Solidity
         return advancePc(a, pc);
     }
-    if (fn == UARCH_ECALL_FN_MARK_DIRTY_PAGE) {
-        uint64 paddr = readX(a, 10);             // a0 contains physical address in page to be marked dirty
-        uint64 pma_index = readX(a, 11);         // a1 contains a index of PMA where page falls
-        markDirtyPageECALL(a, paddr, pma_index); // This MUST be be a NOOP in Solidity
-        return advancePc(a, pc);
-    }
     if (fn == UARCH_ECALL_FN_WRITE_TLB) {
         uint64 set_index = readX(a, 10);  // a0 contains TLB set (code, read, write)
         uint64 slot_index = readX(a, 11); // a1 contains slot_index to modify
diff --git a/tests/dependencies b/tests/dependencies
index ce8897a32..e923e0515 100644
--- a/tests/dependencies
+++ b/tests/dependencies
@@ -1,2 +1,2 @@
-https://github.com/cartesi/machine-guest-tools/releases/download/v0.18.0-test1/rootfs-tools.ext2
+https://github.com/cartesi/machine-guest-tools/releases/download/v0.18.0-test4/rootfs-tools.ext2
 https://github.com/cartesi/machine-linux-image/releases/download/v0.21.0-test1/linux-6.5.13-ctsi-2-uio-test1-v0.21.0.bin
diff --git a/tests/dependencies.sha256 b/tests/dependencies.sha256
index ede08897e..70bcb868a 100644
--- a/tests/dependencies.sha256
+++ b/tests/dependencies.sha256
@@ -1,2 +1,2 @@
 9fb5aaa623f35c0ef2138c8dadf1b0a1e388e0f51758cb6a5477ec5cecd3a029  build/images/linux-6.5.13-ctsi-2-uio-test1-v0.21.0.bin
-de8a4060e41910b500bd47849301ab5b4a41959570242de0a4d81f08ad8b59cc  build/images/rootfs-tools.ext2
+fbb456fb0be38ed0e211d90214fe18b0247d59c09024b312e96b41aaa46bb91a  build/images/rootfs-tools.ext2
diff --git a/tests/lua/cartesi-machine-tests.lua b/tests/lua/cartesi-machine-tests.lua
index 689b18fef..611558663 100755
--- a/tests/lua/cartesi-machine-tests.lua
+++ b/tests/lua/cartesi-machine-tests.lua
@@ -551,9 +551,9 @@ local options = {
             if not opts then
                 return false
             end
-            local c = util.parse_options(opts, all, {
+            local c = util.parse_options({
                 update_hash_tree = "number",
-            })
+            }, all, opts)
             c.update_hash_tree = assert(c.update_hash_tree, "invalid update_hash_tree number in " .. all)
             concurrency_update_hash_tree = c.update_hash_tree
             return true
diff --git a/tests/lua/cmio-test.lua b/tests/lua/cmio-test.lua
index c6effd475..4d03f9c94 100755
--- a/tests/lua/cmio-test.lua
+++ b/tests/lua/cmio-test.lua
@@ -125,17 +125,17 @@ local function load_machine(name)
 end
 
 local function next_input(machine, reason, data)
-    machine:send_cmio_response(reason, data)
+    machine:send_cmio_response(machine:get_root_hash(), reason, data)
 end
 
 local function setup_advance(machine, data)
     assert(data)
-    local reason = cartesi.CMIO_YIELD_REASON_ADVANCE_STATE
+    local reason = cartesi.HTIF_YIELD_REASON_ADVANCE_STATE
     next_input(machine, reason, data)
 end
 
 local function setup_inspect(machine, data)
-    local reason = cartesi.CMIO_YIELD_REASON_INSPECT_STATE
+    local reason = cartesi.HTIF_YIELD_REASON_INSPECT_STATE
     next_input(machine, reason, data)
 end
 
@@ -147,8 +147,8 @@ end
 local function check_output(machine, expected)
     assert(machine:read_reg("iflags_X") ~= 0)
     local cmd, reason, output = machine:receive_cmio_request()
-    assert(cmd == cartesi.CMIO_YIELD_COMMAND_AUTOMATIC)
-    assert(reason == cartesi.CMIO_YIELD_AUTOMATIC_REASON_TX_OUTPUT)
+    assert(cmd == cartesi.HTIF_YIELD_CMD_AUTOMATIC)
+    assert(reason == cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT)
     if expected ~= output then
         local e <close> = assert(io.open("expected.bin", "wb"))
         local o <close> = assert(io.open("output.bin", "wb"))
@@ -163,16 +163,16 @@ end
 local function check_report(machine, expected)
     assert(machine:read_reg("iflags_X") ~= 0)
     local cmd, reason, output = machine:receive_cmio_request()
-    assert(cmd == cartesi.CMIO_YIELD_COMMAND_AUTOMATIC)
-    assert(reason == cartesi.CMIO_YIELD_AUTOMATIC_REASON_TX_REPORT)
+    assert(cmd == cartesi.HTIF_YIELD_CMD_AUTOMATIC)
+    assert(reason == cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT)
     assert(expected == output)
 end
 
 local function check_exception(machine, expected)
     assert(machine:read_reg("iflags_Y") ~= 0)
     local cmd, reason, output = machine:receive_cmio_request()
-    assert(cmd == cartesi.CMIO_YIELD_COMMAND_MANUAL)
-    assert(reason == cartesi.CMIO_YIELD_MANUAL_REASON_TX_EXCEPTION)
+    assert(cmd == cartesi.HTIF_YIELD_CMD_MANUAL)
+    assert(reason == cartesi.HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION)
     assert(expected == output, string.format("expected: %q, got: %q", expected, output))
 end
 
@@ -208,11 +208,11 @@ end
 local function check_finish(machine, output_hashes, expected_reason)
     local cmd, reason, output = machine:receive_cmio_request()
     assert(machine:read_reg("iflags_Y") ~= 0)
-    assert(cmd == cartesi.CMIO_YIELD_COMMAND_MANUAL)
+    assert(cmd == cartesi.HTIF_YIELD_CMD_MANUAL)
     assert(reason == expected_reason)
 
     -- only check for output-hashes-root-hash if the input was accepted
-    if expected_reason == cartesi.CMIO_YIELD_MANUAL_REASON_RX_ACCEPTED then
+    if expected_reason == cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED then
         assert(#output == cartesi.HASH_SIZE)
         check_outputs_root_hash(output, output_hashes)
     else
@@ -290,7 +290,7 @@ for _, dapp in pairs({ "ioctl", "http" }) do
 
                 -- finish
                 machine:run(MAX_MCYCLE)
-                check_finish(machine, hashes, cartesi.CMIO_YIELD_MANUAL_REASON_RX_ACCEPTED)
+                check_finish(machine, hashes, cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED)
             end
 
             return 0
@@ -314,7 +314,7 @@ for _, dapp in pairs({ "ioctl", "http" }) do
 
         -- finish
         machine:run(MAX_MCYCLE)
-        check_finish(machine, hashes, cartesi.CMIO_YIELD_MANUAL_REASON_RX_REJECTED)
+        check_finish(machine, hashes, cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED)
 
         return 0
     end, 0)
diff --git a/tests/lua/htif-console.lua b/tests/lua/htif-console.lua
index 68e6c602e..2a281c48c 100755
--- a/tests/lua/htif-console.lua
+++ b/tests/lua/htif-console.lua
@@ -45,8 +45,21 @@ local function test(config, console_getchar_enable)
     config.htif = {
         console_getchar = console_getchar_enable,
     }
-    local machine <close> = cartesi.machine(config)
-    machine:run(math.maxinteger)
+    -- feed the test input through the runtime console buffer instead of host stdin
+    local runtime = {
+        console = {
+            input_source = "from_buffer",
+        },
+    }
+    local machine <close> = cartesi.machine(config, runtime)
+    if console_getchar_enable then
+        machine:write_console_input("CTSI")
+    end
+    -- run() breaks with BREAK_REASON_CONSOLE_INPUT when the input buffer drains,
+    -- so keep running until the machine halts
+    repeat
+        machine:run(math.maxinteger)
+    until machine:read_reg("iflags_H") ~= 0
 
     -- should be halted
     assert(machine:read_reg("iflags_H") ~= 0, "expected iflags_H set")
diff --git a/tests/lua/htif-yield.lua b/tests/lua/htif-yield.lua
index 6c62d3610..432ebdfd1 100755
--- a/tests/lua/htif-yield.lua
+++ b/tests/lua/htif-yield.lua
@@ -131,15 +131,15 @@ if uarch then
     config.uarch = uarch
 end
 
-local YIELD_MANUAL = cartesi.CMIO_YIELD_COMMAND_MANUAL
-local YIELD_AUTOMATIC = cartesi.CMIO_YIELD_COMMAND_AUTOMATIC
+local YIELD_MANUAL = cartesi.HTIF_YIELD_CMD_MANUAL
+local YIELD_AUTOMATIC = cartesi.HTIF_YIELD_CMD_AUTOMATIC
 
-local REASON_PROGRESS = cartesi.CMIO_YIELD_AUTOMATIC_REASON_PROGRESS
-local REASON_TX_OUTPUT = cartesi.CMIO_YIELD_AUTOMATIC_REASON_TX_OUTPUT
-local REASON_TX_REPORT = cartesi.CMIO_YIELD_AUTOMATIC_REASON_TX_REPORT
-local REASON_RX_ACCEPTED = cartesi.CMIO_YIELD_MANUAL_REASON_RX_ACCEPTED
-local REASON_RX_REJECTED = cartesi.CMIO_YIELD_MANUAL_REASON_RX_REJECTED
-local REASON_TX_EXCEPTION = cartesi.CMIO_YIELD_MANUAL_REASON_TX_EXCEPTION
+local REASON_PROGRESS = cartesi.HTIF_YIELD_AUTOMATIC_REASON_PROGRESS
+local REASON_TX_OUTPUT = cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_OUTPUT
+local REASON_TX_REPORT = cartesi.HTIF_YIELD_AUTOMATIC_REASON_TX_REPORT
+local REASON_RX_ACCEPTED = cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED
+local REASON_RX_REJECTED = cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED
+local REASON_TX_EXCEPTION = cartesi.HTIF_YIELD_MANUAL_REASON_TX_EXCEPTION
 
 local yields = {
     { mcycle = 10, data = 10, cmd = YIELD_MANUAL, reason = REASON_PROGRESS },
diff --git a/tests/lua/machine-bind.lua b/tests/lua/machine-bind.lua
index 8fe227fa1..23b8888a6 100755
--- a/tests/lua/machine-bind.lua
+++ b/tests/lua/machine-bind.lua
@@ -113,9 +113,9 @@ local options = {
             if not opts then
                 return false
             end
-            local c = util.parse_options(opts, all, {
+            local c = util.parse_options({
                 update_hash_tree = "number",
-            })
+            }, all, opts)
             c.update_hash_tree = assert(c.update_hash_tree, "invalid update_hash_tree number in " .. all)
             return true
         end,
@@ -549,6 +549,14 @@ do_test("should return expected value", function(machine)
     assert(root_hash == calculated_root_hash, "initial root hash does not match")
 end)
 
+print("\n\n test read_revert_root_hash and write_revert_root_hash")
+do_test("should round-trip correctly", function(machine)
+    local root_hash = machine:get_root_hash()
+    machine:write_revert_root_hash(root_hash)
+    local revert_hash = machine:read_revert_root_hash()
+    assert(root_hash == revert_hash, "revert root hash does not match hash that was set")
+end)
+
 print("\n\n test get_initial_config")
 do_test("should have expected values", function(machine)
     -- Check initial config
@@ -767,7 +775,7 @@ print("\n\n dump step log to console")
 do_test("dumped step log content should match", function(machine)
     local log = machine:log_step_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS | cartesi.ACCESS_LOG_TYPE_LARGE_DATA)
     local temp_file <close> = test_util.new_temp_file()
-    util.dump_log(log, temp_file)
+    util.print_log(log, temp_file)
     local log_output = temp_file:read_all()
     -- luacheck: push no max line length
     local expected_output = "begin step\n"
@@ -974,7 +982,11 @@ local function test_reset_uarch(machine, with_log, with_annotations)
     if with_log then
         local log_type = (with_annotations and cartesi.ACCESS_LOG_TYPE_ANNOTATIONS or 0)
         local log = machine:log_reset_uarch(log_type)
-        assert(#log.accesses == 1)
+        assert(#log.accesses == 2)
+        -- the second access reads iflags.Y to check for a rejected input
+        local read_iflags_y = log.accesses[2]
+        assert(read_iflags_y.type == "read")
+        assert(read_iflags_y.address == machine:get_reg_address("iflags_Y"))
         local access = log.accesses[1]
         assert(access.sibling_hashes ~= nil)
         assert(access.address == cartesi.UARCH_SHADOW_START_ADDRESS)
@@ -1045,6 +1057,61 @@ test_util.make_do_test(build_machine, machine_type, { uarch = test_reset_uarch_c
     end
 )
 
+-- Puts the machine in the manual-yield rejected state with a recorded revert root hash
+local function set_rejected_input_state(machine, revert_hash)
+    machine:write_revert_root_hash(revert_hash)
+    machine:write_reg("iflags_Y", 1)
+    machine:write_reg("htif_tohost_dev", cartesi.HTIF_DEV_YIELD)
+    machine:write_reg("htif_tohost_cmd", cartesi.HTIF_YIELD_CMD_MANUAL)
+    machine:write_reg("htif_tohost_reason", cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED)
+end
+
+test_util.make_do_test(build_machine, machine_type, { uarch = test_reset_uarch_config })(
+    "Testing log_reset_uarch reverts to the revert root hash when the input was rejected",
+    function(machine)
+        local revert_hash = string.rep("\x5a", cartesi.HASH_SIZE)
+        set_rejected_input_state(machine, revert_hash)
+        local initial_hash = machine:get_root_hash()
+        local log = machine:log_reset_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS)
+        -- the physical machine has its uarch reset as usual
+        assert(machine:read_reg("uarch_cycle") == 0, "uarch should have been reset")
+        -- the log contains the uarch state write followed by the three reads
+        assert(#log.accesses == 4)
+        assert(log.accesses[1].type == "write")
+        assert(log.accesses[2].type == "read")
+        assert(log.accesses[3].type == "read")
+        assert(log.accesses[4].type == "read")
+        assert(log.accesses[4].address == cartesi.AR_SHADOW_REVERT_ROOT_HASH_START)
+        -- the canonical root hash after the operation is the revert root hash
+        machine:verify_reset_uarch(initial_hash, log, revert_hash)
+        -- the machine's actual root hash is not accepted
+        local _, err = pcall(machine.verify_reset_uarch, machine, initial_hash, log, machine:get_root_hash())
+        check_error_find(err, "mismatch in root hash after replay")
+        -- a tampered revert root hash value is not accepted
+        log.accesses[4].read = string.rep("\xff", cartesi.HASH_SIZE)
+        _, err = pcall(machine.verify_reset_uarch, machine, initial_hash, log, revert_hash)
+        check_error_find(err, "read data for revert root hash does not match read hash")
+    end
+)
+
+test_util.make_do_test(build_machine, machine_type, { uarch = test_reset_uarch_config })(
+    "Testing log_reset_uarch does not revert when the yield reason is not rx-rejected",
+    function(machine)
+        local revert_hash = string.rep("\x5a", cartesi.HASH_SIZE)
+        set_rejected_input_state(machine, revert_hash)
+        machine:write_reg("htif_tohost_reason", cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED)
+        local initial_hash = machine:get_root_hash()
+        local log = machine:log_reset_uarch()
+        -- the uarch was reset normally
+        assert(machine:read_reg("uarch_cycle") == 0, "uarch should have been reset")
+        -- the uarch state write is followed by the iflags.Y and htif.tohost reads
+        assert(#log.accesses == 3)
+        assert(log.accesses[1].type == "write")
+        assert(log.accesses[3].type == "read")
+        machine:verify_reset_uarch(initial_hash, log, machine:get_root_hash())
+    end
+)
+
 test_util.make_do_test(build_machine, machine_type, { hash_tree = { hash_function = "sha256" } })(
     "Uarch operations should fail if hash tree hash function is not keccak256",
     function(machine)
@@ -1074,7 +1141,7 @@ test_util.make_do_test(build_machine, machine_type, { hash_tree = { hash_functio
             success == false and err:match("can only be used with hash tree configured with Keccak%-256 hash function")
         )
         -- log_send_cmio_response should fail
-        success, err = pcall(machine.log_send_cmio_response, machine, 0, 0)
+        success, err = pcall(machine.log_send_cmio_response, machine, string.rep("\0", 32), 0, 0)
         assert(
             success == false and err:match("can only be used with hash tree configured with Keccak%-256 hash function")
         )
@@ -1088,6 +1155,7 @@ test_util.make_do_test(build_machine, machine_type, { uarch = test_reset_uarch_c
         local expected_dump_pattern = "begin reset_uarch_state\n"
             .. "  1: write uarch.state@0x400000%(4194304%): "
             .. 'hash:"[0-9a-f]+"%(2%^22 bytes%) %-> hash:"[0-9a-fA-F]+"%(2%^22 bytes%)\n'
+            .. "  2: read iflags.Y@0x300%(768%): 0x0%(0%)\n"
             .. "end reset_uarch_state\n"
 
         local tmpname = os.tmpname()
@@ -1098,7 +1166,7 @@ test_util.make_do_test(build_machine, machine_type, { uarch = test_reset_uarch_c
             end,
         })
         local tmp <close> = assert(io.open(tmpname, "w+"))
-        util.dump_log(log, tmp)
+        util.print_log(log, tmp)
         tmp:seek("set", 0)
         local actual_dump = tmp:read("*all")
 
@@ -1120,7 +1188,7 @@ test_util.make_do_test(build_machine, machine_type, { uarch = test_reset_uarch_c
         local initial_hash = machine:get_root_hash()
         local log = machine:log_reset_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS | cartesi.ACCESS_LOG_TYPE_LARGE_DATA)
         local final_hash = machine:get_root_hash()
-        assert(#log.accesses == 1, "log should have 1 access")
+        assert(#log.accesses == 2, "log should have 2 accesses")
         local access = log.accesses[1]
         -- when large data is requested, the log must include read and written data
         assert(access.read ~= nil, "read data should not be nil")
@@ -1165,7 +1233,7 @@ do_test("Test unhappy paths of verify_reset_uarch", function(machine)
     end)
 
     assert_error('missing field "log/accesses/0/read_hash"', function(log)
-        log.accesses[#log.accesses].read_hash = nil
+        log.accesses[1].read_hash = nil
     end)
     assert_error("siblings and read hash do not match root hash before 1st access to uarch.state", function(log)
         log.accesses[1].read_hash = bad_hash
@@ -1174,13 +1242,13 @@ do_test("Test unhappy paths of verify_reset_uarch", function(machine)
         log.accesses[#log.accesses + 1] = log.accesses[1]
     end)
     assert_error("missing written hash of uarch.state in 1st access", function(log)
-        log.accesses[#log.accesses].written_hash = nil
+        log.accesses[1].written_hash = nil
     end)
     assert_error("access written data size is inconsistent with proof size", function(log)
-        log.accesses[#log.accesses].written = "\0"
+        log.accesses[1].written = "\0"
     end)
     assert_error("written data for uarch.state does not match written hash in 1st access", function(log)
-        log.accesses[#log.accesses].written = string.rep("\0", 2 ^ 22)
+        log.accesses[1].written = string.rep("\0", 2 ^ 22)
     end)
     assert_error("siblings and read hash do not match root hash before 1st access to uarch.state", function(log)
         log.accesses[1].sibling_hashes[1] = bad_hash
@@ -1295,11 +1363,14 @@ do_test("send_cmio_response fails if iflags.Y is not set", function(machine)
     machine:write_reg("iflags_Y", 0)
     assert(machine:read_reg("iflags_Y") == 0)
     test_util.assert_error("iflags.Y is not set", function()
-        machine:send_cmio_response(reason, data)
-    end)
-    test_util.assert_error("iflags.Y is not set", function()
-        machine:log_send_cmio_response(reason, data)
+        machine:send_cmio_response(machine:get_root_hash(), reason, data)
     end)
+    -- the logged operation cannot fail, it is a no-op instead
+    local root_hash_before = machine:get_root_hash()
+    local log = machine:log_send_cmio_response(root_hash_before, reason, data)
+    assert(#log.accesses == 1, "no-op log should have 1 access")
+    assert(machine:get_root_hash() == root_hash_before)
+    machine:verify_send_cmio_response(root_hash_before, reason, data, root_hash_before, log, root_hash_before)
 end)
 
 do_test("send_cmio_response fails if data is too big", function(machine)
@@ -1307,11 +1378,14 @@ do_test("send_cmio_response fails if data is too big", function(machine)
     local data_too_big = string.rep("a", 1 + (1 << cartesi.AR_CMIO_RX_BUFFER_LOG2_SIZE))
     machine:write_reg("iflags_Y", 1)
     test_util.assert_error("CMIO response data is too large", function()
-        machine:send_cmio_response(reason, data_too_big)
-    end)
-    test_util.assert_error("CMIO response data is too large", function()
-        machine:log_send_cmio_response(reason, data_too_big)
+        machine:send_cmio_response(machine:get_root_hash(), reason, data_too_big)
     end)
+    -- the logged operation cannot fail, it is a no-op instead
+    local root_hash_before = machine:get_root_hash()
+    local log = machine:log_send_cmio_response(root_hash_before, reason, data_too_big)
+    assert(#log.accesses == 1, "no-op log should have 1 access")
+    assert(machine:get_root_hash() == root_hash_before)
+    machine:verify_send_cmio_response(root_hash_before, reason, data_too_big, root_hash_before, log, root_hash_before)
 end)
 
 -- asserts that an access has the expected key  values
@@ -1331,6 +1405,8 @@ local function test_send_cmio_input_with_different_arguments()
     local data_hash = test_util.merkle_hash(data, 0, cartesi.AR_CMIO_RX_BUFFER_LOG2_SIZE, hash_fn)
     local all_zeros = string.rep("\0", max_rx_buffer_len)
     local all_zeros_hash = test_util.merkle_hash(all_zeros, 0, cartesi.AR_CMIO_RX_BUFFER_LOG2_SIZE, hash_fn)
+    local zero_leaf = string.rep("\0", 1 << cartesi.HASH_TREE_LOG2_WORD_SIZE)
+    local zero_leaf_hash = test_util.merkle_hash(zero_leaf, 0, cartesi.HASH_TREE_LOG2_WORD_SIZE, hash_fn)
     -- prepares and asserts the state before send_cmio_response is called
     local function assert_before_cmio_response_sent(machine)
         machine:write_reg("iflags_Y", 1)
@@ -1349,7 +1425,7 @@ local function test_send_cmio_input_with_different_arguments()
     end
     do_test("send_cmio_response happy path", function(machine)
         assert_before_cmio_response_sent(machine)
-        machine:send_cmio_response(reason, data)
+        machine:send_cmio_response(machine:get_root_hash(), reason, data)
         assert_after_cmio_response_sent(machine)
     end)
     for _, large_data in ipairs({ false, true }) do
@@ -1365,18 +1441,32 @@ local function test_send_cmio_input_with_different_arguments()
                     | (large_data and cartesi.ACCESS_LOG_TYPE_LARGE_DATA or 0)
                 assert_before_cmio_response_sent(machine)
                 local root_hash_before = machine:get_root_hash()
-                local log = machine:log_send_cmio_response(reason, data, log_type)
+                local log = machine:log_send_cmio_response(root_hash_before, reason, data, log_type)
                 assert_after_cmio_response_sent(machine)
                 local root_hash_after = machine:get_root_hash()
                 -- check log
                 local accesses = log.accesses
-                assert(#accesses == 4)
+                assert(#accesses == 5)
                 assert_access(accesses, 1, {
                     type = "read",
                     address = machine:get_reg_address("iflags_Y"),
                     log2_size = 3,
                 })
                 assert_access(accesses, 2, {
+                    type = "write",
+                    address = cartesi.AR_SHADOW_REVERT_ROOT_HASH_START,
+                    log2_size = cartesi.HASH_TREE_LOG2_WORD_SIZE,
+                    read_hash = zero_leaf_hash,
+                    read = large_data and zero_leaf or nil,
+                    written_hash = test_util.merkle_hash(
+                        root_hash_before,
+                        0,
+                        cartesi.HASH_TREE_LOG2_WORD_SIZE,
+                        hash_fn
+                    ),
+                    written = large_data and root_hash_before or nil,
+                })
+                assert_access(accesses, 3, {
                     type = "write",
                     address = cartesi.AR_CMIO_RX_BUFFER_START,
                     log2_size = cartesi.AR_CMIO_RX_BUFFER_LOG2_SIZE,
@@ -1385,18 +1475,27 @@ local function test_send_cmio_input_with_different_arguments()
                     written_hash = data_hash,
                     written = large_data and data or nil,
                 })
-                assert_access(accesses, 3, {
+                assert_access(accesses, 4, {
                     type = "write",
                     address = machine:get_reg_address("htif_fromhost"),
                     log2_size = 3,
                 })
-                assert_access(accesses, 4, {
+                assert_access(accesses, 5, {
                     type = "write",
                     address = machine:get_reg_address("iflags_Y"),
                     log2_size = 3,
                 })
                 -- ask machine to verify state transitions
-                machine:verify_send_cmio_response(reason, data, root_hash_before, log, root_hash_after, log_type, {})
+                machine:verify_send_cmio_response(
+                    root_hash_before,
+                    reason,
+                    data,
+                    root_hash_before,
+                    log,
+                    root_hash_after,
+                    log_type,
+                    {}
+                )
             end
         )
     end
@@ -1408,23 +1507,132 @@ do_test("Dump of log produced by send_cmio_response should match", function(mach
     machine:write_reg("iflags_Y", 1)
     local data = "0123456789"
     local reason = 7
-    local log = machine:log_send_cmio_response(reason, data, cartesi.ACCESS_LOG_TYPE_ANNOTATIONS)
-    local expected_dump = [[
-begin send_cmio_response
-  1: read iflags.Y@0x300(768): 0x1(1)
-  2: write cmio rx buffer@0x60000000(1610612736): hash:"290decd9"(2^5 bytes) -> hash:"555b1f6d"(2^5 bytes)
-  3: write htif.fromhost@0x330(816): 0x0(0) -> 0x70000000a(30064771082)
-  4: write iflags.Y@0x300(768): 0x1(1) -> 0x0(0)
-end send_cmio_response
-]]
+    -- the revert root hash must be the machine root hash, so the leaf write value is matched by a pattern
+    local log =
+        machine:log_send_cmio_response(machine:get_root_hash(), reason, data, cartesi.ACCESS_LOG_TYPE_ANNOTATIONS)
+    local expected_dump_pattern = "begin send_cmio_response\n"
+        .. "  1: read iflags%.Y@0x300%(768%): 0x1%(1%)\n"
+        .. '  2: write revert root hash@0xfe0%(4064%): hash:"290decd9"%(2%^5 bytes%) %-> '
+        .. 'hash:"[0-9a-f]+"%(2%^5 bytes%)\n'
+        .. '  3: write cmio rx buffer@0x60000000%(1610612736%): hash:"290decd9"%(2%^5 bytes%) %-> '
+        .. 'hash:"555b1f6d"%(2%^5 bytes%)\n'
+        .. "  4: write htif%.fromhost@0x330%(816%): 0x0%(0%) %-> 0x70000000a%(30064771082%)\n"
+        .. "  5: write iflags%.Y@0x300%(768%): 0x1%(1%) %-> 0x0%(0%)\n"
+        .. "end send_cmio_response\n"
     local temp_file <close> = test_util.new_temp_file()
-    util.dump_log(log, temp_file)
+    util.print_log(log, temp_file)
     local actual_dump = temp_file:read_all()
     print("Output of log_send_cmio_response dump:")
     print("--------------------------")
     print(actual_dump)
     print("--------------------------")
-    assert(actual_dump == expected_dump, "Dump of uarch_reset_state does not match expected:\n" .. expected_dump)
+    assert(
+        actual_dump:find(expected_dump_pattern),
+        "Dump of send_cmio_response does not match expected pattern:\n" .. expected_dump_pattern
+    )
+end)
+
+do_test("send_cmio_response should check the machine state for advance-state responses", function(machine)
+    local advance_reason = cartesi.HTIF_YIELD_REASON_ADVANCE_STATE
+    local data = "0123456789"
+    local wrong_revert_root_hash = string.rep("\xff", cartesi.HASH_SIZE)
+    -- put the machine in the state that waits for an advance-state input
+    machine:write_reg("iflags_Y", 1)
+    machine:write_reg("htif_tohost_dev", cartesi.HTIF_DEV_YIELD)
+    machine:write_reg("htif_tohost_cmd", cartesi.HTIF_YIELD_CMD_MANUAL)
+    machine:write_reg("htif_tohost_reason", cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED)
+    local root_hash_before = machine:get_root_hash()
+    -- a revert root hash other than the machine root hash is refused
+    local _, err = pcall(machine.send_cmio_response, machine, wrong_revert_root_hash, advance_reason, data)
+    check_error_find(err, "revert root hash does not match the machine root hash")
+    -- the failed call did not change the machine state
+    assert(machine:get_root_hash() == root_hash_before)
+    -- a machine that is not waiting on an rx-accepted manual yield refuses the input
+    machine:write_reg("htif_tohost_reason", cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED)
+    root_hash_before = machine:get_root_hash()
+    _, err = pcall(machine.send_cmio_response, machine, root_hash_before, advance_reason, data)
+    check_error_find(err, "machine is not waiting on an rx-accepted manual yield")
+    assert(machine:get_root_hash() == root_hash_before)
+    -- other response reasons are not checked at all
+    machine:send_cmio_response(wrong_revert_root_hash, cartesi.HTIF_YIELD_REASON_INSPECT_STATE, data)
+    assert(machine:read_reg("iflags_Y") == 0)
+end)
+
+do_test("advance-state response without an rx-accepted manual yield logs as a no-op", function(machine)
+    local advance_reason = cartesi.HTIF_YIELD_REASON_ADVANCE_STATE
+    local data = "0123456789"
+    -- the machine yielded manual, but rejected the previous input
+    machine:write_reg("iflags_Y", 1)
+    machine:write_reg("htif_tohost_dev", cartesi.HTIF_DEV_YIELD)
+    machine:write_reg("htif_tohost_cmd", cartesi.HTIF_YIELD_CMD_MANUAL)
+    machine:write_reg("htif_tohost_reason", cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED)
+    local root_hash_before = machine:get_root_hash()
+    local log = machine:log_send_cmio_response(root_hash_before, advance_reason, data)
+    -- the log contains only the reads that conclude the operation is a no-op
+    assert(#log.accesses == 2, "no-op log should have 2 accesses")
+    assert_access(log.accesses, 1, { type = "read", address = machine:get_reg_address("iflags_Y") })
+    assert_access(log.accesses, 2, { type = "read", address = machine:get_reg_address("htif_tohost") })
+    -- the machine state is unchanged
+    assert(machine:read_reg("iflags_Y") == 1)
+    assert(machine:get_root_hash() == root_hash_before)
+    -- the no-op log verifies with equal root hashes before and after
+    machine:verify_send_cmio_response(root_hash_before, advance_reason, data, root_hash_before, log, root_hash_before)
+end)
+
+do_test("log_send_cmio_response happy path for an advance-state response", function(machine)
+    local advance_reason = cartesi.HTIF_YIELD_REASON_ADVANCE_STATE
+    local data = "0123456789"
+    -- put the machine in the state that waits for an advance-state input
+    machine:write_reg("iflags_Y", 1)
+    machine:write_reg("htif_tohost_dev", cartesi.HTIF_DEV_YIELD)
+    machine:write_reg("htif_tohost_cmd", cartesi.HTIF_YIELD_CMD_MANUAL)
+    machine:write_reg("htif_tohost_reason", cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED)
+    local root_hash_before = machine:get_root_hash()
+    local log = machine:log_send_cmio_response(root_hash_before, advance_reason, data)
+    -- the reads that check the machine state, followed by the writes of the response
+    assert(#log.accesses == 6, "advance-state log should have 6 accesses")
+    assert_access(log.accesses, 1, { type = "read", address = machine:get_reg_address("iflags_Y") })
+    assert_access(log.accesses, 2, { type = "read", address = machine:get_reg_address("htif_tohost") })
+    assert_access(log.accesses, 3, { type = "write", address = cartesi.AR_SHADOW_REVERT_ROOT_HASH_START })
+    assert(machine:read_reg("iflags_Y") == 0)
+    local root_hash_after = machine:get_root_hash()
+    machine:verify_send_cmio_response(root_hash_before, advance_reason, data, root_hash_before, log, root_hash_after)
+end)
+
+do_test("Test unhappy paths of verify_send_cmio_response", function(machine)
+    local advance_reason = cartesi.HTIF_YIELD_REASON_ADVANCE_STATE
+    local data = "0123456789"
+    local function assert_error(expected_error, callback)
+        -- put the machine back in the state that waits for an advance-state input
+        machine:write_reg("iflags_Y", 1)
+        machine:write_reg("htif_tohost_dev", cartesi.HTIF_DEV_YIELD)
+        machine:write_reg("htif_tohost_cmd", cartesi.HTIF_YIELD_CMD_MANUAL)
+        machine:write_reg("htif_tohost_reason", cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED)
+        local root_hash_before = machine:get_root_hash()
+        local log = machine:log_send_cmio_response(root_hash_before, advance_reason, data)
+        local root_hash_after = machine:get_root_hash()
+        callback(log)
+        local _, err = pcall(
+            machine.verify_send_cmio_response,
+            machine,
+            root_hash_before,
+            advance_reason,
+            data,
+            root_hash_before,
+            log,
+            root_hash_after
+        )
+        check_error_find(err, expected_error)
+    end
+    assert_error("too few accesses in log", function(log)
+        log.accesses = { log.accesses[1] }
+    end)
+    assert_error("expected 2nd access to read htif.tohost address", function(log)
+        log.accesses[2].address = 0
+    end)
+    assert_error("expected 1st access to read iflags.Y", function(log)
+        table.remove(log.accesses, 1)
+    end)
 end)
 
 do_test("send_cmio_response with different data sizes", function(machine)
@@ -1459,12 +1667,12 @@ do_test("send_cmio_response with different data sizes", function(machine)
             local data = string.rep("a", case.data_len)
             machine:write_reg("iflags_Y", 1)
             if logging then
-                local log = machine:log_send_cmio_response(reason, data)
-                assert(#log.accesses == 4, string.format("log should have 4 accesses, but it has %s", #log.accesses))
-                assert(log.accesses[2].type == "write", "access 2 should be a write")
-                assert(1 << log.accesses[2].log2_size == case.write_len, "log2_size of write access does not match")
+                local log = machine:log_send_cmio_response(machine:get_root_hash(), reason, data)
+                assert(#log.accesses == 5, string.format("log should have 5 accesses, but it has %s", #log.accesses))
+                assert(log.accesses[3].type == "write", "access 3 should be a write")
+                assert(1 << log.accesses[3].log2_size == case.write_len, "log2_size of write access does not match")
             else
-                machine:send_cmio_response(reason, data)
+                machine:send_cmio_response(machine:get_root_hash(), reason, data)
             end
             local expected_rx_buffer = padded_data(data, case.write_len, "\0")
                 .. string.rep("x", rx_buffer_size - case.write_len)
@@ -1491,18 +1699,18 @@ do_test("send_cmio_response of zero bytes", function(machine)
     machine:write_reg("iflags_Y", 1)
     local reason = 1
     local data = ""
-    machine:send_cmio_response(reason, data)
+    machine:send_cmio_response(machine:get_root_hash(), reason, data)
     local new_rx_buffer = machine:read_memory(cartesi.AR_CMIO_RX_BUFFER_START, rx_buffer_size)
     assert(new_rx_buffer == initial_rx_buffer, "rx_buffer should not have been modified")
     assert(machine:read_reg("iflags_Y") == 0, "iflags.Y should be cleared")
     -- log and verify
     machine:write_reg("iflags_Y", 1)
     local hash_before = machine:get_root_hash()
-    local log = machine:log_send_cmio_response(reason, data)
-    util.dump_log(log, io.stderr)
-    assert(#log.accesses == 3, "log should have 3 accesses")
+    local log = machine:log_send_cmio_response(hash_before, reason, data)
+    util.print_log(log, io.stderr)
+    assert(#log.accesses == 4, "log should have 4 accesses")
     local hash_after = machine:get_root_hash()
-    machine:verify_send_cmio_response(reason, data, hash_before, log, hash_after)
+    machine:verify_send_cmio_response(hash_before, reason, data, hash_before, log, hash_after)
 end)
 
 local function test_cmio_buffers_backed_by_files()
@@ -1602,7 +1810,7 @@ test_util.make_do_test(build_machine, machine_type, {
     local function log_step()
         local log = machine:log_step_uarch(cartesi.ACCESS_LOG_TYPE_ANNOTATIONS)
         local temp_file <close> = test_util.new_temp_file()
-        util.dump_log(log, temp_file)
+        util.print_log(log, temp_file)
         return log, temp_file:read_all()
     end
 
@@ -1943,4 +2151,28 @@ for _, hash_fn in pairs({ "keccak256", "sha256" }) do
     )
 end
 
+do_test("log_step from a rejected input state verifies against the revert root hash", function(machine)
+    local filename = os.tmpname()
+    os.remove(filename) -- log_step requires the file to not exist
+    local deleter = {}
+    setmetatable(deleter, {
+        __gc = function()
+            os.remove(filename)
+        end,
+    })
+    local revert_hash = string.rep("\x5a", cartesi.HASH_SIZE)
+    set_rejected_input_state(machine, revert_hash)
+    local mcycle_before = machine:read_reg("mcycle")
+    local root_hash_before = machine:get_root_hash()
+    machine:log_step(1, filename)
+    -- the machine does not advance while the manual yield is pending
+    assert(machine:read_reg("mcycle") == mcycle_before, "mcycle should not have advanced")
+    assert(machine:get_root_hash() == root_hash_before, "machine state should not have changed")
+    -- the canonical root hash after the step is the revert root hash
+    machine:verify_step(root_hash_before, filename, 1, revert_hash)
+    -- the machine's actual root hash is not accepted
+    local _, err = pcall(machine.verify_step, machine, root_hash_before, filename, 1, root_hash_before)
+    check_error_find(err, "root hash after mismatch")
+end)
+
 print("\n\nAll machine binding tests for type " .. machine_type .. " passed")
diff --git a/tests/lua/spec-backing-stores.lua b/tests/lua/spec-backing-stores.lua
index aaf67614e..5659fd36a 100644
--- a/tests/lua/spec-backing-stores.lua
+++ b/tests/lua/spec-backing-stores.lua
@@ -27,6 +27,7 @@ describe("backing stores", function()
         },
         flash_drive = {
             { -- read/write + backing file
+                start = 0x0080000000000000,
                 backing_store = {
                     data_filename = rw_data_filename,
                 },
diff --git a/tests/lua/spec-cm-cli.lua b/tests/lua/spec-cm-cli.lua
index 38dcb7976..696d303d1 100644
--- a/tests/lua/spec-cm-cli.lua
+++ b/tests/lua/spec-cm-cli.lua
@@ -28,6 +28,7 @@ local describe, it, expect = lester.describe, lester.it, lester.expect
 describe("cartesi-machine CLI", function()
     local cartesi = require("cartesi")
     local evmu = require("cartesi.evmu")
+    local hash_tree = require("cartesi.hash-tree")
 
     local function zeros(n)
         return string.rep("\0", n)
@@ -75,11 +76,6 @@ describe("cartesi-machine CLI", function()
         })
     end
 
-    local function read_bin(path)
-        local f <close> = assert(io.open(path, "rb"))
-        return f:read("*a")
-    end
-
     -- Interpreter used for sub-invocations of cartesi-machine.lua.
     -- Under coverage (coverage=yes), the Makefile exports LUA_CLI as
     -- "lua5.4 -lluacov" so that cartesi-machine.lua children are measured.
@@ -203,11 +199,11 @@ describe("cartesi-machine CLI", function()
     --       run_fail() for a version mismatch to confirm the non-zero exit path.
     -- -------------------------------------------------------------------------
     it("early exit options", function()
-        local rc, stdout = run({ "-h" })
-        expect.equal(rc, 0)
-        expect.truthy(stdout:find("cartesi%-machine"))
+        -- -h is no longer help; it is the docker-style hostname short option.
+        -- A bare -h is rejected with a hint pointing at --help.
+        run_fail({ "-h" }, "did you mean %-%-help")
 
-        rc, stdout = run({ "--help" })
+        local rc, stdout = run({ "--help" })
         expect.equal(rc, 0)
         expect.truthy(stdout:find("cartesi%-machine"))
 
@@ -225,6 +221,14 @@ describe("cartesi-machine CLI", function()
         -- assert-version with current major.minor should succeed and continue
         local ver = string.format("%d.%d", cartesi.VERSION_MAJOR, cartesi.VERSION_MINOR)
         run_ok({ "--assert-version=" .. ver, "--max-mcycle=0", "--no-init-splash", "--quiet" })
+
+        -- --bash-completion emits a bash-completion script and exits.  When it
+        -- is the only argument the CLI services it before require("cartesi"),
+        -- so it must run from cartesi.bash without the compiled module.
+        rc, stdout = run({ "--bash-completion" })
+        expect.equal(rc, 0)
+        expect.truthy(stdout:find("bash completion for cartesi%-machine"))
+        expect.truthy(stdout:find("_cm_flag_kind"))
     end)
 
     -- -------------------------------------------------------------------------
@@ -343,6 +347,18 @@ describe("cartesi-machine CLI", function()
         expect.equal(found_data.length, 0x10000)
         expect.equal(found_data.read_only, true)
 
+        -- positional filename: --flash-drive=<file> equals data_filename:<file>
+        cfg = config_for({ "--flash-drive=label:pos," .. flash_tmp })
+        local found_pos
+        for _, fd in ipairs(cfg.flash_drive) do
+            if fd.label == "pos" then
+                found_pos = fd
+                break
+            end
+        end
+        expect.truthy(found_pos)
+        expect.equal(found_pos.backing_store.data_filename, flash_tmp)
+
         -- --no-root-flash-drive + replacement
         cfg = config_for({
             "--no-root-flash-drive",
@@ -456,6 +472,16 @@ describe("cartesi-machine CLI", function()
         })
         expect.truthy(not cfg.dtb.init:find("/mnt/empty"))
 
+        -- Auto-detect failure: with neither an explicit length nor a backing
+        -- file there is nothing to auto-detect the length from.
+        run_fail({
+            "--no-root-flash-drive",
+            "--flash-drive=label:f",
+            "--max-mcycle=0",
+            "--no-init-splash",
+            "--quiet",
+        }, "unable to auto%-detect length of flash drive")
+
         -- --hash-tree: hash_function and phtc_size variations
         cfg = config_for({ "--hash-tree=hash_function:sha256" })
         expect.equal(cfg.hash_tree.hash_function, "sha256")
@@ -528,15 +554,42 @@ describe("cartesi-machine CLI", function()
         })
         expect.truthy(not cfg.dtb.init:find("chmod 0444"))
 
-        -- Auto-assigned start: NVRAMs share the drive pool with flash drives.
-        -- The default root flash drive consumes slot 0, so the first --nvram
-        -- without start lands at slot 1 and the second at slot 2.
+        -- Auto-assigned start: a drive without an explicit start is placed past
+        -- the end of RAM (RAM length rounded up to the next power of two) and
+        -- aligned to its own length (also rounded up to the next power of two).
+        -- Flash drives and NVRAMs share a single pool, with flash drives placed
+        -- first.  Here RAM length 0x5000000 rounds up to 0x8000000, so the flash
+        -- drive lands at AR_RAM_START + 0x8000000.  The NVRAM length 0x18000
+        -- rounds up to 0x20000, bumping its start to the next 0x20000-aligned
+        -- address and leaving a gap after the smaller flash drive.
         cfg = config_for({
-            "--nvram=label:auto1,length:0x1000",
-            "--nvram=label:auto2,length:0x1000",
+            "--ram-length=0x5000000",
+            "--no-root-flash-drive",
+            "--flash-drive=label:f,length:0x10000",
+            "--nvram=label:n,length:0x18000",
         })
-        expect.equal(cfg.nvram[1].start, cartesi.AR_DRIVE_START + cartesi.AR_DRIVE_OFFSET)
-        expect.equal(cfg.nvram[2].start, cartesi.AR_DRIVE_START + 2 * cartesi.AR_DRIVE_OFFSET)
+        expect.equal(cfg.flash_drive[1].start, cartesi.AR_RAM_START + 0x8000000)
+        expect.equal(cfg.nvram[1].start, cartesi.AR_RAM_START + 0x8000000 + 0x20000)
+        expect.equal(cfg.nvram[1].length, 0x18000)
+
+        -- Auto-detect failure: with neither an explicit length nor a backing
+        -- file there is nothing to auto-detect the length from.
+        run_fail({
+            "--nvram=label:n",
+            "--max-mcycle=0",
+            "--no-init-splash",
+            "--quiet",
+        }, "unable to auto%-detect length of nvram")
+
+        -- Auto-detect failure: the start cannot be auto-detected when the length,
+        -- rounded up to a power of two, leaves no aligned address that fits it.
+        run_fail({
+            "--no-root-flash-drive",
+            "--nvram=label:big,length:0x8000000000000000",
+            "--max-mcycle=0",
+            "--no-init-splash",
+            "--quiet",
+        }, "no address space to auto%-detect start of nvram")
     end)
 
     -- -------------------------------------------------------------------------
@@ -610,8 +663,8 @@ describe("cartesi-machine CLI", function()
     --       Mac OS where that device type is not supported.
     -- -------------------------------------------------------------------------
     it("virtio network options", function()
-        -- --virtio-9p
-        local cfg = config_for({ "--virtio-9p=mytag:/tmp" })
+        -- --virtio-9p (key:value long form)
+        local cfg = config_for({ "--virtio-9p=tag:mytag,host_directory:/tmp" })
         expect.truthy(cfg.virtio and #cfg.virtio > 0)
         local found_p9fs
         for _, v in ipairs(cfg.virtio) do
@@ -657,8 +710,8 @@ describe("cartesi-machine CLI", function()
         end
         expect.truthy(found_net)
 
-        -- --port-forward (requires --virtio-net=user or --network)
-        cfg = config_for({ "--network", "--port-forward=18080:80" })
+        -- -p docker short form (attached value), requires --network
+        cfg = config_for({ "--network", "-p=18080:80" })
         local net_entry
         for _, v in ipairs(cfg.virtio) do
             if v.type == "net-user" then
@@ -670,8 +723,8 @@ describe("cartesi-machine CLI", function()
         expect.equal(net_entry.hostfwd[1].host_port, 18080)
         expect.equal(net_entry.hostfwd[1].guest_port, 80)
 
-        -- --volume (implies p9fs + sync-init-date + iunrep)
-        cfg = config_for({ "--volume=/tmp:/mnt" })
+        -- -v docker short form (attached value): implies p9fs + iunrep
+        cfg = config_for({ "-v=/tmp:/mnt" })
         found_p9fs = false
         for _, v in ipairs(cfg.virtio) do
             if v.type == "p9fs" then
@@ -694,10 +747,11 @@ describe("cartesi-machine CLI", function()
         expect.truthy(found_console)
         expect.equal(cfg.processor.registers.iunrep, 1)
 
-        -- --port-forward with explicit IPv4 host/guest addresses and UDP protocol
+        -- --port-forward long key:value form with explicit IPv4 host/guest
+        -- addresses ([ip:]port values) and UDP protocol
         cfg = config_for({
             "--network",
-            "--port-forward=127.0.0.1:10.0.2.15:18081:81:udp",
+            "--port-forward=host_address:127.0.0.1:18081,guest_address:10.0.2.15:81,protocol:udp",
         })
         local net_entry2
         for _, v in ipairs(cfg.virtio) do
@@ -802,12 +856,13 @@ describe("cartesi-machine CLI", function()
     -- -------------------------------------------------------------------------
     -- Hashing and proof options
     --
-    -- What: --initial-hash, --final-hash, --periodic-hashes (two-arg and
-    --       single-arg forms), --initial-proof, --final-proof,
-    --       --dense-uarch-hashes, and --dump-address-ranges.
+    -- What: --initial-hash, --final-hash, --periodic-hashes (positional period
+    --       with and without a start: sub-key), --initial-proof, --final-proof,
+    --       --dense-uarch-hashes, and --dump-memory-ranges.
     -- How:  run_ok() each flag; regex-match 64-hex-digit lines in stderr to
     --       count hash emissions; open proof output files and assert they are
-    --       non-empty.
+    --       non-empty.  Format-specific proof assertions live in the dedicated
+    --       "proof dump options" test below.
     -- -------------------------------------------------------------------------
     it("hashing options", function()
         -- --initial-hash and --final-hash emit hashes to stderr as "<mcycle>: <hex64>"
@@ -821,7 +876,7 @@ describe("cartesi-machine CLI", function()
         expect.truthy(hash_count >= 2)
 
         -- --periodic-hashes
-        _, err = run_ok({ "--periodic-hashes=1,0", "--max-mcycle=2", "--no-init-splash", "--quiet" })
+        _, err = run_ok({ "--periodic-hashes=1,start:0", "--max-mcycle=2", "--no-init-splash", "--quiet" })
         hash_count = 0
         for line in err:gmatch("[^\n]+") do
             if line:match("^%d+: [0-9a-f]+$") and #line:match("[0-9a-f]+$") == 64 then
@@ -830,59 +885,179 @@ describe("cartesi-machine CLI", function()
         end
         expect.truthy(hash_count >= 1)
 
-        -- --initial-proof / --final-proof written to files
-        local _ <close>, proof_file = scope_temp_pathname()
-        run_ok({
-            "--initial-proof=address:0x80000000,log2_size:12,filename:" .. proof_file,
-            "--max-mcycle=0",
-            "--no-init-splash",
-            "--quiet",
-        })
-        expect.truthy(#filesystem.read_file(proof_file) > 10)
-
-        -- --final-proof written to a file
-        local _ <close>, final_proof_file = scope_temp_pathname()
-        run_ok({
-            "--final-proof=address:0x80000000,log2_size:12,filename:" .. final_proof_file,
-            "--max-mcycle=0",
-            "--no-init-splash",
-            "--quiet",
-        })
-        expect.truthy(#filesystem.read_file(final_proof_file) > 10)
-
-        -- --periodic-hashes=N single-argument form (no start offset, implies start=N)
+        -- --periodic-hashes=<period> bare positional form (start defaults to 0)
         run_ok({ "--periodic-hashes=10", "--max-mcycle=0", "--no-init-splash", "--quiet" })
 
-        -- --periodic-hashes=<period>,<start> with start > 0: exercises the
+        -- --periodic-hashes=<period>,start:<n> with start > 0: exercises the
         -- next_hash_mcycle = periodic_hashes_start branch.
-        run_ok({ "--periodic-hashes=10,5", "--max-mcycle=0", "--no-init-splash", "--quiet" })
+        run_ok({ "--periodic-hashes=10,start:5", "--max-mcycle=0", "--no-init-splash", "--quiet" })
 
         -- --dense-uarch-hashes=N single-argument form
         run_ok({ "--dense-uarch-hashes=1", "--max-mcycle=0", "--no-init-splash", "--quiet" })
 
-        -- --dump-address-ranges=<dir>: writes one <start>--<length>.bin per address range under <dir>.
+        -- --dump-memory-ranges=<dir>: writes one <start>--<length>.bin per memory range under <dir>.
         -- The CLI creates the directory; we only own the cleanup.
         local dump_dir = filesystem.temp_pathname()
         local _ <close> = utils.scope_exit(function()
             os.remove(dump_dir)
         end)
-        run_ok({ "--dump-address-ranges=" .. dump_dir, "--max-mcycle=0", "--no-init-splash", "--quiet" })
+        run_ok({ "--dump-memory-ranges=" .. dump_dir, "--max-mcycle=0", "--no-init-splash", "--quiet" })
         local cfg = config_for({})
         local m <close> = cartesi.machine(cfg)
         for _, v in ipairs(m:get_address_ranges()) do
             local filename = dump_dir .. "/" .. string.format("%016x--%016x.bin", v.start, v.length)
             local f = io.open(filename, "r")
-            assert(f, "--dump-address-ranges: expected file not created: " .. filename)
-            f:close()
-            assert(os.remove(filename))
+            if v.is_memory then
+                assert(f, "--dump-memory-ranges: expected file not created: " .. filename)
+                f:close()
+                assert(os.remove(filename))
+            else
+                assert(not f, "--dump-memory-ranges: file created for device range: " .. filename)
+            end
+        end
+    end)
+
+    -- -------------------------------------------------------------------------
+    -- Proof dump options
+    --
+    -- What: --initial-proof / --final-proof emit a Lua table (loadable with
+    --       load/dofile) by default, or JSON validated against the "Proof"
+    --       schema when format:json is given.  Each option is exercised both
+    --       writing to a file (filename:<path>) and writing to stdout (no
+    --       filename:), in both formats.
+    -- How:  For Lua proofs, load() the emitted text and assert the proof shape;
+    --       for JSON proofs, round-trip through cartesi.fromjson(s, "Proof")
+    --       (which re-validates against the schema) and assert the same shape.
+    --       A proof of a 2^12 region under a 2^64 tree has 64-12 = 52 sibling
+    --       hashes, so that count doubles as a structural sanity check.
+    -- -------------------------------------------------------------------------
+    it("proof dump options", function()
+        local ADDR = 0x80000000 -- target address requested via address:
+        local LOG2 = 12 -- log2 of the target size requested via log2_size:
+
+        -- Assert the proof fields that the Lua and JSON encodings must share.
+        local function check_proof(p)
+            expect.equal(p.log2_root_size, 64)
+            expect.equal(p.log2_target_size, LOG2)
+            expect.equal(p.target_address, ADDR)
+            expect.equal(#p.sibling_hashes, 64 - LOG2) -- one sibling per level between target and root
+            expect.truthy(p.root_hash ~= nil) -- presence only; hash values are not compared
+            expect.truthy(p.target_hash ~= nil)
+        end
+
+        -- --initial-proof / --final-proof with filename:<path>: the file holds a
+        -- Lua chunk that returns the proof table, so dofile() yields the proof.
+        for _, opt in ipairs({ "--initial-proof", "--final-proof" }) do
+            local _ <close>, proof_file = scope_temp_pathname()
+            run_ok({
+                opt .. "=address:" .. ADDR .. ",log2_size:" .. LOG2 .. ",filename:" .. proof_file,
+                "--max-mcycle=0",
+                "--no-init-splash",
+                "--quiet",
+            })
+            check_proof(dofile(proof_file))
+        end
+
+        -- --initial-proof without filename: the same Lua chunk goes to stdout.
+        local stdout = run_ok({
+            "--initial-proof=address:" .. ADDR .. ",log2_size:" .. LOG2,
+            "--max-mcycle=0",
+            "--no-init-splash",
+            "--quiet",
+        })
+        check_proof(assert(load(stdout))()) -- assert() surfaces a load() compile error
+
+        -- --initial-proof / --final-proof with format:json and filename:<path>:
+        -- the file holds JSON that parses against the "Proof" schema.
+        for _, opt in ipairs({ "--initial-proof", "--final-proof" }) do
+            local _ <close>, json_file = scope_temp_pathname()
+            run_ok({
+                opt .. "=address:" .. ADDR .. ",log2_size:" .. LOG2 .. ",filename:" .. json_file .. ",format:json",
+                "--max-mcycle=0",
+                "--no-init-splash",
+                "--quiet",
+            })
+            check_proof(cartesi.fromjson(filesystem.read_file(json_file), "Proof"))
         end
+
+        -- --final-proof with format:json and no filename: the same JSON goes to stdout.
+        stdout = run_ok({
+            "--final-proof=address:" .. ADDR .. ",log2_size:" .. LOG2 .. ",format:json",
+            "--max-mcycle=0",
+            "--no-init-splash",
+            "--quiet",
+        })
+        check_proof(cartesi.fromjson(stdout, "Proof"))
+    end)
+
+    -- -------------------------------------------------------------------------
+    -- Proof dump by drive label
+    --
+    -- What: The proof options accept label:<label> in place of
+    --       address+log2_size, resolving the target region from the flash
+    --       drive or nvram of that label in the materialized config.  The
+    --       proof's target_address comes from the drive's start and its
+    --       log2_target_size from ilog2(length).
+    -- How:  Run with a labeled flash drive and a labeled nvram, request a
+    --       proof by each label (covering both the Lua and JSON formats and
+    --       the flash-drive-then-nvram lookup order), and assert the derived
+    --       address/log2_size.  An unknown label is a hard error.
+    -- -------------------------------------------------------------------------
+    it("proof dump by drive label", function()
+        local FLASH_START = 0x80000020000000
+        local FLASH_LEN = 0x10000 -- 2^16
+        local NVRAM_START = 0x70000000
+        local NVRAM_LEN = 0x1000 -- 2^12
+
+        -- Flash drive, Lua format: --initial-proof=label:<flash> resolves to the
+        -- flash drive's start and ilog2(length).  Regression guard for the typo
+        -- "drive = driver or ...", which discarded the flash-drive lookup so
+        -- that only nvram was ever searched.
+        local stdout = run_ok({
+            "--flash-drive=label:pdata,start:" .. string.format("0x%x", FLASH_START) .. ",length:" .. string.format(
+                "0x%x",
+                FLASH_LEN
+            ) .. ",mke2fs",
+            "--initial-proof=label:pdata",
+            "--max-mcycle=0",
+            "--no-init-splash",
+            "--quiet",
+        })
+        local p = assert(load(stdout))()
+        expect.equal(p.target_address, FLASH_START)
+        expect.equal(p.log2_target_size, 16) -- ilog2(FLASH_LEN)
+
+        -- NVRAM, JSON format: --final-proof=label:<nvram>,format:json falls
+        -- through to the nvram lookup and resolves the same way.
+        stdout = run_ok({
+            "--nvram=label:pnv,start:" .. string.format("0x%x", NVRAM_START) .. ",length:" .. string.format(
+                "0x%x",
+                NVRAM_LEN
+            ),
+            "--final-proof=label:pnv,format:json",
+            "--max-mcycle=0",
+            "--no-init-splash",
+            "--quiet",
+        })
+        local pj = cartesi.fromjson(stdout, "Proof")
+        expect.equal(pj.target_address, NVRAM_START)
+        expect.equal(pj.log2_target_size, 12) -- ilog2(NVRAM_LEN)
+
+        -- Unknown label: no flash drive or nvram carries it, so the CLI must
+        -- fail with the "not found" message instead of emitting a proof.
+        run_fail({
+            "--initial-proof=label:nosuch",
+            "--max-mcycle=0",
+            "--no-init-splash",
+            "--quiet",
+        }, "flash%-drive or nvram not found with label nosuch")
     end)
 
     -- -------------------------------------------------------------------------
     -- Persistence round-trip options
     --
-    -- What: --store-config / --load-config, --store-json-config /
-    --       --load-json-config (including bare to-stdout forms), --store,
+    -- What: --store-config / --load-config (Lua and JSON via format: sub-key or
+    --       .json extension, including bare to-stdout forms), --store,
     --       --load, --store=<dir>/%h (hash-substituted path), --create,
     --       --store sharing:all, --load sharing:all, and --load clone:<src>.
     -- How:  Each store flag is run, then the produced file or directory is
@@ -909,26 +1084,45 @@ describe("cartesi-machine CLI", function()
         expect.equal(cfg2.hash_tree.hash_function, "sha256")
         expect.equal(cfg2.ram.length, (64 * 1024 * 1024))
 
-        -- --store-json-config to file and --load-json-config round-trip
+        -- JSON via explicit format: sub-key; --load-config reads it back with
+        -- the matching format: sub-key. The filename here has no extension, so
+        -- format: is what selects JSON.
         local _ <close>, json_file = scope_temp_pathname()
         run_ok({
             "--hash-tree=hash_function:sha256",
             "--max-mcycle=0",
             "--no-init-splash",
             "--quiet",
-            "--store-json-config=" .. json_file,
+            "--store-config=" .. json_file .. ",format:json",
         })
         expect.truthy(filesystem.read_file(json_file):find('"sha256"'))
 
-        local cfg3 = config_for({ "--load-json-config=" .. json_file })
+        local cfg3 = config_for({ "--load-config=" .. json_file .. ",format:json" })
         expect.equal(cfg3.hash_tree.hash_function, "sha256")
 
-        -- --store-config to stdout (bare form)
+        -- JSON via .json filename extension (no explicit format:), round-tripped
+        -- by --load-config which also infers JSON from the extension.
+        local json_ext_file = filesystem.temp_pathname() .. ".json"
+        local _ <close> = utils.scope_exit(function()
+            os.remove(json_ext_file)
+        end)
+        run_ok({
+            "--hash-tree=hash_function:sha256",
+            "--max-mcycle=0",
+            "--no-init-splash",
+            "--quiet",
+            "--store-config=" .. json_ext_file,
+        })
+        expect.truthy(filesystem.read_file(json_ext_file):find('"sha256"'))
+        local cfg_ext = config_for({ "--load-config=" .. json_ext_file })
+        expect.equal(cfg_ext.hash_tree.hash_function, "sha256")
+
+        -- --store-config to stdout (bare form): Lua
         local stdout = run_ok({ "--max-mcycle=0", "--no-init-splash", "--quiet", "--store-config" })
         expect.truthy(stdout:find("return"))
 
-        -- --store-json-config to stdout (bare form)
-        stdout = run_ok({ "--max-mcycle=0", "--no-init-splash", "--quiet", "--store-json-config" })
+        -- --store-config to stdout in JSON via format: sub-key (no filename)
+        stdout = run_ok({ "--max-mcycle=0", "--no-init-splash", "--quiet", "--store-config=format:json" })
         expect.truthy(stdout:find('"ram"'))
 
         -- --store=<dir>: machine stored at that path
@@ -1350,16 +1544,23 @@ describe("cartesi-machine CLI", function()
         -- Malformed --port-forward
         run_fail({ "--network", "--port-forward=not-a-port" }, nil)
 
-        -- log2_size < 3 in --initial-proof
+        -- log2_size below cartesi.HASH_TREE_LOG2_WORD_SIZE is rejected by both
+        -- the Lua-table and JSON proof options, with the bound named in stderr.
+        local min_msg = "log2_size must be at least " .. cartesi.HASH_TREE_LOG2_WORD_SIZE
+        local too_small = cartesi.HASH_TREE_LOG2_WORD_SIZE - 1
+        run_fail({
+            "--initial-proof=address:0x80000000,log2_size:" .. too_small,
+            "--max-mcycle=0",
+        }, min_msg)
         run_fail({
-            "--initial-proof=address:0x80000000,log2_size:2",
+            "--initial-proof=address:0x80000000,log2_size:" .. too_small .. ",format:json",
             "--max-mcycle=0",
-        }, "log2_size must be at least 3")
+        }, min_msg)
 
         -- --gdb conflicts with --periodic-hashes
         run_fail({
             "--gdb=127.0.0.1:19234",
-            "--periodic-hashes=100,0",
+            "--periodic-hashes=100,start:0",
             "--max-mcycle=0",
             "--no-init-splash",
             "--quiet",
@@ -1368,23 +1569,20 @@ describe("cartesi-machine CLI", function()
         -- --assert-rolling-template: exits non-zero when machine is not a rolling template
         run_fail({ "--assert-rolling-template", "--max-mcycle=0", "--no-init-splash", "--quiet" }, nil)
 
-        -- --port-forward with a 3-octet value: matches the pattern [0-9:.]+
-        -- but is not a valid IP, port number, or protocol, so handle_port_forward_option
-        -- reaches the error() at line 1036.
-        -- --virtio-net=user must precede it to satisfy the virtio_net_user_config assert.
+        -- --port-forward with a bare 3-octet value: not a key:value sub-option,
+        -- so it is rejected as an unknown option.
         run_fail({
             "--virtio-net=user",
             "--port-forward=1.2.3",
             "--max-mcycle=0",
             "--no-init-splash",
             "--quiet",
-        }, "malformed")
+        }, "unknown option")
 
-        -- Malformed suffixes of options with optional '=' values: the handler
-        -- returns false, the catchall rejects "unrecognized option".
+        -- Malformed suffixes of options with optional values: no entry matches
+        -- the suffixed name, so the catch-all rejects "unrecognized option".
         run_fail({ "--remote-forkXXX" }, nil)
         run_fail({ "--store-configXXX" }, nil)
-        run_fail({ "--store-json-configXXX" }, nil)
 
         -- --gdb= (empty value) is rejected; bare --gdb combined with --periodic-hashes
         -- exercises the default-address branch and trips the "not supported when
@@ -1392,7 +1590,7 @@ describe("cartesi-machine CLI", function()
         run_fail({ "--gdb=" }, nil)
         run_fail({
             "--gdb",
-            "--periodic-hashes=100,0",
+            "--periodic-hashes=100,start:0",
             "--max-mcycle=0",
             "--no-init-splash",
             "--quiet",
@@ -1422,16 +1620,17 @@ describe("cartesi-machine CLI", function()
     -- Step-logging and uarch options
     --
     -- What: --log-step, --log-step-uarch, --log-reset-uarch, --max-uarch-cycle,
-    --       --auto-reset-uarch, and --dense-uarch-hashes=len,start.
+    --       --auto-reset-uarch, and --dense-uarch-hashes (positional count with
+    --       a start: sub-key).
     -- How:  run_ok() each flag; for --log-step also open the output file and
     --       assert it is non-empty to confirm the log was written.
     -- -------------------------------------------------------------------------
     it("log step options", function()
         local _ <close>, log_file = scope_temp_pathname()
 
-        -- --log-step=N,<file>
+        -- --log-step=<file>,count:N
         run_ok({
-            "--log-step=1," .. log_file,
+            "--log-step=" .. log_file .. ",count:1",
             "--max-mcycle=1",
             "--no-init-splash",
             "--quiet",
@@ -1464,8 +1663,8 @@ describe("cartesi-machine CLI", function()
         -- --auto-reset-uarch
         run_ok({ "--auto-reset-uarch", "--max-mcycle=0", "--no-init-splash", "--quiet" })
 
-        -- --dense-uarch-hashes=<length>,<start>
-        run_ok({ "--dense-uarch-hashes=1,0", "--max-mcycle=0", "--no-init-splash", "--quiet" })
+        -- --dense-uarch-hashes=<count>,start:<n>
+        run_ok({ "--dense-uarch-hashes=1,start:0", "--max-mcycle=0", "--no-init-splash", "--quiet" })
     end)
 
     -- -------------------------------------------------------------------------
@@ -1500,6 +1699,49 @@ describe("cartesi-machine CLI", function()
         run_ok({ "--console-io=input_source:from_null", "-it", "--max-mcycle=1", "--no-init-splash", "--quiet" })
     end)
 
+    -- -------------------------------------------------------------------------
+    -- Short-option value forms and option dispatch
+    --
+    -- What: A value-taking short option accepts both -x=value and the docker
+    --       space form -x value; a long value option does not consume the next
+    --       argument (it requires =).
+    -- How:  Build a config with --store-config so positionals are not relocated,
+    --       comparing the space and attached forms of -v; run_fail() the bare
+    --       long form to confirm it is rejected.
+    -- -------------------------------------------------------------------------
+    it("short-option value forms", function()
+        -- Build a config from literal args (no positional relocation), so the
+        -- "-v <value>" space form reaches the CLI as two separate arguments.
+        local function config_from(flags)
+            local _ <close>, tmp = scope_temp_pathname()
+            local all = {} -- caller flags first, then the fixed run/store flags
+            for _, f in ipairs(flags) do
+                all[#all + 1] = f
+            end
+            for _, f in ipairs({ "--max-mcycle=0", "--no-init-splash", "--quiet", "--store-config=" .. tmp }) do
+                all[#all + 1] = f
+            end
+            run_ok(all)
+            return dofile(tmp) -- load the stored Lua config before tmp is closed
+        end
+        local function has_p9fs(cfg) -- true when cfg.virtio holds a "p9fs" entry
+            for _, v in ipairs(cfg.virtio or {}) do -- tolerate a config without virtio
+                if v.type == "p9fs" then
+                    return true
+                end
+            end
+            return false
+        end
+
+        -- -v space form and -v= attached form both add the p9fs volume.
+        expect.truthy(has_p9fs(config_from({ "-v", "/tmp:/mnt" })))
+        expect.truthy(has_p9fs(config_from({ "-v=/tmp:/mnt" })))
+
+        -- A long value option requires '='; the bare form does not swallow the
+        -- next argument, so it is rejected as unrecognized.
+        run_fail({ "--ram-length", "64Mi" }, "unrecognized option")
+    end)
+
     -- -------------------------------------------------------------------------
     -- Full-guest rollup flow: advance + inspect with ioctl-echo-loop
     --
@@ -1521,9 +1763,15 @@ describe("cartesi-machine CLI", function()
                 prefix .. "-input-1.bin",
                 prefix .. "-query.bin",
                 prefix .. "-out-0-0.bin",
-                prefix .. "-out-1-0.bin",
+                prefix .. "-out-0-1.bin",
+                prefix .. "-out-1-2.bin",
+                prefix .. "-out-1-3.bin",
                 prefix .. "-outh-0.bin",
                 prefix .. "-outh-1.bin",
+                prefix .. "-oproof-0-0.json",
+                prefix .. "-oproof-1-0.json",
+                prefix .. "-oproof-2-1.json",
+                prefix .. "-oproof-3-1.json",
                 prefix .. "-rep-0-0.bin",
                 prefix .. "-rep-1-0.bin",
                 prefix .. "-qrep-0.bin",
@@ -1543,12 +1791,15 @@ describe("cartesi-machine CLI", function()
                 .. "output:"
                 .. prefix
                 .. "-out-%i-%o.bin,"
+                .. "output_proof:"
+                .. prefix
+                .. "-oproof-%o-%i.json,"
                 .. "report:"
                 .. prefix
                 .. "-rep-%i-%o.bin,"
                 .. "output_hashes_root_hash:"
                 .. prefix
-                .. "-outh-%i.bin",
+                .. "-outh-%i.bin,output_hashes_root_hash_proof:",
             "--cmio-inspect-state=query:" .. prefix .. "-query.bin," .. "report:" .. prefix .. "-qrep-%o.bin",
             "--no-rollback",
             "--assert-rolling-template",
@@ -1559,14 +1810,190 @@ describe("cartesi-machine CLI", function()
             "ioctl-echo-loop --vouchers=1 --notices=1 --reports=1",
         })
 
+        -- Each input emits one voucher (output 0) then one notice (output 1). Both inputs are
+        -- accepted, so "%o" is the global output index: input 0 gives 0 and 1, input 1 gives 2 and 3.
         local voucher_sig = "Voucher(address destination, uint256 value, bytes payload)"
-        local out00 = evmu.decode_calldata(voucher_sig, read_bin(prefix .. "-out-0-0.bin"), "raw")
+        local out00 = evmu.decode_calldata(voucher_sig, filesystem.read_file(prefix .. "-out-0-0.bin"), "raw")
         expect.equal(out00.payload, "hello")
-        local out10 = evmu.decode_calldata(voucher_sig, read_bin(prefix .. "-out-1-0.bin"), "raw")
-        expect.equal(out10.payload, "world")
+        local out12 = evmu.decode_calldata(voucher_sig, filesystem.read_file(prefix .. "-out-1-2.bin"), "raw")
+        expect.equal(out12.payload, "world")
         assert(io.open(prefix .. "-outh-0.bin", "r"), "no output-hash for input 0")
         assert(io.open(prefix .. "-outh-1.bin", "r"), "no output-hash for input 1")
-        expect.equal(read_bin(prefix .. "-qrep-0.bin"), "inspect-me")
+        expect.equal(filesystem.read_file(prefix .. "-qrep-0.bin"), "inspect-me")
+
+        -- Every output proof must verify against the outputs root of the last accepted input (the
+        -- final epoch root), and its target must hash the saved output bytes. A passing run already
+        -- cross-checked that root against the guest via check_output_hashes_root_hash.
+        local final_root = filesystem.read_file(prefix .. "-outh-1.bin")
+        local outputs = {
+            { o = 0, i = 0, file = "-out-0-0.bin" },
+            { o = 1, i = 0, file = "-out-0-1.bin" },
+            { o = 2, i = 1, file = "-out-1-2.bin" },
+            { o = 3, i = 1, file = "-out-1-3.bin" },
+        }
+        for _, o in ipairs(outputs) do
+            local proof =
+                cartesi.fromjson(filesystem.read_file(string.format("%s-oproof-%d-%d.json", prefix, o.o, o.i)), "Proof")
+            expect.equal(proof.log2_root_size, cartesi.CMIO_LOG2_MAX_OUTPUT_COUNT)
+            expect.equal(proof.log2_target_size, 0)
+            expect.equal(proof.target_address, o.o)
+            expect.equal(proof.root_hash, final_root)
+            expect.equal(proof.target_hash, cartesi.keccak256(filesystem.read_file(prefix .. o.file)))
+            hash_tree.verify_slice(proof)
+        end
+    end)
+
+    -- -------------------------------------------------------------------------
+    -- Output-proof serialization format
+    --
+    -- What: An output_proof file named *.lua holds a Lua chunk by default
+    --       (round-trip via load), and the format sub-option forces the
+    --       content regardless of the filename extension.
+    -- How:  Advance one accepted voucher writing proofs two ways: the default
+    --       (Lua, read back with load) and format:json into a .lua-named file
+    --       (read back with fromjson; load must fail on it). Both must verify.
+    -- -------------------------------------------------------------------------
+    it("output proof format", function()
+        local prefix = filesystem.temp_pathname() -- common prefix of every file this test touches
+        local _ <close> = utils.scope_exit(function() -- cleanup callback, tied to this scope through <close>
+            for _, p in ipairs({
+                prefix .. "-input-0.bin",
+                prefix .. "-out-0-0.bin",
+                prefix .. "-lua-0-0.lua",
+                prefix .. "-json-0-0.lua",
+            }) do
+                os.remove(p)
+            end
+        end)
+        filesystem.write_file(prefix .. "-input-0.bin", encode_advance(0, "hello"))
+
+        -- This test inspects only the output proof files. Disable output_hashes_root_hash and
+        -- output_hashes_root_hash_proof so their cwd-relative defaults are not written (a stray
+        -- relative write fails on a read-only CI working directory).
+        run_ok({
+            "--cmio-advance-state=input:"
+                .. prefix
+                .. "-input-%i.bin,"
+                .. "input_index_begin:0,input_index_end:1,"
+                .. "output:"
+                .. prefix
+                .. "-out-%i-%o.bin,"
+                .. "output_hashes_root_hash:,output_hashes_root_hash_proof:," -- empty value disables the file
+                .. "output_proof:"
+                .. prefix
+                .. "-lua-%o-%i.lua", -- no format sub-option: this run exercises the default
+            "--no-rollback",
+            "--assert-rolling-template",
+            "--max-mcycle=2000000000",
+            "--no-init-splash",
+            "--quiet",
+            "--",
+            "ioctl-echo-loop --vouchers=1 --notices=0 --reports=0",
+        })
+
+        -- The default proof is a Lua chunk returning the Proof table, with raw-byte hashes (loaded as text, empty env).
+        local lua_proof = assert(load(filesystem.read_file(prefix .. "-lua-0-0.lua"), "proof", "t", {}))()
+        expect.equal(lua_proof.target_address, 0)
+        expect.equal(lua_proof.log2_root_size, cartesi.CMIO_LOG2_MAX_OUTPUT_COUNT)
+        expect.equal(lua_proof.target_hash, cartesi.keccak256(filesystem.read_file(prefix .. "-out-0-0.bin")))
+        hash_tree.verify_slice(lua_proof) -- presumably raises on an invalid proof (its result is not checked)
+
+        -- format:json forces JSON content even though the filename ends in .lua.
+        run_ok({
+            "--cmio-advance-state=input:"
+                .. prefix
+                .. "-input-%i.bin,"
+                .. "input_index_begin:0,input_index_end:1,"
+                .. "output:"
+                .. prefix
+                .. "-out-%i-%o.bin," -- same name as in the first run, so that output file is rewritten
+                .. "output_hashes_root_hash:,output_hashes_root_hash_proof:,"
+                .. "output_proof:"
+                .. prefix
+                .. "-json-%o-%i.lua,"
+                .. "format:json", -- the only difference from the first run besides the proof file name
+            "--no-rollback",
+            "--assert-rolling-template",
+            "--max-mcycle=2000000000",
+            "--no-init-splash",
+            "--quiet",
+            "--",
+            "ioctl-echo-loop --vouchers=1 --notices=0 --reports=0",
+        })
+
+        local json_text = filesystem.read_file(prefix .. "-json-0-0.lua")
+        expect.falsy(load(json_text, "proof", "t", {})) -- JSON is not loadable as Lua
+        local json_proof = cartesi.fromjson(json_text, "Proof")
+        expect.equal(json_proof.target_address, 0)
+        hash_tree.verify_slice(json_proof)
+    end)
+
+    -- -------------------------------------------------------------------------
+    -- Output hashes root hash accumulates across accepted inputs
+    --
+    -- What: The outputs tree grows from genesis and is NOT reset on each accept,
+    --       so the root the guest writes after the second input covers both
+    --       inputs' outputs, not just the second's. A guest that reset its tree
+    --       per accept (a real bug once present in the rollup guest utility)
+    --       would write the single-leaf root instead.
+    -- How:  Advance two accepted inputs, one output each, and compare each
+    --       input's output_hashes_root_hash against the root computed
+    --       independently over the accumulated leaves.
+    -- -------------------------------------------------------------------------
+    it("output hashes root hash accumulates across inputs", function()
+        -- Root of the height-CMIO_LOG2_MAX_OUTPUT_COUNT pristine-padded outputs tree over leaves (pushed in order).
+        local function outputs_root(leaves)
+            local frontier = hash_tree.frontier(cartesi.CMIO_LOG2_MAX_OUTPUT_COUNT)
+            for _, leaf in ipairs(leaves) do
+                hash_tree.frontier_push_back(frontier, leaf)
+            end
+            return hash_tree.frontier_get_root_hash(frontier)
+        end
+
+        local prefix = filesystem.temp_pathname() -- common prefix of every file this test touches
+        local _ <close> = utils.scope_exit(function() -- cleanup callback, tied to this scope through <close>
+            for _, p in ipairs({
+                prefix .. "-input-0.bin",
+                prefix .. "-input-1.bin",
+                prefix .. "-out-0-0.bin",
+                prefix .. "-out-1-1.bin",
+                prefix .. "-oh-0.bin",
+                prefix .. "-oh-1.bin",
+            }) do
+                os.remove(p)
+            end
+        end)
+        filesystem.write_file(prefix .. "-input-0.bin", encode_advance(0, "first"))
+        filesystem.write_file(prefix .. "-input-1.bin", encode_advance(1, "second"))
+
+        run_ok({
+            "--cmio-advance-state=input:"
+                .. prefix
+                .. "-input-%i.bin,"
+                .. "input_index_begin:0,input_index_end:2,"
+                .. "output:"
+                .. prefix
+                .. "-out-%o-%i.bin," -- note the order: output index first, then input index
+                .. "output_proof:,rejected_output:,report:," -- empty value disables the file
+                .. "output_hashes_root_hash:"
+                .. prefix
+                .. "-oh-%i.bin,output_hashes_root_hash_proof:",
+            "--no-rollback",
+            "--assert-rolling-template",
+            "--max-mcycle=2000000000",
+            "--no-init-splash",
+            "--quiet",
+            "--",
+            "ioctl-echo-loop --vouchers=1 --notices=0 --reports=0",
+        })
+
+        local leaf0 = cartesi.keccak256(filesystem.read_file(prefix .. "-out-0-0.bin"))
+        local leaf1 = cartesi.keccak256(filesystem.read_file(prefix .. "-out-1-1.bin"))
+        -- After input 0 the guest root covers one leaf, after input 1 it covers both.
+        expect.equal(filesystem.read_file(prefix .. "-oh-0.bin"), outputs_root({ leaf0 }))
+        expect.equal(filesystem.read_file(prefix .. "-oh-1.bin"), outputs_root({ leaf0, leaf1 }))
+        -- A per-accept reset would have written the single-leaf root for input 1.
+        expect.truthy(filesystem.read_file(prefix .. "-oh-1.bin") ~= outputs_root({ leaf1 }))
     end)
 
     -- -------------------------------------------------------------------------
@@ -1589,7 +2016,15 @@ describe("cartesi-machine CLI", function()
                 prefix .. "-inpr-1.bin",
                 prefix .. "-inpr-2.bin",
                 prefix .. "-rbo-0-0.bin",
-                prefix .. "-rbo-2-0.bin",
+                prefix .. "-rbo-0-1.bin",
+                prefix .. "-rbo-2-2.bin",
+                prefix .. "-rbo-2-3.bin",
+                prefix .. "-rbrej-2-1.bin",
+                prefix .. "-rbrej-3-1.bin",
+                prefix .. "-rbproof-0-0.json",
+                prefix .. "-rbproof-1-0.json",
+                prefix .. "-rbproof-2-2.json",
+                prefix .. "-rbproof-3-2.json",
                 prefix .. "-rbr-0-0.bin",
                 prefix .. "-rbr-2-0.bin",
                 prefix .. "-rboh-0.bin",
@@ -1602,10 +2037,12 @@ describe("cartesi-machine CLI", function()
         filesystem.write_file(prefix .. "-inpr-1.bin", encode_advance(1, "reject-me"))
         filesystem.write_file(prefix .. "-inpr-2.bin", encode_advance(2, "also-ok"))
 
-        -- ioctl-echo-loop --reject=1 rejects the second input, exercising do_rollback;
-        -- inputs 0 and 2 exercise do_snapshot + do_commit
+        -- ioctl-echo-loop --reject=1 rejects input 1, exercising do_rollback; inputs 0 and 2
+        -- exercise do_snapshot + do_commit. A rejected input's outputs go to rejected_output and
+        -- do not advance the global output index, so input 2 continues at index 2.
         run_ok({
             "--remote-address=" .. address,
+            "--console-io=output_destination:to_null",
             "--cmio-advance-state=input:"
                 .. prefix
                 .. "-inpr-%i.bin,"
@@ -1613,18 +2050,185 @@ describe("cartesi-machine CLI", function()
                 .. "output:"
                 .. prefix
                 .. "-rbo-%i-%o.bin,"
+                .. "rejected_output:"
+                .. prefix
+                .. "-rbrej-%o-%i.bin,"
+                .. "output_proof:"
+                .. prefix
+                .. "-rbproof-%o-%i.json,"
                 .. "report:"
                 .. prefix
                 .. "-rbr-%i-%o.bin,"
                 .. "output_hashes_root_hash:"
                 .. prefix
-                .. "-rboh-%i.bin",
+                .. "-rboh-%i.bin,output_hashes_root_hash_proof:",
             "--max-mcycle=2000000000",
             "--no-init-splash",
             "--quiet",
             "--",
             "ioctl-echo-loop --vouchers=1 --notices=1 --reports=1 --reject=1",
         })
+
+        local voucher_sig = "Voucher(address destination, uint256 value, bytes payload)"
+        -- input 0 accepted gives global 0 and 1, input 2 accepted continues at 2 and 3
+        expect.equal(
+            evmu.decode_calldata(voucher_sig, filesystem.read_file(prefix .. "-rbo-0-0.bin"), "raw").payload,
+            "ok"
+        )
+        expect.equal(
+            evmu.decode_calldata(voucher_sig, filesystem.read_file(prefix .. "-rbo-2-2.bin"), "raw").payload,
+            "also-ok"
+        )
+        -- the rejected input's outputs land in rejected_output at their would-be indices
+        expect.equal(
+            evmu.decode_calldata(voucher_sig, filesystem.read_file(prefix .. "-rbrej-2-1.bin"), "raw").payload,
+            "reject-me"
+        )
+        assert(io.open(prefix .. "-rbrej-3-1.bin", "r"), "no rejected notice for input 1")
+        -- and never appear among the accepted outputs, nor get a proof or an output root hash
+        assert(not io.open(prefix .. "-rbo-1-2.bin", "r"), "rejected output leaked into accepted outputs")
+        assert(not io.open(prefix .. "-rbproof-2-1.json", "r"), "proof emitted for a rejected output")
+        assert(not io.open(prefix .. "-rboh-1.bin", "r"), "rejected input wrote an output root hash")
+
+        -- every accepted output proof verifies against the last accepted input's outputs root
+        local final_root = filesystem.read_file(prefix .. "-rboh-2.bin")
+        for _, p in ipairs({ { o = 0, i = 0 }, { o = 1, i = 0 }, { o = 2, i = 2 }, { o = 3, i = 2 } }) do
+            local proof = cartesi.fromjson(
+                filesystem.read_file(string.format("%s-rbproof-%d-%d.json", prefix, p.o, p.i)),
+                "Proof"
+            )
+            expect.equal(proof.target_address, p.o)
+            expect.equal(proof.root_hash, final_root)
+            hash_tree.verify_slice(proof)
+        end
+    end)
+
+    -- -------------------------------------------------------------------------
+    -- Two-epoch continuation via last_output_proof, with a reject mid-epoch
+    --
+    -- What: A later epoch's output proofs continue the genesis-rooted outputs tree
+    --       of an earlier one when seeded with the previous epoch's last output
+    --       proof, and check_output_hashes_root_hash (default on) keeps holding
+    --       even when an input in the middle is rejected and rolls the tree back.
+    -- How:  Spawn one server and keep it alive. Epoch 1 (--no-remote-destroy)
+    --       instantiates the machine and advances inputs 0 and 1 against it. The
+    --       entrypoint, fixed at instantiation, carries --reject=3 so the input
+    --       with global index 3 is rejected when it arrives. Epoch 2
+    --       (--no-remote-create, no entrypoint) reuses the same live machine,
+    --       advancing inputs 2, 3, 4 seeded with epoch 1's last output proof. Each
+    --       input emits a voucher and a notice, so the global output index runs
+    --       0..3 in epoch 1 and continues over the accepted inputs 2 and 4 (4..7)
+    --       in epoch 2, while rejected input 3 advances nothing.
+    -- -------------------------------------------------------------------------
+    it("two-epoch continuation via last_output_proof", function()
+        local jsonrpc = require("cartesi.jsonrpc")
+        local server <close>, address = jsonrpc.spawn_server()
+        server:set_cleanup_call(jsonrpc.NOTHING) -- NOTE(review): presumably closing the handle leaves the remote alone
+        local prefix = filesystem.temp_pathname()
+        local files = { -- every file either epoch may create, removed by the scope_exit below
+            prefix .. "-ein-0.bin",
+            prefix .. "-ein-1.bin",
+            prefix .. "-ein-2.bin",
+            prefix .. "-ein-3.bin",
+            prefix .. "-ein-4.bin",
+            prefix .. "-e1proof-0-0.json",
+            prefix .. "-e1proof-1-0.json",
+            prefix .. "-e1proof-2-1.json",
+            prefix .. "-e1proof-3-1.json",
+            prefix .. "-e2o-4-2.bin",
+            prefix .. "-e2o-5-2.bin",
+            prefix .. "-e2o-6-4.bin",
+            prefix .. "-e2o-7-4.bin",
+            prefix .. "-e2rej-6-3.bin",
+            prefix .. "-e2rej-7-3.bin",
+            prefix .. "-e2proof-4-2.json",
+            prefix .. "-e2proof-5-2.json",
+            prefix .. "-e2proof-6-4.json",
+            prefix .. "-e2proof-7-4.json",
+            prefix .. "-e2oh-2.bin",
+            prefix .. "-e2oh-4.bin",
+        }
+        local _ <close> = utils.scope_exit(function()
+            for _, p in ipairs(files) do
+                os.remove(p)
+            end
+        end)
+        -- Inputs carry global indices. The reject targets the input whose encoded index is 3.
+        for i = 0, 4 do
+            filesystem.write_file(prefix .. "-ein-" .. i .. ".bin", encode_advance(i, "epoch-input-" .. i))
+        end
+
+        -- Epoch 1: inputs 0 and 1 against a freshly created machine, left alive on the server. Only
+        -- the proofs are kept, since epoch 2 is seeded from the last one (output 3, from input 1).
+        -- The entrypoint is fixed here, so --reject=3 is set now even though input 3 arrives later.
+        run_ok({
+            "--remote-address=" .. address,
+            "--no-remote-destroy", -- keep the machine on the server for epoch 2
+            "--console-io=output_destination:to_null",
+            "--cmio-advance-state=input:"
+                .. prefix
+                .. "-ein-%i.bin,"
+                .. "input_index_begin:0,input_index_end:2,"
+                .. "output:,rejected_output:,report:,output_hashes_root_hash:,output_hashes_root_hash_proof:,"
+                .. "output_proof:"
+                .. prefix
+                .. "-e1proof-%o-%i.json", -- output index first, then input index
+            "--max-mcycle=2000000000",
+            "--no-init-splash",
+            "--quiet",
+            "--",
+            "ioctl-echo-loop --vouchers=1 --notices=1 --reports=1 --reject=3",
+        })
+
+        -- Epoch 2: reuse the same live machine (no new entrypoint), seeded with epoch 1's last output
+        -- proof. Input 3 is rejected, so the guest rolls its outputs tree back. The default root-hash
+        -- check still holds because the host frontier rolls back in step.
+        run_ok({
+            "--remote-address=" .. address,
+            "--no-remote-create", -- attach to the machine epoch 1 left behind
+            "--cmio-advance-state=input:"
+                .. prefix
+                .. "-ein-%i.bin,"
+                .. "input_index_begin:2,input_index_end:5,"
+                .. "report:,"
+                .. "output:"
+                .. prefix
+                .. "-e2o-%o-%i.bin,"
+                .. "rejected_output:"
+                .. prefix
+                .. "-e2rej-%o-%i.bin,"
+                .. "last_output_proof:"
+                .. prefix
+                .. "-e1proof-3-1.json," -- output 3 of input 1: the last proof epoch 1 wrote
+                .. "output_proof:"
+                .. prefix
+                .. "-e2proof-%o-%i.json,"
+                .. "output_hashes_root_hash:"
+                .. prefix
+                .. "-e2oh-%i.bin,output_hashes_root_hash_proof:",
+            "--max-mcycle=2000000000",
+            "--no-init-splash",
+            "--quiet",
+        })
+
+        -- Accepted epoch 2 outputs continue the global index over inputs 2 and 4 (4..7) and verify
+        -- against epoch 2's final root. Rejected input 3 advanced nothing.
+        local final_root = filesystem.read_file(prefix .. "-e2oh-4.bin")
+        for _, p in ipairs({ { o = 4, i = 2 }, { o = 5, i = 2 }, { o = 6, i = 4 }, { o = 7, i = 4 } }) do
+            local proof = cartesi.fromjson(
+                filesystem.read_file(string.format("%s-e2proof-%d-%d.json", prefix, p.o, p.i)),
+                "Proof"
+            )
+            expect.equal(proof.log2_root_size, cartesi.CMIO_LOG2_MAX_OUTPUT_COUNT)
+            expect.equal(proof.target_address, p.o)
+            expect.equal(proof.root_hash, final_root)
+            hash_tree.verify_slice(proof)
+        end
+        -- input 3's outputs went to rejected_output at their would-be indices and got no proof
+        -- (NOTE(review): the handles io.open returns below are never closed explicitly)
+        assert(io.open(prefix .. "-e2rej-6-3.bin", "r"), "no rejected voucher for input 3")
+        assert(io.open(prefix .. "-e2rej-7-3.bin", "r"), "no rejected notice for input 3")
+        assert(not io.open(prefix .. "-e2o-6-3.bin", "r"), "rejected output leaked into accepted outputs")
+        assert(not io.open(prefix .. "-e2oh-3.bin", "r"), "rejected input wrote an output root hash")
     end)
 
     -- -------------------------------------------------------------------------
diff --git a/tests/lua/spec-collect-hashes.lua b/tests/lua/spec-collect-hashes.lua
index 586faa36c..f6d31216a 100644
--- a/tests/lua/spec-collect-hashes.lua
+++ b/tests/lua/spec-collect-hashes.lua
@@ -19,6 +19,28 @@ local function expect_consistent_root_hash(machine)
     return root_hash
 end
 
+local function is_rejected_manual_yield(machine) -- true if the machine sits on a manual yield that rejected its input
+    return machine:read_reg("iflags_Y") ~= 0 -- manual-yield flag is set
+        and machine:read_reg("htif_tohost_dev") == cartesi.HTIF_DEV_YIELD
+        and machine:read_reg("htif_tohost_cmd") == cartesi.HTIF_YIELD_CMD_MANUAL
+        and machine:read_reg("htif_tohost_reason") == cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED
+end
+
+-- Returns the root hash a verifier expects for the state the machine is in now: the recorded
+-- revert root hash after a rejected input, and the machine's own root hash in every other case
+local function canonical_root_hash(machine)
+    if not is_rejected_manual_yield(machine) then
+        return machine:get_root_hash()
+    end
+    return machine:read_revert_root_hash()
+end
+
+-- All-zero two-hash tail accepted by machines whose revert leaf is pristine; required at entry but never consumed
+local pristine_revert_uarch_tail = {
+    string.rep("\x00", cartesi.HASH_SIZE), -- halt root hash position
+    string.rep("\x00", cartesi.HASH_SIZE), -- reset (revert) root hash position
+}
+
 local function expect_mcycle_root_hashes(machine, mcycle_end, mcycle_period, mcycle_phase, log2_bundle_mcycle_count)
     -- this reference implementation does not support the following conditions
     assert(mcycle_end >= 0 and mcycle_end <= math.maxinteger)
@@ -35,13 +57,13 @@ local function expect_mcycle_root_hashes(machine, mcycle_end, mcycle_period, mcy
         if machine:read_reg("mcycle") ~= mcycle_target then
             mcycle_phase = mcycle_period - (mcycle_target - machine:read_reg("mcycle"))
             if break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY then
-                table.insert(hashes, machine:get_root_hash())
+                table.insert(hashes, canonical_root_hash(machine))
                 at_fixed_point = true
             end
             break
         end
         mcycle_phase = 0
-        table.insert(hashes, machine:get_root_hash())
+        table.insert(hashes, canonical_root_hash(machine))
         if break_reason ~= cartesi.BREAK_REASON_REACHED_TARGET_MCYCLE then
             if break_reason == cartesi.BREAK_REASON_HALTED or break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY then
                 at_fixed_point = true
@@ -112,7 +134,8 @@ local function expect_next_mcycle_uarch_root_hashes(
     expect.equal(machine:read_reg("uarch_halt_flag"), 1)
     local halt_root_hash = expect_consistent_root_hash(machine)
     machine:reset_uarch()
-    local reset_root_hash = expect_consistent_root_hash(machine)
+    expect_consistent_root_hash(machine)
+    local reset_root_hash = canonical_root_hash(machine)
     expect.equal(machine:read_reg("uarch_cycle"), 0)
     expect.equal(machine:read_reg("mcycle"), mcycle)
     if log2_bundle_uarch_cycle_count and log2_bundle_uarch_cycle_count > 0 then
@@ -133,7 +156,32 @@ local function expect_next_mcycle_uarch_root_hashes(
     table.insert(reset_indices, #hashes)
 end
 
-local function expect_uarch_cycle_root_hashes(machine, mcycle_end, log2_bundle_uarch_cycle_count)
+-- Appends the period of the reverted machine, as given by the revert uarch tail, whose last two
+-- entries are the halt and reset root hashes, then records the period's end index in reset_indices
+local function expect_revert_uarch_tail_period(hashes, reset_indices, revert_uarch_tail, log2_bundle_uarch_cycle_count)
+    assert(type(revert_uarch_tail) == "table" and #revert_uarch_tail >= 2, "revert uarch tail is too short")
+    table.move(revert_uarch_tail, 1, #revert_uarch_tail - 1, #hashes + 1, hashes)
+    local halt_root_hash = revert_uarch_tail[#revert_uarch_tail - 1]
+    local reset_root_hash = revert_uarch_tail[#revert_uarch_tail]
+    if log2_bundle_uarch_cycle_count and log2_bundle_uarch_cycle_count > 0 then
+        local bundle_uarch_cycle_count = 1 << log2_bundle_uarch_cycle_count
+        -- add halt root hash padding until finishing a bundle
+        while #hashes % bundle_uarch_cycle_count ~= 0 do
+            table.insert(hashes, halt_root_hash)
+        end
+        -- add repetitions of the halt root hash
+        for _ = 1, 2 * bundle_uarch_cycle_count - 1 do
+            table.insert(hashes, halt_root_hash)
+        end
+        table.insert(hashes, reset_root_hash)
+        assert(#hashes % bundle_uarch_cycle_count == 0)
+    else
+        table.insert(hashes, reset_root_hash)
+    end
+    table.insert(reset_indices, #hashes)
+end
+
+local function expect_uarch_cycle_root_hashes(machine, mcycle_end, log2_bundle_uarch_cycle_count, revert_uarch_tail)
     -- this reference implementation does not support the following conditions
     assert(mcycle_end >= 0 and mcycle_end <= math.maxinteger, "unsupported call")
     assert(machine:read_reg("iflags_H") == 0, "unsupported call")
@@ -151,7 +199,19 @@ local function expect_uarch_cycle_root_hashes(machine, mcycle_end, log2_bundle_u
         end
         if machine:read_reg("iflags_Y") ~= 0 then
             break_reason = cartesi.BREAK_REASON_YIELDED_MANUALLY
-            expect_next_mcycle_uarch_root_hashes(machine, mcycle, hashes, reset_indices, log2_bundle_uarch_cycle_count)
+            if is_rejected_manual_yield(machine) then
+                -- the canonical timeline continues from the reverted machine,
+                -- whose period is given by the revert uarch tail
+                expect_revert_uarch_tail_period(hashes, reset_indices, revert_uarch_tail, log2_bundle_uarch_cycle_count)
+            else
+                expect_next_mcycle_uarch_root_hashes(
+                    machine,
+                    mcycle,
+                    hashes,
+                    reset_indices,
+                    log2_bundle_uarch_cycle_count
+                )
+            end
             break
         end
         if machine:read_reg("iflags_X") ~= 0 then
@@ -300,7 +360,7 @@ describe("collect hashes", function()
                         mcycle_phase = mcycle_phase,
                     }
                 )
-                expect.equal(machine:collect_uarch_cycle_root_hashes(mcycle_end), {
+                expect.equal(machine:collect_uarch_cycle_root_hashes(mcycle_end, 0, pristine_revert_uarch_tail), {
                     hashes = {},
                     reset_indices = {},
                     break_reason = cartesi.BREAK_REASON_REACHED_TARGET_MCYCLE,
@@ -324,7 +384,8 @@ describe("collect hashes", function()
 
                 local machine_uarch <close> = create_machine({ ram = { length = 4096 } })
                 machine_uarch:run(mcycle_start)
-                local collected_uarch = machine_uarch:collect_uarch_cycle_root_hashes(mcycle_end)
+                local collected_uarch =
+                    machine_uarch:collect_uarch_cycle_root_hashes(mcycle_end, 0, pristine_revert_uarch_tail)
                 expect.equal(machine_uarch:read_reg("mcycle"), mcycle_end)
                 expect.equal(machine_uarch:get_root_hash(), machine:get_root_hash())
                 expect.equal(#collected_uarch.reset_indices, mcycle_end - mcycle_start)
@@ -454,6 +515,64 @@ describe("collect hashes", function()
                 expect.equal(collected_uarch.hashes[collected_uarch.reset_indices[1]], expected_root_hash)
             end)
 
+            it("should require the revert uarch tail when collecting with a running machine", function()
+                local machine <close> = create_machine({ ram = { length = 4096 } })
+                local compare_machine <close> = cartesi.machine({ ram = { length = 4096 } }) -- fed to the Lua reference
+                expect.fail(function()
+                    machine:collect_uarch_cycle_root_hashes(2) -- no tail at all
+                end, "revert uarch tail is required")
+                expect.fail(function()
+                    machine:collect_uarch_cycle_root_hashes(2, 0, { string.rep("\x11", cartesi.HASH_SIZE) })
+                end, "revert uarch tail is too short")
+                expect.fail(function()
+                    machine:collect_uarch_cycle_root_hashes(2, 0, {
+                        string.rep("\x11", cartesi.HASH_SIZE),
+                        string.rep("\x22", cartesi.HASH_SIZE), -- long enough, but not the revert root hash
+                    })
+                end, "revert uarch tail does not end with the revert root hash")
+                -- failing calls leave the machine unchanged, so retrying with the tail works
+                local collected = machine:collect_uarch_cycle_root_hashes(2, 0, pristine_revert_uarch_tail)
+                local expected_collected = expect_uarch_cycle_root_hashes(compare_machine, 2)
+                expect.equal(collected, expected_collected)
+            end)
+
+            it("should collect the revert uarch tail period when starting from a rejected machine", function()
+                local mcycle_end = 32
+                local revert_root_hash = string.rep("\x5a", cartesi.HASH_SIZE)
+                local revert_uarch_tail = {
+                    string.rep("\x01", cartesi.HASH_SIZE),
+                    string.rep("\x02", cartesi.HASH_SIZE),
+                    revert_root_hash, -- the tail has to end with the revert root hash written below
+                }
+                local machine <close> = create_machine({ ram = { length = 4096 } })
+                machine:write_revert_root_hash(revert_root_hash)
+                machine:write_reg("iflags_Y", 1) -- these four writes forge a rejected manual yield
+                machine:write_reg("htif_tohost_dev", cartesi.HTIF_DEV_YIELD)
+                machine:write_reg("htif_tohost_cmd", cartesi.HTIF_YIELD_CMD_MANUAL)
+                machine:write_reg("htif_tohost_reason", cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED)
+                local expected_root_hash = machine:get_root_hash() -- baseline for the "not touched" check below
+
+                -- the tail is required even though the machine is at a fixed point
+                expect.fail(function()
+                    machine:collect_uarch_cycle_root_hashes(mcycle_end)
+                end, "revert uarch tail is required")
+
+                -- the machine is not touched, the period comes entirely from the tail
+                expect.equal(machine:collect_uarch_cycle_root_hashes(mcycle_end, 0, revert_uarch_tail), {
+                    hashes = revert_uarch_tail,
+                    reset_indices = { #revert_uarch_tail },
+                    break_reason = cartesi.BREAK_REASON_YIELDED_MANUALLY,
+                })
+                expect.equal(machine:get_root_hash(), expected_root_hash)
+
+                -- the mcycle collector collects no hashes when starting from a yielded machine
+                expect.equal(machine:collect_mcycle_root_hashes(mcycle_end, 32, 1), {
+                    hashes = {},
+                    break_reason = cartesi.BREAK_REASON_YIELDED_MANUALLY,
+                    mcycle_phase = 1,
+                })
+            end)
+
             it("should collect mcycles during mcycle overflow", function()
                 local mcycle_period = 32
                 local machine <close> = create_machine({ ram = { length = 4096 } })
@@ -488,7 +607,8 @@ describe("collect hashes", function()
             it("should collect uarch cycles during mcycle overflows", function()
                 local machine <close> = create_machine({ ram = { length = 4096 } })
                 machine:write_reg("mcycle", cartesi.MCYCLE_MAX - 1)
-                local collected_uarch = machine:collect_uarch_cycle_root_hashes(cartesi.MCYCLE_MAX)
+                local collected_uarch =
+                    machine:collect_uarch_cycle_root_hashes(cartesi.MCYCLE_MAX, 0, pristine_revert_uarch_tail)
                 expect.equal(collected_uarch.break_reason, cartesi.BREAK_REASON_REACHED_TARGET_MCYCLE)
                 local expected_root_hash = machine:get_root_hash()
                 expect.equal(collected_uarch.hashes[collected_uarch.reset_indices[1]], expected_root_hash)
@@ -783,13 +903,106 @@ describe("collect hashes", function()
                     local compare_machine <close> = cartesi.machine(add_machine_config)
                     machine:run(mcycle_start)
                     compare_machine:run(mcycle_start)
-                    local collected = machine:collect_uarch_cycle_root_hashes(mcycle_end, log2_uarch_cycle_mcycle_count)
+                    local collected = machine:collect_uarch_cycle_root_hashes(
+                        mcycle_end,
+                        log2_uarch_cycle_mcycle_count,
+                        pristine_revert_uarch_tail
+                    )
                     local expected_collected =
                         expect_uarch_cycle_root_hashes(compare_machine, mcycle_end, log2_uarch_cycle_mcycle_count)
                     expect.equal(collected, expected_collected)
                     expect.equal(machine:get_root_hash(), compare_machine:get_root_hash())
                 end
             end)
+
+            it("should substitute the revert root hash when bundling across a rejected yield", function()
+                local log2_bundle_mcycle_count = 2
+                local mcycle_period = 4
+                local mcycle_end = 1024
+                local revert_root_hash = string.rep("\x5a", cartesi.HASH_SIZE) -- fabricated, recognizable value
+                local machine <close> = create_machine(yield_machine_config)
+                machine:write_revert_root_hash(revert_root_hash)
+                -- bundles after a rejected yield hold only revert root hash repetitions: fold it once per level
+                local revert_bundle_hash = revert_root_hash
+                for _ = 1, log2_bundle_mcycle_count do
+                    revert_bundle_hash = cartesi.keccak256(revert_bundle_hash, revert_bundle_hash)
+                end
+                local count_rejected_yields = 0
+                local last_collected = { mcycle_phase = 0 } -- first call: phase 0 and no back_tree
+                for _ = 1, 64 do -- iteration bound; the loop exits early on halt
+                    local collected = machine:collect_mcycle_root_hashes(
+                        mcycle_end,
+                        mcycle_period,
+                        last_collected.mcycle_phase,
+                        log2_bundle_mcycle_count,
+                        last_collected.back_tree
+                    )
+                    if collected.break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY then
+                        if is_rejected_manual_yield(machine) then
+                            expect.equal(collected.hashes[#collected.hashes], revert_bundle_hash)
+                            count_rejected_yields = count_rejected_yields + 1
+                        end
+                        machine:write_reg("iflags_Y", 0) -- clear the yield flag before collecting again
+                    elseif collected.break_reason == cartesi.BREAK_REASON_HALTED then
+                        break
+                    end
+                    last_collected = collected -- carries mcycle_phase and back_tree into the next call
+                end
+                -- htif_yield.bin breaks twice on a rejected manual yield, once with the rx-rejected reason
+                -- and once with the tx-output automatic reason, which shares the same reason value
+                expect.equal(count_rejected_yields, 2)
+                expect.equal(machine:read_reg("iflags_H"), 1) -- iflags_H set: presumably the run ended on the halt
+            end)
+
+            it("should collect across a rejected yield using a tail collected in advance", function()
+                local machine <close> = create_machine(yield_machine_config)
+                local compare_machine <close> = cartesi.machine(yield_machine_config)
+                -- run both machines to the first manual yield, where the machine waits for a response
+                expect.equal(machine:run(1 << 62), cartesi.BREAK_REASON_YIELDED_MANUALLY)
+                compare_machine:run(1 << 62) -- same run as above; its break reason is not asserted
+                -- collecting on the waiting machine needs no tail and returns its period, which is
+                -- the tail for ranges that end rejected after the machine resumes
+                local revert_root_hash = machine:get_root_hash()
+                local bootstrap = machine:collect_uarch_cycle_root_hashes(machine:read_reg("mcycle"))
+                expect.equal(bootstrap.break_reason, cartesi.BREAK_REASON_YIELDED_MANUALLY)
+                expect.equal(#bootstrap.reset_indices, 1) -- a single reset index: presumably a single period
+                local revert_uarch_tail = bootstrap.hashes
+                expect.equal(revert_uarch_tail[#revert_uarch_tail], revert_root_hash)
+                expect.equal(machine:get_root_hash(), revert_root_hash) -- collecting left the root hash unchanged
+                -- record the revert root hash and resume the guest, standing in for
+                -- send_cmio_response, whose fromhost response fails this guest's ack checks
+                machine:write_revert_root_hash(revert_root_hash)
+                machine:write_reg("iflags_Y", 0)
+                compare_machine:write_revert_root_hash(revert_root_hash)
+                compare_machine:write_reg("iflags_Y", 0)
+                -- run until the guest rejects, collecting with the tail in hand
+                local count_rejected_yields = 0
+                for _ = 1, 32 do -- iteration bound; exits on the first rejected yield or on halt
+                    local collected = machine:collect_uarch_cycle_root_hashes(1 << 62, 0, revert_uarch_tail)
+                    local expected_collected =
+                        expect_uarch_cycle_root_hashes(compare_machine, 1 << 62, 0, revert_uarch_tail)
+                    expect.equal(collected, expected_collected)
+                    expect.equal(machine:get_root_hash(), compare_machine:get_root_hash())
+                    if collected.break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY then
+                        if is_rejected_manual_yield(machine) then
+                            -- the collected stream ends with the period collected before the response
+                            for i = 1, #revert_uarch_tail do
+                                expect.equal(
+                                    collected.hashes[#collected.hashes - #revert_uarch_tail + i],
+                                    revert_uarch_tail[i]
+                                )
+                            end
+                            count_rejected_yields = count_rejected_yields + 1
+                            break
+                        end
+                        machine:write_reg("iflags_Y", 0)
+                        compare_machine:write_reg("iflags_Y", 0)
+                    elseif collected.break_reason == cartesi.BREAK_REASON_HALTED then
+                        break
+                    end
+                end
+                expect.equal(count_rejected_yields, 1) -- fails if the loop ended on halt or on the bound instead
+            end)
         end) -- describe remote/local
     end -- for remote/local create
 
@@ -836,6 +1049,17 @@ describe("collect hashes", function()
             local yield_last_mcycle = 500
             local yield_last_root_hash
             local yield_sparse_hashes = {}
+            -- htif_yield.bin breaks twice on a rejected manual yield, once with the rx-rejected reason
+            -- and once with the tx-output automatic reason, which shares the same reason value
+            local yield_rejected_count = 2
+            local yield_revert_root_hash = string.rep("\x5a", cartesi.HASH_SIZE)
+            -- a fabricated period for the reverted machine, collected as the tail after the rejected yield
+            local yield_revert_uarch_tail = {
+                string.rep("\x01", cartesi.HASH_SIZE),
+                string.rep("\x02", cartesi.HASH_SIZE),
+                string.rep("\x03", cartesi.HASH_SIZE),
+                yield_revert_root_hash,
+            }
 
             if hash_function == "keccak256" then
                 it("should fail when microarchitecture is not reset", function()
@@ -897,6 +1121,8 @@ describe("collect hashes", function()
                 local period_count = yield_last_mcycle // mcycle_period
                 local machine <close> = cartesi.machine(yield_machine_config)
                 local collect_machine <close> = cartesi.machine(yield_machine_config)
+                machine:write_revert_root_hash(yield_revert_root_hash)
+                collect_machine:write_revert_root_hash(yield_revert_root_hash)
                 expect.equal(machine:run(mcycle_start), cartesi.BREAK_REASON_REACHED_TARGET_MCYCLE)
                 expect.equal(machine:read_reg("mcycle"), mcycle_start)
                 collect_machine:run(mcycle_start)
@@ -904,6 +1130,7 @@ describe("collect hashes", function()
                 expect.equal(machine:get_root_hash(), collect_machine:get_root_hash())
                 local count_manual_yields = 0
                 local count_automatic_yields = 0
+                local count_rejected_yields = 0
                 local count_halts = 1
                 local halt_exit_code
                 for _ = 1, period_count * 2 do
@@ -920,6 +1147,11 @@ describe("collect hashes", function()
                         table.insert(yield_sparse_hashes, hash)
                     end
                     if collected.break_reason == cartesi.BREAK_REASON_YIELDED_MANUALLY then
+                        if is_rejected_manual_yield(machine) then
+                            -- the entry collected at the rejected yield is the substituted revert root hash
+                            expect.equal(collected.hashes[#collected.hashes], yield_revert_root_hash)
+                            count_rejected_yields = count_rejected_yields + 1
+                        end
                         collect_machine:write_reg("iflags_Y", 0)
                         machine:write_reg("iflags_Y", 0)
                         count_manual_yields = count_manual_yields + 1
@@ -936,6 +1168,7 @@ describe("collect hashes", function()
                 expect.equal(#yield_sparse_hashes, period_count + count_manual_yields + count_halts)
                 expect.equal(count_manual_yields, 8)
                 expect.equal(count_automatic_yields, 7)
+                expect.equal(count_rejected_yields, yield_rejected_count)
                 expect.equal(halt_exit_code, 42)
                 yield_last_root_hash = machine:get_root_hash()
             end)
@@ -959,7 +1192,8 @@ describe("collect hashes", function()
                     expect_consistent_root_hash(machine)
                     collect_machine:run(big_last_mcycle - mcycle_count)
                     expect.equal(machine:get_root_hash(), collect_machine:get_root_hash())
-                    local collected = collect_machine:collect_uarch_cycle_root_hashes(big_last_mcycle)
+                    local collected =
+                        collect_machine:collect_uarch_cycle_root_hashes(big_last_mcycle, 0, pristine_revert_uarch_tail)
                     local expected_collected = expect_uarch_cycle_root_hashes(machine, big_last_mcycle)
                     local halt_exit_code = machine:read_reg("htif_tohost_data") >> 1
                     expect.equal(collected, expected_collected)
@@ -981,6 +1215,8 @@ describe("collect hashes", function()
                     local period_count = yield_last_mcycle // mcycle_period
                     local machine <close> = cartesi.machine(yield_machine_config)
                     local collect_machine <close> = cartesi.machine(yield_machine_config)
+                    machine:write_revert_root_hash(yield_revert_root_hash)
+                    collect_machine:write_revert_root_hash(yield_revert_root_hash)
                     machine:run(mcycle_start)
                     expect.equal(machine:read_reg("mcycle"), mcycle_start)
                     collect_machine:run(mcycle_start)
@@ -990,23 +1226,34 @@ describe("collect hashes", function()
                     local sparse_hashes_count = 0
                     local count_manual_yields = 0
                     local count_automatic_yields = 0
+                    local count_rejected_yields = 0
                     local halt_exit_code
                     for _ = 1, period_count * 2 do
                         local mcycles_to_phase0 = mcycle_period
                             - ((machine:read_reg("mcycle") - mcycle_phase_offset) % mcycle_period)
                         local mcycle_target = machine:read_reg("mcycle") + mcycles_to_phase0
-                        local collected = collect_machine:collect_uarch_cycle_root_hashes(mcycle_target)
-                        local expected_collected = expect_uarch_cycle_root_hashes(machine, mcycle_target)
+                        local collected =
+                            collect_machine:collect_uarch_cycle_root_hashes(mcycle_target, 0, yield_revert_uarch_tail)
+                        local expected_collected =
+                            expect_uarch_cycle_root_hashes(machine, mcycle_target, 0, yield_revert_uarch_tail)
                         expect.equal(collect_machine:read_reg("mcycle"), machine:read_reg("mcycle"))
                         expect.equal(collected, expected_collected)
                         expect.equal(collect_machine:get_root_hash(), machine:get_root_hash())
                         mcycles_to_phase0 = (machine:read_reg("mcycle") - mcycle_phase_offset) % mcycle_period
                         local at_fixed_point = machine:read_reg("iflags_Y") ~= 0 or machine:read_reg("iflags_H") ~= 0
                         if mcycles_to_phase0 == 0 or at_fixed_point then
-                            expect.equal(yield_sparse_hashes[sparse_hashes_count + 1], machine:get_root_hash())
+                            expect.equal(yield_sparse_hashes[sparse_hashes_count + 1], canonical_root_hash(machine))
                             sparse_hashes_count = sparse_hashes_count + 1
                         end
                         if machine:read_reg("iflags_Y") == 1 then
+                            if is_rejected_manual_yield(machine) then
+                                -- the last period is the reverted machine period, ending on the revert root hash
+                                expect.equal(
+                                    collected.hashes[collected.reset_indices[#collected.reset_indices]],
+                                    yield_revert_root_hash
+                                )
+                                count_rejected_yields = count_rejected_yields + 1
+                            end
                             collect_machine:write_reg("iflags_Y", 0)
                             machine:write_reg("iflags_Y", 0)
                             count_manual_yields = count_manual_yields + 1
@@ -1021,6 +1268,7 @@ describe("collect hashes", function()
                     expect.equal(machine:get_root_hash(), yield_last_root_hash)
                     expect.equal(count_manual_yields, 8)
                     expect.equal(count_automatic_yields, 7)
+                    expect.equal(count_rejected_yields, yield_rejected_count)
                     expect.equal(halt_exit_code, 42)
                     expect.equal(sparse_hashes_count, #yield_sparse_hashes)
                 end)
diff --git a/tests/lua/spec-hash-tree-lua.lua b/tests/lua/spec-hash-tree-lua.lua
new file mode 100644
index 000000000..efc44b954
--- /dev/null
+++ b/tests/lua/spec-hash-tree-lua.lua
@@ -0,0 +1,137 @@
+--[[
+Test suite for the Lua hash-tree module.
+Specifically, it provides test coverage for:
+    src/cartesi/hash-tree.lua
+It covers the outputs-tree frontier accumulator and the proof verifier at the outputs-tree depth.
+Can be run independently during development of the mentioned file.
+]]
+
+local lester = require("cartesi.third-party.lester")
+local describe, it, expect = lester.describe, lester.it, lester.expect
+local cartesi = require("cartesi")
+local hash_tree = require("cartesi.hash-tree")
+
+local H = cartesi.CMIO_LOG2_MAX_OUTPUT_COUNT
+
+-- Independent reference for the height-H pristine-padded keccak outputs root, mirroring
+-- check_outputs_root_hash in tests/lua/cmio-test.lua. The leaves are already keccak256(output).
+local function reference_root(leaves)
+    -- hash of a pristine (all-zero) subtree at the current level, starting at the leaf level
+    local pristine = string.rep("\0", cartesi.HASH_SIZE)
+    local nodes = #leaves == 0 and { pristine } or leaves
+    for _ = 1, H do
+        local merged = {}
+        -- pair nodes left to right, padding a missing right sibling with the pristine hash
+        for left = 1, #nodes, 2 do
+            merged[#merged + 1] = cartesi.keccak256(nodes[left], nodes[left + 1] or pristine)
+        end
+        pristine = cartesi.keccak256(pristine, pristine)
+        nodes = merged
+    end
+    return nodes[1]
+end
+
+local function leaf(index)
+    return cartesi.keccak256("output-" .. index) -- synthetic leaf: hash of a distinct per-index payload
+end
+
+local function make_leaves(n)
+    local out = {} -- out[i] is the synthetic leaf hash for index i
+    for i = 1, n do
+        out[#out + 1] = leaf(i)
+    end
+    return out
+end
+
+-- Two proofs of the same output, computed independently, must agree on every field.
+local function expect_same_proof(a, b)
+    local scalar_fields = { "target_address", "log2_target_size", "log2_root_size", "target_hash", "root_hash" }
+    for _, field in ipairs(scalar_fields) do
+        expect.equal(a[field], b[field])
+    end
+    -- sibling lists must have the same length before they are compared entry by entry
+    expect.equal(#a.sibling_hashes, #b.sibling_hashes)
+    for level = 1, #a.sibling_hashes do
+        expect.equal(a.sibling_hashes[level], b.sibling_hashes[level])
+    end
+end
+
+describe("hash-tree.lua", function()
+    local counts = { 0, 1, 2, 3, 4, 5, 7, 8, 9, 15, 16, 17, 31, 33, 64, 100 } -- leaf counts, incl. the empty tree
+
+    describe("frontier", function()
+        it("produces proofs that verify and share the reference root", function()
+            for _, n in ipairs(counts) do
+                local leaves = make_leaves(n)
+                local proofs = hash_tree.frontier_next_proofs(hash_tree.frontier(H), leaves)
+                expect.equal(#proofs, n) -- one proof per leaf
+                local root = reference_root(leaves)
+                for i = 1, n do
+                    expect.equal(proofs[i].target_address, i - 1) -- addresses are 0-based leaf positions
+                    expect.equal(proofs[i].log2_target_size, 0)
+                    expect.equal(proofs[i].log2_root_size, H)
+                    expect.equal(proofs[i].target_hash, leaves[i])
+                    expect.equal(proofs[i].root_hash, root)
+                    hash_tree.verify_slice(proofs[i]) -- errors unless the proof rolls up to root
+                end
+            end
+        end)
+
+        it("matches the reference root as leaves are pushed back", function()
+            local frontier = hash_tree.frontier(H)
+            local leaves = {}
+            expect.equal(hash_tree.frontier_get_root_hash(frontier), reference_root(leaves)) -- empty tree
+            for k = 1, 100 do
+                leaves[k] = leaf(k)
+                hash_tree.frontier_push_back(frontier, leaves[k])
+                expect.equal(hash_tree.frontier_get_root_hash(frontier), reference_root(leaves))
+            end
+        end)
+
+        it("resumes from the previous epoch's last proof (epoch-split equivalence)", function()
+            for _, n in ipairs({ 5, 8, 16, 33, 100 }) do
+                local leaves = make_leaves(n)
+                local single = hash_tree.frontier_next_proofs(hash_tree.frontier(H), leaves)
+                for split = 1, n - 1 do -- every split that leaves at least one leaf on each side
+                    local first, second = {}, {}
+                    for k = 1, split do
+                        first[k] = leaves[k]
+                    end
+                    for k = split + 1, n do
+                        second[#second + 1] = leaves[k]
+                    end
+                    local first_proofs = hash_tree.frontier_next_proofs(hash_tree.frontier(H), first)
+                    -- the previous epoch's last proof seeds the next epoch
+                    local seed = hash_tree.frontier(first_proofs[#first_proofs])
+                    local second_proofs = hash_tree.frontier_next_proofs(seed, second)
+                    for j = 1, #second do
+                        expect_same_proof(second_proofs[j], single[split + j]) -- same proof as the unsplit run
+                    end
+                end
+            end
+        end)
+
+        it("has nothing to prove for an empty epoch", function()
+            expect.equal(#hash_tree.frontier_next_proofs(hash_tree.frontier(H), {}), 0)
+        end)
+    end)
+
+    describe("verify_slice", function()
+        it("verifies proofs at the outputs-tree depth", function()
+            local proofs = hash_tree.frontier_next_proofs(hash_tree.frontier(H), make_leaves(10))
+            for _, proof in ipairs(proofs) do
+                expect.equal(proof.log2_root_size, H)
+                hash_tree.verify_slice(proof) -- must not raise for an untouched proof
+            end
+        end)
+
+        it("rejects a proof with a tampered target", function()
+            local proofs = hash_tree.frontier_next_proofs(hash_tree.frontier(H), make_leaves(4))
+            local proof = proofs[2]
+            proof.target_hash = string.rep("\0", cartesi.HASH_SIZE) -- no longer the hash the proof was built for
+            expect.fail(function()
+                hash_tree.verify_slice(proof)
+            end)
+        end)
+    end)
+end)
diff --git a/tests/lua/spec-json.lua b/tests/lua/spec-json.lua
new file mode 100644
index 000000000..bc3e77e7f
--- /dev/null
+++ b/tests/lua/spec-json.lua
@@ -0,0 +1,104 @@
+--[[
+Test suite for cartesi.tojson / cartesi.fromjson schema dictionaries.
+Specifically, it provides test coverage for:
+    clua-i-machine.cpp (clua_tojson, clua_fromjson, clua_tojsonschemadict)
+    clua-cartesi.cpp (cartesi.tojson, cartesi.fromjson)
+]]
+
+local lester = require("cartesi.third-party.lester")
+local cartesi = require("cartesi")
+local describe, it, expect = lester.describe, lester.it, lester.expect
+
+describe("tojson / fromjson schema dictionary", function()
+    local machine <close> = cartesi.machine({ ram = { length = 0x1000 } }) -- only used below as a source of proofs
+    local HASH = string.rep("\xa5", 32) -- 32 raw bytes standing in for a hash
+
+    it("should roundtrip a plain table with no schema", function()
+        local t = { a = 1, b = "x", c = true, d = { 1, 2, 3 } }
+        expect.equal(cartesi.fromjson(cartesi.tojson(t)), t)
+    end)
+
+    it("should serialize bare scalars with no schema", function()
+        expect.equal(cartesi.tojson(42), "42")
+        expect.equal(cartesi.tojson("str"), '"str"')
+        expect.equal(cartesi.fromjson(cartesi.tojson(42)), 42)
+        expect.equal(cartesi.fromjson(cartesi.tojson("str")), "str")
+    end)
+
+    it("should honor the indent argument", function()
+        expect.truthy(cartesi.tojson({ a = 1 }, 2):find("\n", 1, true)) -- indented output must contain a newline
+    end)
+
+    it("should serialize a bare hash under the Base64 schema", function()
+        local j = cartesi.tojson(HASH, nil, "Base64")
+        -- in JSON the hash rides as base64 text (44 chars for 32 bytes), not raw binary
+        expect.equal(#cartesi.fromjson(j), 44)
+        -- with the schema it decodes back to the original 32 binary bytes
+        expect.equal(cartesi.fromjson(j, "Base64"), HASH)
+    end)
+
+    it("should apply user schema types Base64 and ArrayIndex", function()
+        local SCHEMA = { Msg = { hash = "Base64", n = "ArrayIndex" } }
+        local msg = { hash = HASH, n = 5, label = "hi" } -- label has no schema entry
+        local j = cartesi.tojson(msg, nil, "Msg", SCHEMA)
+        -- ArrayIndex is stored 0-based in JSON, hash rides as base64 text
+        expect.equal(cartesi.fromjson(j).n, 4)
+        expect.equal(#cartesi.fromjson(j).hash, 44)
+        -- with the schema, the hash is binary again and the index is 1-based again
+        local back = cartesi.fromjson(j, "Msg", SCHEMA)
+        expect.equal(back, { hash = HASH, n = 5, label = "hi" })
+    end)
+
+    it("should roundtrip a Proof through the machine schema dictionary", function()
+        local proof = machine:get_proof(0, 12)
+        expect.equal(#proof.root_hash, 32) -- the proof carries raw 32-byte hashes on the Lua side
+        expect.equal(cartesi.fromjson(cartesi.tojson(proof, nil, "Proof"), "Proof"), proof)
+    end)
+
+    it("should resolve machine types referenced from a user type", function()
+        local proof = machine:get_proof(0, 12)
+        local SCHEMA = { Envelope = { final_hash = "Base64", proof = "Proof" } }
+        local env = { final_hash = HASH, proof = proof, who = "referee" } -- who has no schema entry
+        local back = cartesi.fromjson(cartesi.tojson(env, nil, "Envelope", SCHEMA), "Envelope", SCHEMA)
+        expect.equal(back, env)
+    end)
+
+    it("should follow a user type that aliases a compound machine type", function()
+        local proof = machine:get_proof(0, 12)
+        -- a bare top-level alias resolves to its target's schema, not just to a leaf like
+        -- Base64; here it reaches the compound Proof object so the hashes still ride as base64
+        local SCHEMA = { ProofAlias = "Proof" }
+        expect.equal(cartesi.fromjson(cartesi.tojson(proof, nil, "ProofAlias", SCHEMA), "ProofAlias", SCHEMA), proof)
+        -- and a multi-hop alias chain resolves the same way
+        local CHAIN = { A = "B", B = "Proof" }
+        expect.equal(cartesi.fromjson(cartesi.tojson(proof, nil, "A", CHAIN), "A", CHAIN), proof)
+    end)
+
+    it("should leave a Default field as a plain table", function()
+        -- a field typed "Default" carries no schema, so it rides as a plain nested table while a
+        -- sibling Base64 field is still translated
+        local SCHEMA = { Msg = { hash = "Base64", meta = "Default" } }
+        local msg = { hash = HASH, meta = { a = 1, b = "x", c = { 2, 3 } } }
+        expect.equal(cartesi.fromjson(cartesi.tojson(msg, nil, "Msg", SCHEMA), "Msg", SCHEMA), msg)
+    end)
+
+    it("should let user types override machine types of the same name", function()
+        -- the machine dictionary defines Bracket.where as ArrayIndex (0-based in JSON)...
+        expect.equal(cartesi.fromjson(cartesi.tojson({ where = 5 }, nil, "Bracket")).where, 4)
+        -- ...but a user Bracket can reinterpret the same field as a Base64 hash,
+        -- while the nested "Base64" still resolves from the machine dictionary
+        local SCHEMA = { Bracket = { where = "Base64" } }
+        local back = cartesi.fromjson(cartesi.tojson({ where = HASH }, nil, "Bracket", SCHEMA), "Bracket", SCHEMA)
+        expect.equal(back.where, HASH)
+        expect.equal(#back.where, 32)
+    end)
+
+    it("should error on an unknown schema name", function()
+        expect.fail(function()
+            cartesi.tojson({}, nil, "NoSuchType")
+        end, "NoSuchType") -- the error text is expected to mention the unknown name
+        expect.fail(function()
+            cartesi.fromjson("{}", "NoSuchType")
+        end, "NoSuchType")
+    end)
+end)
diff --git a/tests/lua/spec-machine-api.lua b/tests/lua/spec-machine-api.lua
index 6c7bed8b2..72678d07d 100644
--- a/tests/lua/spec-machine-api.lua
+++ b/tests/lua/spec-machine-api.lua
@@ -10,6 +10,7 @@ Specifically, it provides test coverage for:
 
 local lester = require("cartesi.third-party.lester")
 local cartesi = require("cartesi")
+local test_util = require("cartesi.tests.util")
 local describe, it, expect = lester.describe, lester.it, lester.expect
 
 local variants = {
@@ -163,5 +164,49 @@ for _, variant in ipairs(variants) do
                 expect.equal(machine:get_address_name(cartesi.AR_LAST_VIRTIO_END - 1), "virtio")
             end)
         end)
+
+        describe("write_memory over shadow state", function()
+            -- Regression: overwriting the whole shadow state (its special case in
+            -- machine::write_memory) resets the hot TLB. Pages written by the guest
+            -- through the write TLB but not yet flushed into the dirty-page tree
+            -- would lose their pending dirty mark, so a later incremental hash would
+            -- not reflect them. write_memory must flush the write TLB dirty pages
+            -- before replacing the shadow.
+            it("should keep the root hash consistent with memory", function()
+                -- auipc t0, 0x2 ; addi t1, x0, 0x42 ; sd t1, 0(t0) ; jal x0, 0
+                -- The store dirties page RAM_START+0x2000 through the write TLB.
+                local program = string.char(
+                    0x97,
+                    0x22,
+                    0x00,
+                    0x00,
+                    0x13,
+                    0x03,
+                    0x20,
+                    0x04,
+                    0x23,
+                    0xb0,
+                    0x62,
+                    0x00,
+                    0x6f,
+                    0x00,
+                    0x00,
+                    0x00
+                ) -- four 32-bit instructions, little-endian, in the order listed above
+                local m <close> = variant.create({ ram = { length = 1 << 20 } }) -- 1 MiB of RAM
+                m:write_memory(cartesi.AR_RAM_START, program)
+                -- Snapshot the shadow while its TLB references no written page.
+                local shadow = m:read_memory(cartesi.AR_SHADOW_STATE_START, cartesi.AR_SHADOW_STATE_LENGTH)
+                -- Establish a baseline so the later hash update is incremental.
+                m:get_root_hash()
+                -- Execute the store, leaving the page dirty in host memory but only
+                -- tracked by the write TLB, not yet by the dirty-page tree.
+                m:run(100) -- presumably ample for the store; the program then spins on jal x0, 0
+                -- Overwrite the shadow with the snapshot, whose TLB no longer
+                -- references the written page.
+                m:write_memory(cartesi.AR_SHADOW_STATE_START, shadow)
+                expect.equal(m:get_root_hash(), test_util.calculate_emulator_hash(m)) -- incremental vs recomputed
+            end)
+        end)
     end)
 end
diff --git a/tests/lua/spec-verify-uarch-failure.lua b/tests/lua/spec-verify-uarch-failure.lua
index 3f33c8d92..02cd7e2ef 100644
--- a/tests/lua/spec-verify-uarch-failure.lua
+++ b/tests/lua/spec-verify-uarch-failure.lua
@@ -106,11 +106,11 @@ local function cmio_should_fail(expected_error, corrupt, options)
     local reason = options.reason or 1
     local data = options.data or "test cmio data"
     local initial_hash = machine:get_root_hash()
-    local log = machine:log_send_cmio_response(reason, data)
+    local log = machine:log_send_cmio_response(initial_hash, reason, data)
     local final_hash = machine:get_root_hash()
     corrupt(log)
     expect.fail(function()
-        machine:verify_send_cmio_response(reason, data, initial_hash, log, final_hash)
+        machine:verify_send_cmio_response(initial_hash, reason, data, initial_hash, log, final_hash)
     end, expected_error)
 end
 
@@ -364,10 +364,11 @@ describe("verify_step_uarch", function()
 end)
 
 -- The access pattern for send_cmio_response with non-empty data is:
---   1: read iflags.Y       (check_read)
---   2: write cmio rx buffer (do_write_memory_with_padding)
---   3: write htif.fromhost  (check_write)
---   4: write iflags.Y       (check_write)
+--   1: read iflags.Y          (check_read)
+--   2: write revert root hash (check_write_memory_with_padding)
+--   3: write cmio rx buffer   (check_write_memory_with_padding)
+--   4: write htif.fromhost    (check_write)
+--   5: write iflags.Y         (check_write)
 
 describe("verify_send_cmio_response", function()
     describe("log structure", function()
@@ -389,8 +390,8 @@ describe("verify_send_cmio_response", function()
             end)
         end)
 
-        it("should reject truncated log (missing buffer write)", function()
-            -- Keep only the first access (read iflags.Y), so do_write_memory_with_padding
+        it("should reject truncated log (missing revert root hash write)", function()
+            -- Keep only the first access (read iflags.Y), so check_write_memory_with_padding
             -- hits "too few accesses in log"
             cmio_should_fail("too few accesses in log", function(log)
                 while #log.accesses > 1 do
@@ -400,8 +401,9 @@ describe("verify_send_cmio_response", function()
         end)
 
         it("should reject truncated log (missing check_read)", function()
-            -- With zero-length data, accesses are: read iflags.Y, write htif.fromhost, write iflags.Y
-            -- Keep only the first two so check_write for iflags.Y hits "too few accesses"
+            -- With zero-length data, accesses are: read iflags.Y, write revert root hash,
+            -- write htif.fromhost, write iflags.Y
+            -- Keep only the first three so check_write for iflags.Y hits "too few accesses"
             cmio_should_fail("too few accesses in log", function(log)
                 log.accesses[#log.accesses] = nil
             end, { data = "" })
@@ -413,9 +415,9 @@ describe("verify_send_cmio_response", function()
             local reason = 1
             local data = "test"
             local initial_hash = machine:get_root_hash()
-            local log = machine:log_send_cmio_response(reason, data)
+            local log = machine:log_send_cmio_response(initial_hash, reason, data)
             expect.fail(function()
-                machine:verify_send_cmio_response(reason, data, initial_hash, log, bad_hash)
+                machine:verify_send_cmio_response(initial_hash, reason, data, initial_hash, log, bad_hash)
             end, "mismatch in root hash after replay")
         end)
     end)
@@ -464,15 +466,15 @@ describe("verify_send_cmio_response", function()
         end)
     end)
 
-    describe("do_write_memory_with_padding (access 2: write cmio rx buffer)", function()
+    describe("check_write_memory_with_padding (access 2: write revert root hash)", function()
         it("should reject wrong type", function()
-            cmio_should_fail("expected 2nd access to write cmio rx buffer", function(log)
+            cmio_should_fail("expected 2nd access to write revert root hash", function(log)
                 log.accesses[2].type = "read"
             end)
         end)
 
         it("should reject wrong address", function()
-            cmio_should_fail("expected address of 2nd access to match address of cmio rx buffer", function(log)
+            cmio_should_fail("expected address of 2nd access to match address of revert root hash", function(log)
                 log.accesses[2].address = 0
             end)
         end)
@@ -483,16 +485,51 @@ describe("verify_send_cmio_response", function()
             end)
         end)
 
+        it("should reject wrong written_hash", function()
+            cmio_should_fail(
+                "logged written hash of revert root hash does not match the hash of data argument",
+                function(log)
+                    log.accesses[2].written_hash = bad_hash
+                end
+            )
+        end)
+
+        it("should reject corrupt sibling hash", function()
+            cmio_should_fail("Mismatch in root hash of 2nd access", function(log)
+                log.accesses[2].sibling_hashes[1] = bad_hash
+            end)
+        end)
+    end)
+
+    describe("check_write_memory_with_padding (access 3: write cmio rx buffer)", function()
+        it("should reject wrong type", function()
+            cmio_should_fail("expected 3rd access to write cmio rx buffer", function(log)
+                log.accesses[3].type = "read"
+            end)
+        end)
+
+        it("should reject wrong address", function()
+            cmio_should_fail("expected address of 3rd access to match address of cmio rx buffer", function(log)
+                log.accesses[3].address = 0
+            end)
+        end)
+
+        it("should reject wrong log2_size", function()
+            cmio_should_fail("expected 3rd access to write 2^", function(log)
+                log.accesses[3].log2_size = 2
+            end)
+        end)
+
         it("should reject corrupt read data", function()
-            cmio_should_fail("hash of read data and read hash at 2nd access does not match", function(log)
-                local size = 1 << log.accesses[2].log2_size
-                log.accesses[2].read = string.rep("\xff", size)
+            cmio_should_fail("hash of read data and read hash at 3rd access does not match", function(log)
+                local size = 1 << log.accesses[3].log2_size
+                log.accesses[3].read = string.rep("\xff", size)
             end)
         end)
 
         it("should reject missing written_hash", function()
-            cmio_should_fail("write 2nd access has no written hash", function(log)
-                log.accesses[2].written_hash = nil
+            cmio_should_fail("write 3rd access has no written hash", function(log)
+                log.accesses[3].written_hash = nil
             end)
         end)
 
@@ -500,77 +537,77 @@ describe("verify_send_cmio_response", function()
             cmio_should_fail(
                 "logged written hash of cmio rx buffer does not match the hash of data argument",
                 function(log)
-                    log.accesses[2].written_hash = bad_hash
+                    log.accesses[3].written_hash = bad_hash
                 end
             )
         end)
 
         it("should reject corrupt written data", function()
-            cmio_should_fail("written hash and written data mismatch at 2nd access", function(log)
-                local size = 1 << log.accesses[2].log2_size
-                log.accesses[2].written = string.rep("\xff", size)
+            cmio_should_fail("written hash and written data mismatch at 3rd access", function(log)
+                local size = 1 << log.accesses[3].log2_size
+                log.accesses[3].written = string.rep("\xff", size)
             end)
         end)
 
         it("should reject corrupt sibling hash", function()
-            cmio_should_fail("Mismatch in root hash of 2nd access", function(log)
-                log.accesses[2].sibling_hashes[1] = bad_hash
+            cmio_should_fail("Mismatch in root hash of 3rd access", function(log)
+                log.accesses[3].sibling_hashes[1] = bad_hash
             end)
         end)
     end)
 
-    describe("check_write (access 3: write htif.fromhost)", function()
+    describe("check_write (access 4: write htif.fromhost)", function()
         it("should reject wrong type", function()
-            cmio_should_fail("expected 3rd access to write htif.fromhost", function(log)
-                log.accesses[3].type = "read"
+            cmio_should_fail("expected 4th access to write htif.fromhost", function(log)
+                log.accesses[4].type = "read"
             end)
         end)
 
         it("should reject wrong address", function()
-            cmio_should_fail("expected 3rd access to write htif.fromhost to address", function(log)
-                log.accesses[3].address = 0
+            cmio_should_fail("expected 4th access to write htif.fromhost to address", function(log)
+                log.accesses[4].address = 0
             end)
         end)
 
         it("should reject wrong log2_size", function()
-            cmio_should_fail("expected 3rd access to write 2^", function(log)
-                log.accesses[3].log2_size = 2
+            cmio_should_fail("expected 4th access to write 2^", function(log)
+                log.accesses[4].log2_size = 2
             end)
         end)
 
         it("should reject missing read data", function()
-            cmio_should_fail("missing read htif.fromhost data at 3rd access", function(log)
-                log.accesses[3].read = nil
+            cmio_should_fail("missing read htif.fromhost data at 4th access", function(log)
+                log.accesses[4].read = nil
             end)
         end)
 
         it("should reject wrong read data size", function()
             cmio_should_fail("expected overwritten data from htif.fromhost to contain 2^", function(log)
-                log.accesses[3].read = "\0"
+                log.accesses[4].read = "\0"
             end)
         end)
 
         it("should reject read data that does not hash to read_hash", function()
             cmio_should_fail("logged read data of htif.fromhost does not hash to the logged read hash", function(log)
-                log.accesses[3].read = string.rep("\xff", #log.accesses[3].read)
+                log.accesses[4].read = string.rep("\xff", #log.accesses[4].read)
             end)
         end)
 
         it("should reject missing written_hash", function()
-            cmio_should_fail("missing written htif.fromhost hash at 3rd access", function(log)
-                log.accesses[3].written_hash = nil
+            cmio_should_fail("missing written htif.fromhost hash at 4th access", function(log)
+                log.accesses[4].written_hash = nil
             end)
         end)
 
         it("should reject missing written data", function()
-            cmio_should_fail("missing written htif.fromhost data at 3rd access", function(log)
-                log.accesses[3].written = nil
+            cmio_should_fail("missing written htif.fromhost data at 4th access", function(log)
+                log.accesses[4].written = nil
             end)
         end)
 
         it("should reject wrong written data size", function()
             cmio_should_fail("expected written htif.fromhost data to contain 2^", function(log)
-                log.accesses[3].written = "\0"
+                log.accesses[4].written = "\0"
             end)
         end)
 
@@ -578,14 +615,14 @@ describe("verify_send_cmio_response", function()
             cmio_should_fail(
                 "logged written data of htif.fromhost does not hash to the logged written hash",
                 function(log)
-                    log.accesses[3].written = string.rep("\xff", #log.accesses[3].written)
+                    log.accesses[4].written = string.rep("\xff", #log.accesses[4].written)
                 end
             )
         end)
 
         it("should reject value that does not match logged written value", function()
             cmio_should_fail("value being written to htif.fromhost does not match", function(log)
-                local a = log.accesses[3]
+                local a = log.accesses[4]
                 local new_written = string.rep("\x42", #a.written)
                 a.written = new_written
                 a.written_hash = cartesi.keccak256(new_written)
@@ -594,7 +631,7 @@ describe("verify_send_cmio_response", function()
 
         it("should reject written data that differs from read in unexpected way", function()
             cmio_should_fail("doesn't differ from the logged read data only by the written word", function(log)
-                local a = log.accesses[3]
+                local a = log.accesses[4]
                 -- htif.fromhost is at offset 16 within the 32-byte leaf,
                 -- so we corrupt byte 0 (outside the written word) while keeping the word intact
                 local corrupted = string.char(a.written:byte(1) ~ 0xff) .. a.written:sub(2)
@@ -604,30 +641,30 @@ describe("verify_send_cmio_response", function()
         end)
 
         it("should reject corrupt sibling hash", function()
-            cmio_should_fail("Mismatch in root hash of 3rd access", function(log)
-                log.accesses[3].sibling_hashes[1] = bad_hash
+            cmio_should_fail("Mismatch in root hash of 4th access", function(log)
+                log.accesses[4].sibling_hashes[1] = bad_hash
             end)
         end)
     end)
 
-    describe("ordinal coverage (4th access: write iflags.Y)", function()
-        it("should reject wrong type on 4th access", function()
-            cmio_should_fail("expected 4th access to write iflags.Y", function(log)
-                log.accesses[4].type = "read"
+    describe("ordinal coverage (5th access: write iflags.Y)", function()
+        it("should reject wrong type on 5th access", function()
+            cmio_should_fail("expected 5th access to write iflags.Y", function(log)
+                log.accesses[5].type = "read"
             end)
         end)
     end)
 
     describe("zero-length data (no buffer write)", function()
-        it("should reject wrong type on 2nd access", function()
-            cmio_should_fail("expected 2nd access to write htif.fromhost", function(log)
-                log.accesses[2].type = "read"
+        it("should reject wrong type on 3rd access", function()
+            cmio_should_fail("expected 3rd access to write htif.fromhost", function(log)
+                log.accesses[3].type = "read"
             end, { data = "" })
         end)
 
-        it("should reject wrong type on 3rd access", function()
-            cmio_should_fail("expected 3rd access to write iflags.Y", function(log)
-                log.accesses[3].type = "read"
+        it("should reject wrong type on 4th access", function()
+            cmio_should_fail("expected 4th access to write iflags.Y", function(log)
+                log.accesses[4].type = "read"
             end, { data = "" })
         end)
     end)
diff --git a/tests/lua/test-spec.lua b/tests/lua/test-spec.lua
index d3a647404..fe0725622 100755
--- a/tests/lua/test-spec.lua
+++ b/tests/lua/test-spec.lua
@@ -26,12 +26,14 @@ require("spec-verify-uarch-failure")
 require("spec-fuzzer-bugs")
 require("spec-hash-functions")
 require("spec-hash-tree")
+require("spec-hash-tree-lua")
 require("spec-collect-hashes")
 require("spec-backing-stores")
 require("spec-runtime-console")
 require("spec-cm-cli")
 require("spec-evmu")
 require("spec-machine-api")
+require("spec-json")
 
 lester.report() -- Print overall statistic of the tests run.
 lester.exit() -- Exit with success if all tests passed.
diff --git a/tests/lua/uarch-riscv-tests.lua b/tests/lua/uarch-riscv-tests.lua
index 1ebe4c94c..55ffb6ba9 100755
--- a/tests/lua/uarch-riscv-tests.lua
+++ b/tests/lua/uarch-riscv-tests.lua
@@ -76,9 +76,9 @@ local riscv_tests = {
     { "rv64ui-uarch-xori.bin", 177 },
     { "rv64ui-uarch-fence.bin", 12 },
     { "rv64ui-uarch-ecall-putchar.bin", 14 },
-    { "rv64ui-uarch-ecall-mark-page-dirty.bin", 15 },
     { "rv64ui-uarch-ecall-write-tlb.bin", 46 },
     { "rv64ui-uarch-ecall-unsupported.bin", 1, "unsupported ecall function" },
+    { "rv64ui-uarch-ecall-removed-mark-page-dirty.bin", 1, "unsupported ecall function" },
     { "rv64ui-uarch-ebreak.bin", 1, "uarch aborted" },
 }
 
@@ -520,6 +520,64 @@ local function create_json_reset_log()
     return ctx
 end
 
+local function create_json_reset_rejected_log()
+    local machine <close> = build_machine()
+    local test_name = "reset-uarch-rejected"
+    machine:write_reg("uarch_halt_flag", 1)
+    -- pretend an input was fed from a state with this root hash and later rejected
+    local revert_root_hash = machine:get_root_hash()
+    machine:write_revert_root_hash(revert_root_hash)
+    machine:write_reg("iflags_Y", 1)
+    machine:write_reg("htif_tohost_dev", cartesi.HTIF_DEV_YIELD)
+    machine:write_reg("htif_tohost_cmd", cartesi.HTIF_YIELD_CMD_MANUAL)
+    machine:write_reg("htif_tohost_reason", cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED)
+    local initial_root_hash = machine:get_root_hash()
+    local log = machine:log_reset_uarch()
+    local out = create_json_log_file(test_name .. "-steps")
+    write_log_to_file(log, out, 0, true)
+    out:close()
+    local ctx = {
+        initial_root_hash = initial_root_hash,
+        -- the reset reverts the canonical state to the recorded revert root hash
+        final_root_hash = revert_root_hash,
+        ram_image = "",
+        test_name = test_name,
+        expected_cycles = 1,
+        step_count = 1,
+        failed = false,
+        accesses_count = #log.accesses,
+    }
+    return ctx
+end
+
+local function create_json_reset_accepted_log()
+    local machine <close> = build_machine()
+    local test_name = "reset-uarch-accepted"
+    machine:write_reg("uarch_halt_flag", 1)
+    -- pretend an input was fed and later accepted, so the reset must not revert
+    machine:write_reg("iflags_Y", 1)
+    machine:write_reg("htif_tohost_dev", cartesi.HTIF_DEV_YIELD)
+    machine:write_reg("htif_tohost_cmd", cartesi.HTIF_YIELD_CMD_MANUAL)
+    machine:write_reg("htif_tohost_reason", cartesi.HTIF_YIELD_MANUAL_REASON_RX_ACCEPTED)
+    local initial_root_hash = machine:get_root_hash()
+    local log = machine:log_reset_uarch()
+    local out = create_json_log_file(test_name .. "-steps")
+    write_log_to_file(log, out, 0, true)
+    out:close()
+    local ctx = {
+        initial_root_hash = initial_root_hash,
+        -- no revert: the canonical state is the post-reset state
+        final_root_hash = machine:get_root_hash(),
+        ram_image = "",
+        test_name = test_name,
+        expected_cycles = 1,
+        step_count = 1,
+        failed = false,
+        accesses_count = #log.accesses,
+    }
+    return ctx
+end
+
 local function create_json_send_cmio_response_log()
     local machine <close> = build_machine()
     local test_name = "send-cmio-response"
@@ -527,7 +585,36 @@ local function create_json_send_cmio_response_log()
     local reason = 1
     machine:write_reg("iflags_Y", 1)
     local initial_root_hash = machine:get_root_hash()
-    local log = machine:log_send_cmio_response(reason, response_data)
+    local log = machine:log_send_cmio_response(initial_root_hash, reason, response_data)
+    local out = create_json_log_file(test_name .. "-steps")
+    write_log_to_file(log, out, 0, true)
+    out:close()
+    local ctx = {
+        initial_root_hash = initial_root_hash,
+        final_root_hash = machine:get_root_hash(),
+        ram_image = "",
+        test_name = test_name,
+        expected_cycles = 1,
+        step_count = 1,
+        failed = false,
+        accesses_count = #log.accesses,
+    }
+    return ctx
+end
+
+local function create_json_send_cmio_response_noop_log()
+    local machine <close> = build_machine()
+    local test_name = "send-cmio-response-noop"
+    local response_data = "This is a test cmio response"
+    local reason = cartesi.HTIF_YIELD_REASON_ADVANCE_STATE
+    -- the machine yielded manual, but rejected the previous input, so the
+    -- advance-state response is logged as a no-op
+    machine:write_reg("iflags_Y", 1)
+    machine:write_reg("htif_tohost_dev", cartesi.HTIF_DEV_YIELD)
+    machine:write_reg("htif_tohost_cmd", cartesi.HTIF_YIELD_CMD_MANUAL)
+    machine:write_reg("htif_tohost_reason", cartesi.HTIF_YIELD_MANUAL_REASON_RX_REJECTED)
+    local initial_root_hash = machine:get_root_hash()
+    local log = machine:log_send_cmio_response(initial_root_hash, reason, response_data)
     local out = create_json_log_file(test_name .. "-steps")
     write_log_to_file(log, out, 0, true)
     out:close()
@@ -579,10 +666,13 @@ local function json_step_logs(tests)
     if create_uarch_reset_log then
         local ctx = create_json_reset_log()
         contexts[#contexts + 1] = ctx
+        contexts[#contexts + 1] = create_json_reset_rejected_log()
+        contexts[#contexts + 1] = create_json_reset_accepted_log()
     end
     if create_send_cmio_response_log then
         local ctx = create_json_send_cmio_response_log()
         contexts[#contexts + 1] = ctx
+        contexts[#contexts + 1] = create_json_send_cmio_response_noop_log()
     end
 
     -- build catalog
diff --git a/tests/misc/test-machine-c-api.cpp b/tests/misc/test-machine-c-api.cpp
index 10cce41d3..a2c5a7d39 100644
--- a/tests/misc/test-machine-c-api.cpp
+++ b/tests/misc/test-machine-c-api.cpp
@@ -436,7 +436,10 @@ BOOST_FIXTURE_TEST_CASE_NOLINT(nvram_no_start_test, incomplete_machine_fixture)
     cm_error error_code = test_create_new(dumped_config.c_str(), nullptr, nullptr, &_machine);
     BOOST_CHECK_EQUAL(error_code, CM_ERROR_OK);
     std::array<uint8_t, 4> read_data{};
-    error_code = cm_read_memory(_machine, CM_AR_DRIVE_START, read_data.data(), read_data.size());
+    // A drive without an explicit start is auto-placed past the end of RAM, at
+    // CM_AR_RAM_START plus the RAM length rounded up to the next power of two.
+    // The fixture's RAM length (1 << 20) is already a power of two.
+    error_code = cm_read_memory(_machine, CM_AR_RAM_START + (1 << 20), read_data.data(), read_data.size());
     BOOST_CHECK_EQUAL(error_code, CM_ERROR_OK);
 }
 
@@ -446,7 +449,19 @@ BOOST_FIXTURE_TEST_CASE_NOLINT(nvram_no_length_no_file_test, incomplete_machine_
     cm_error error_code = test_create_new(dumped_config.c_str(), nullptr, nullptr, &_machine);
     BOOST_CHECK_EQUAL(error_code, CM_ERROR_RUNTIME_ERROR);
     std::string result = cm_get_last_error_message();
-    std::string origin("nvram 0 has no length");
+    std::string origin("unable to auto-detect length of nvram 0 with empty image file");
+    BOOST_CHECK_EQUAL(origin, result);
+}
+
+// A length whose next power of two, once aligned, leaves no address space past
+// its own end makes start auto-detection overflow, so it must be rejected.
+BOOST_FIXTURE_TEST_CASE_NOLINT(nvram_no_start_space_test, incomplete_machine_fixture) {
+    _machine_config["nvram"] = {{{"length", 0x8000000000000000}}};
+    const auto dumped_config = _machine_config.dump();
+    cm_error error_code = test_create_new(dumped_config.c_str(), nullptr, nullptr, &_machine);
+    BOOST_CHECK_EQUAL(error_code, CM_ERROR_RUNTIME_ERROR);
+    std::string result = cm_get_last_error_message();
+    std::string origin("no address space to auto-detect start of nvram 0");
     BOOST_CHECK_EQUAL(origin, result);
 }
 
@@ -827,6 +842,43 @@ BOOST_FIXTURE_TEST_CASE_NOLINT(get_root_hash_machine_hash_test, ordinary_machine
     BOOST_CHECK_EQUAL_COLLECTIONS(verification.begin(), verification.end(), result_hash, result_hash + sizeof(cm_hash));
 }
 
+BOOST_AUTO_TEST_CASE_NOLINT(read_revert_root_hash_null_machine_test) {
+    cm_hash result_hash;
+    cm_error error_code = cm_read_revert_root_hash(nullptr, &result_hash);
+    BOOST_CHECK_EQUAL(error_code, CM_ERROR_INVALID_ARGUMENT);
+}
+
+BOOST_FIXTURE_TEST_CASE_NOLINT(read_revert_root_hash_null_hash_test, ordinary_machine_fixture) {
+    cm_error error_code = cm_read_revert_root_hash(_machine, nullptr);
+    BOOST_CHECK_EQUAL(error_code, CM_ERROR_INVALID_ARGUMENT);
+}
+
+BOOST_AUTO_TEST_CASE_NOLINT(write_revert_root_hash_null_machine_test) {
+    cm_hash hash{};
+    cm_error error_code = cm_write_revert_root_hash(nullptr, &hash);
+    BOOST_CHECK_EQUAL(error_code, CM_ERROR_INVALID_ARGUMENT);
+}
+
+BOOST_FIXTURE_TEST_CASE_NOLINT(write_revert_root_hash_null_hash_test, ordinary_machine_fixture) {
+    cm_error error_code = cm_write_revert_root_hash(_machine, nullptr);
+    BOOST_CHECK_EQUAL(error_code, CM_ERROR_INVALID_ARGUMENT);
+}
+
+BOOST_FIXTURE_TEST_CASE_NOLINT(revert_root_hash_round_trip_test, ordinary_machine_fixture) {
+    cm_hash original_hash;
+    cm_error error_code = cm_get_root_hash(_machine, &original_hash);
+    BOOST_REQUIRE_EQUAL(error_code, CM_ERROR_OK);
+
+    error_code = cm_write_revert_root_hash(_machine, &original_hash);
+    BOOST_REQUIRE_EQUAL(error_code, CM_ERROR_OK);
+
+    cm_hash result_hash;
+    error_code = cm_read_revert_root_hash(_machine, &result_hash);
+    BOOST_REQUIRE_EQUAL(error_code, CM_ERROR_OK);
+    BOOST_CHECK_EQUAL_COLLECTIONS(original_hash, original_hash + sizeof(cm_hash), result_hash,
+        result_hash + sizeof(cm_hash));
+}
+
 BOOST_AUTO_TEST_CASE_NOLINT(get_proof_null_machine_test) {
     const char *proof{};
     cm_error error_code = cm_get_proof(nullptr, 0, CM_HASH_TREE_LOG2_PAGE_SIZE, CM_HASH_TREE_LOG2_ROOT_SIZE, &proof);
diff --git a/tests/scripts/run-lua-tests.sh b/tests/scripts/run-lua-tests.sh
index ef360a19e..7ebb2a21d 100755
--- a/tests/scripts/run-lua-tests.sh
+++ b/tests/scripts/run-lua-tests.sh
@@ -43,5 +43,5 @@ for x in ${TEST_LIST[@]}; do
         continue
     fi
     echo "Running $x"
-    echo -n 'CTSICTSI' | (bash -c "${LUA} $test_path local") || exit 1
+    bash -c "${LUA} $test_path local" || exit 1
 done
diff --git a/tests/uarch/Makefile b/tests/uarch/Makefile
index 04079ab09..e4ce44bd5 100644
--- a/tests/uarch/Makefile
+++ b/tests/uarch/Makefile
@@ -26,7 +26,7 @@ RISCV_OBJDUMP ?= $(RISCV_PREFIX)objdump --disassemble-all --disassemble-zeroes -
 RISCV_OBJCOPY ?= $(RISCV_PREFIX)objcopy -S -O binary
 
 # Tests provided by us
-TESTS = fence ebreak ecall-putchar ecall-unsupported ecall-mark-page-dirty ecall-write-tlb
+TESTS = fence ebreak ecall-putchar ecall-unsupported ecall-removed-mark-page-dirty ecall-write-tlb
 SRC_DIR = $(abspath .)
 BUILDDIR ?= $(abspath ./build)
 TEST_NAMES = $(addprefix rv64ui-uarch-, $(TESTS))
diff --git a/tests/uarch/ecall-mark-page-dirty.S b/tests/uarch/ecall-removed-mark-page-dirty.S
similarity index 83%
rename from tests/uarch/ecall-mark-page-dirty.S
rename to tests/uarch/ecall-removed-mark-page-dirty.S
index 95f95fa22..300c2c3db 100644
--- a/tests/uarch/ecall-mark-page-dirty.S
+++ b/tests/uarch/ecall-removed-mark-page-dirty.S
@@ -21,12 +21,10 @@
 RVTEST_RV64U
 RVTEST_CODE_BEGIN
 
-  li a7, UARCH_ECALL_FN_MARK_DIRTY_PAGE_DEF
-  li a0, 0   // physical address in page to be marked dirty
-  li a1, 0   // index of PMA where page falls
+  li a7, 3 // function code 3 was mark_dirty_page, now removed and unsupported
   ecall
 
-RVTEST_PASS
+RVTEST_FAIL // the unsupported ecall above must abort execution, so this point must never be reached
 
 RVTEST_CODE_END
 
diff --git a/tests/uarch/rv64ui-uarch-catalog.json b/tests/uarch/rv64ui-uarch-catalog.json
index 716d33797..b94403318 100644
--- a/tests/uarch/rv64ui-uarch-catalog.json
+++ b/tests/uarch/rv64ui-uarch-catalog.json
@@ -51,7 +51,6 @@
     { "path": "rv64ui-uarch-xori.bin", "cycle": 178},
     { "path": "rv64ui-uarch-fence.bin", "cycle": 13},
     { "path": "rv64ui-uarch-ecall-putchar.bin", "cycle": 15},
-    { "path": "rv64ui-uarch-ecall-mark-page-dirty.bin", "cycle": 15},
     { "path": "rv64ui-uarch-ecall-write-tlb.bin", "cycle": 46}
 
 ]
diff --git a/tools/docker-entrypoint.sh b/tools/docker-entrypoint.sh
index 34385844b..eb478aead 100644
--- a/tools/docker-entrypoint.sh
+++ b/tools/docker-entrypoint.sh
@@ -17,26 +17,26 @@
 #
 
 if [ -z "$GID" -o -z "$UID" -o -z "$USER" -o -z "$GROUP" ]; then
-    echo Running as $(whoami)
+    echo Running as $(whoami) >&2
     exec "$@"
 else
   if [ ! $(getent group $GID) ]; then
     if [ $(getent group $GROUP) ]; then
-      echo Group name $GROUP already exists
+      echo Group name $GROUP already exists >&2
       GROUP=container-group-$GID
     fi
     groupadd -g $GID $GROUP
   else
-    echo The id $GID of group $GROUP already exists
+    echo The id $GID of group $GROUP already exists >&2
   fi
   if [ ! $(getent passwd $UID) ]; then
     if [ $(getent passwd $USER) ]; then
-      echo User name $USER already exists.
+      echo User name $USER already exists. >&2
       USER=container-user-$UID
     fi
     useradd -u $UID -g $GID -G $GROUP $USER
   else
-    echo The id $UID of user $USER already exists
+    echo The id $UID of user $USER already exists >&2
   fi
   USERNAME=$(id -nu $UID)
   export HOME=/home/$USERNAME
@@ -51,6 +51,6 @@ else
     chown $UID:$GID $(/usr/bin/tty)
   fi
 
-  echo Running as $USERNAME and group $(id -ng $UID)
+  echo Running as $USERNAME and group $(id -ng $UID) >&2
   exec gosu $USERNAME "$@"
 fi
diff --git a/uarch/Makefile b/uarch/Makefile
index 7da2c771a..db6546b39 100644
--- a/uarch/Makefile
+++ b/uarch/Makefile
@@ -49,6 +49,7 @@ WARNFLAGS := -Wall -Wextra -Wpedantic -Wno-array-bounds -Werror
 
 BASEFLAGS := -march=rv64i -mabi=lp64 $(UBFLAGS) $(WARNFLAGS) \
 	-DMICROARCHITECTURE=1 \
+	-DNO_STD_VECTOR=1 \
 	-DAVOID_NATIVE_UINT128_T=1 \
 	-ffreestanding \
 	-nostartfiles \
diff --git a/uarch/uarch-bridge-state-access.hpp b/uarch/uarch-bridge-state-access.hpp
index 1a3c6a889..8eee1e76d 100644
--- a/uarch/uarch-bridge-state-access.hpp
+++ b/uarch/uarch-bridge-state-access.hpp
@@ -196,11 +196,6 @@ class uarch_bridge_state_access :
         return false;
     }
 
-    // NOLINTNEXTLINE(readability-convert-member-functions-to-static)
-    void do_mark_dirty_page(uint64_t paddr, uint64_t pma_index) const {
-        ua_mark_dirty_page_ECALL(paddr, pma_index);
-    }
-
     constexpr const char *do_get_name() const { // NOLINT(readability-convert-member-functions-to-static)
         return "uarch_bridge_state_access";
     }
diff --git a/uarch/uarch-ecall.c b/uarch/uarch-ecall.c
index 9b85b739d..15f0085c5 100644
--- a/uarch/uarch-ecall.c
+++ b/uarch/uarch-ecall.c
@@ -41,18 +41,6 @@ void ua_putchar_ECALL(uint8_t c) {
     );
 }
 
-void ua_mark_dirty_page_ECALL(uint64_t paddr, uint64_t pma_index) {
-    // NOLINTNEXTLINE(hicpp-no-assembler)
-    asm volatile("mv a7, %0\n"
-                 "mv a0, %1\n"
-                 "mv a1, %2\n"
-                 "ecall\n"
-                 : // no output
-                 : "r"(UARCH_ECALL_FN_MARK_DIRTY_PAGE_DEF), "r"(paddr), "r"(pma_index)
-                 : "a7", "a0", "a1" // clobbered registers
-    );
-}
-
 void ua_write_tlb_ECALL(uint64_t use, uint64_t slot_index, uint64_t vaddr_page, uint64_t vp_offset,
     uint64_t pma_index) {
     // NOLINTNEXTLINE(hicpp-no-assembler)
diff --git a/uarch/uarch-ecall.h b/uarch/uarch-ecall.h
index 08bdc27af..0e161a021 100644
--- a/uarch/uarch-ecall.h
+++ b/uarch/uarch-ecall.h
@@ -26,7 +26,6 @@ extern "C" {
 
 void ua_halt_ECALL();
 void ua_putchar_ECALL(uint8_t c);
-void ua_mark_dirty_page_ECALL(uint64_t paddr, uint64_t pma_index);
 void ua_write_tlb_ECALL(uint64_t use, uint64_t slot_index, uint64_t vaddr_page, uint64_t vp_offset, uint64_t pma_index);
 
 #ifdef __cplusplus