diff --git a/.github/workflows/docs.yml b/.github/workflows/docs.yml
new file mode 100644
index 000000000..2fb740ede
--- /dev/null
+++ b/.github/workflows/docs.yml
@@ -0,0 +1,69 @@
+name: Deploy docs to GitHub Pages
+
+# Rebuilds the docs site and publishes it to GitHub Pages whenever the
+# components, the docs sources, or the build tooling change on trunk.
+on:
+  push:
+    branches: [trunk]
+    paths:
+      - 'components/**'
+      - 'docs/**'
+      - 'bin/build-docs*'
+      - 'composer.json'
+      - 'composer.lock'
+      - '.github/workflows/docs.yml'
+  workflow_dispatch:
+
+# Least privilege by default; the deploy job opts in to the Pages scopes.
+permissions:
+  contents: read
+
+# Only one Pages deployment at a time. Queued runs are superseded by newer
+# ones, but a deployment that has already started is allowed to finish.
+concurrency:
+  group: pages
+  cancel-in-progress: false
+
+jobs:
+  build:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Set up PHP
+        uses: shivammathur/setup-php@v2
+        with:
+          php-version: '8.1'
+          tools: composer
+          coverage: none
+
+      - name: Install dependencies
+        run: composer install --no-dev --optimize-autoloader --no-progress
+
+      # The zip lands in docs/assets, which is uploaded with the rest of ./docs.
+      - name: Bundle toolkit and regenerate docs
+        run: |
+          mkdir -p docs/assets
+          rm -f docs/assets/php-toolkit.zip
+          zip -qr docs/assets/php-toolkit.zip components vendor bootstrap.php composer.json \
+            -x "*/Tests/*" "*/tests/*" "*/.git/*" "*/.github/*" "*/node_modules/*"
+          python3 bin/build-docs.py
+
+      - uses: actions/upload-pages-artifact@v3
+        with:
+          path: ./docs
+
+  deploy:
+    needs: build
+    runs-on: ubuntu-latest
+    # pages: write publishes the site; id-token: write lets deploy-pages
+    # request the OIDC token it uses to verify the deployment source.
+    permissions:
+      pages: write
+      id-token: write
+    environment:
+      name: github-pages
+      url: ${{ steps.deployment.outputs.page_url }}
+    steps:
+      - id: deployment
+        uses: actions/deploy-pages@v4
diff --git a/.github/workflows/snippet-tests.yml b/.github/workflows/snippet-tests.yml
new file mode 100644
index 000000000..7b8ab1f24
--- /dev/null
+++ b/.github/workflows/snippet-tests.yml
@@ -0,0 +1,53 @@
+name: Verify docs snippets
+
+# Runs the PHP snippets in bin/_docs_components.py against the local toolkit
+# and compares stdout against bin/_expected_outputs.json. Anything that drifts
+# fails CI; anything that errors out also fails CI.
+#
+# Snippets that can't run locally (need network, a listening port, or other
+# Playground-only features) are not in the JSON and are skipped — the runner
+# only enforces matches for snippets that already have captured output.
+
+on:
+  pull_request:
+    paths:
+      - 'components/**'
+      - 'bin/_docs_components.py'
+      - 'bin/_expected_outputs.json'
+      - 'bin/run-snippets.py'
+      - 'composer.json'
+      - 'composer.lock'
+      - '.github/workflows/snippet-tests.yml'
+  push:
+    branches: [trunk]
+  workflow_dispatch:
+
+# The job only reads the repository, so pin the token to read-only.
+permissions:
+  contents: read
+
+jobs:
+  run-snippets:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Set up PHP
+        uses: shivammathur/setup-php@v2
+        with:
+          php-version: '8.3'
+          tools: composer
+          coverage: none
+
+      - name: Set up Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: '3.11'
+
+      - name: Install toolkit dependencies
+        run: composer install --no-dev --optimize-autoloader --no-progress
+
+      # Invoke through python3 (as docs.yml does for build-docs.py) so the step
+      # does not depend on the script's executable bit or shebang.
+      - name: Run docs snippets and compare to expected output
+        run: python3 bin/run-snippets.py --check
diff --git a/bin/_docs_components.py b/bin/_docs_components.py
new file mode 100644
index 000000000..29aed0ef1
--- /dev/null
+++ b/bin/_docs_components.py
@@ -0,0 +1,2871 @@
+# Component catalog for the runnable docs site. Imported by bin/build-docs.py.
+#
+# Format: list of (slug, title, lede_html, install_package, sections), where sections is a list of
+#   (heading, body_html, snippet_or_None)
+# and snippet is (filename, php_code). Use (filename, php_code, False) for a
+# non-runnable <php-snippet runnable="false"> example.
+#
+# Both body_html and php_code may use HTML entities (&lt; &gt; &amp; &quot; &#x27;)
+# — the renderer in build-docs.py decodes them before output. That keeps the
+# embedded snippets readable when this file is edited as Python.
+
+LOAD = "require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';\n\n"  # autoloader require that php() puts ahead of each snippet
+
+
+def php(snippet):  # Wrap a snippet body into a complete PHP file: open tag, LOAD, then the code.
+    return ''.join(('<?php\n', LOAD, snippet))
+
+
+COMPONENTS = []  # component tuples are appended below, one COMPONENTS.append(...) per component
+
+
+# Upstream credits surfaced as a callout on each reference page.
+# Keep these brief — the landing page's "Credits" section carries the longer note.
+CREDITS = {  # component slug -> (callout title, callout body HTML)
+    'html': (
+        'Ported from WordPress core',
+        'The HTML component is a port of WordPress core\'s '
+        '<code>WP_HTML_Tag_Processor</code> and <code>WP_HTML_Processor</code>. '
+        'Source: <a href="https://github.com/WordPress/wordpress-develop/tree/trunk/src/wp-includes/html-api">WordPress/wordpress-develop</a>. '
+        'Bug fixes flow in both directions.',
+    ),
+    'blockparser': (
+        'WordPress core, packaged standalone',
+        '<code>WP_Block_Parser</code> is WordPress core\'s block parser, '
+        'packaged here so importers and linters can read '
+        '<a href="https://developer.wordpress.org/block-editor/reference-guides/block-api/">block markup</a> '
+        'without booting WordPress. Source: '
+        '<a href="https://github.com/WordPress/wordpress-develop/blob/trunk/src/wp-includes/class-wp-block-parser.php">WordPress/wordpress-develop</a>.',
+    ),
+    'markdown': (
+        'Built on league/commonmark',
+        'Markdown parsing is delegated to '
+        '<a href="https://commonmark.thephpleague.com/"><code>league/commonmark</code></a>; '
+        'YAML frontmatter is handled by '
+        '<a href="https://github.com/webuni/front-matter"><code>webuni/front-matter</code></a>. '
+        'The toolkit\'s own work is the bridge between CommonMark\'s AST and '
+        '<a href="https://developer.wordpress.org/block-editor/reference-guides/block-api/">WordPress block markup</a>, in both directions.',
+    ),
+    'polyfill': (
+        'WordPress-shaped behavior',
+        'When WordPress is loaded, every function in this component defers to WordPress. '
+        'The standalone implementations of <code>esc_html()</code>, <code>add_filter()</code>, '
+        '<code>__()</code>, and friends match WordPress core\'s behavior so the same code runs '
+        'inside and outside the platform.',
+    ),
+}
+
+
+COMPONENT_GUIDES = {  # component slug -> {'mental_model': HTML paragraphs, 'journey': ((step title, step description HTML), ...)}
+    'html': {
+        'mental_model':
+            '<p>Start with the tag processor when you need to change markup that WordPress already stored: add <code>loading="lazy"</code> to post images, make feed links absolute, or remove inline event handlers from pasted HTML. It scans forward and preserves every byte it does not touch.</p>'
+            '<p>Switch to the full processor when the browser tree matters. Use it to find images inside figures, walk heading depth, or return to a saved parent after inspecting child tags.</p>',
+        'journey': (
+            ('Rewrite one tag safely', 'Add image attributes without parsing a DOM or changing surrounding whitespace.'),
+            ('Protect real content', 'Rewrite relative links, remove script behavior, and add CSP nonces without clobbering author-provided attributes.'),
+            ('Use structure when you need it', 'Find figure images, print a heading outline, and use bookmarks to annotate a parent after scanning its children.'),
+        ),
+    },
+    'zip': {
+        'mental_model':
+            '<p>Treat a ZIP as a small filesystem with a table of contents at the end. Read the central directory, open one entry stream, and copy that entry where it belongs.</p>'
+            '<p>Use <code>ZipFilesystem</code> when your code wants <code>get_contents()</code> and <code>ls()</code>. Use <code>ZipEncoder</code> and <code>ZipDecoder</code> when the archive format matters, such as an EPUB that must store <code>mimetype</code> first and uncompressed.</p>',
+        'journey': (
+            ('Open an archive as files', 'Read <code>readme.txt</code> through <code>ZipFilesystem</code> before touching entry headers.'),
+            ('Write a format with rules', 'Build an EPUB and make the first entry Stored, not Deflated.'),
+            ('Move archives through streams', 'Repack entries, reject <code>../</code> paths, and copy a remote ZIP entry into another filesystem without a manual byte loop.'),
+        ),
+    },
+    'bytestream': {
+        'mental_model':
+            '<p>A read stream separates three actions: pull bytes, inspect the buffer, then consume the bytes you accepted. That pattern lets a parser wait for a full line, a ZIP decoder wait for a complete header, or an HTTP client report progress without losing data.</p>'
+            '<p>Write streams make the destination boring. The caller writes chunks; the sink decides whether those bytes go to memory, a file, a compressor, or another component.</p>',
+        'journey': (
+            ('Read in chunks', 'Pull from memory and files with the same loop, then stop only when the stream reaches end-of-data.'),
+            ('Handle awkward boundaries', 'Read lines split across chunks and connect producers to consumers with <code>MemoryPipe</code>.'),
+            ('Add behavior around bytes', 'Wrap streams with gzip, hashing, limits, and windows while keeping the caller on the same interface.'),
+        ),
+    },
+    'filesystem': {
+        'mental_model':
+            '<p>Write your tool against a filesystem object, not against the host machine. Tests can pass an in-memory tree, a CLI command can pass a local directory, and an importer can pass a ZIP-backed filesystem.</p>'
+            '<p>Every toolkit path uses forward slashes. A path such as <code>wp-content/uploads/2026/logo.png</code> means the same thing on macOS, Windows, Playground, and inside an archive.</p>',
+        'journey': (
+            ('Start in memory', 'Write and list files without touching disk, which makes examples and tests deterministic.'),
+            ('Move to a real backend', 'Use local, SQLite, and atomic-write examples to keep the same calling style while changing storage.'),
+            ('Copy between backends', 'Move a generated theme file from memory to disk, or from a ZIP archive into a local staging directory, through one helper.'),
+        ),
+    },
+    'blockparser': {
+        'mental_model':
+            '<p>The parser turns serialized post content into the block array shape WordPress core returns. It does not render blocks, load <code>block.json</code>, or ask a registry whether a block exists.</p>'
+            '<p>Handle <code>blockName === null</code> first. A real post can contain a paragraph block, a custom block, and loose HTML before or after both.</p>',
+        'journey': (
+            ('Inspect the returned shape', 'Parse one paragraph block and read <code>blockName</code>, <code>attrs</code>, <code>innerBlocks</code>, <code>innerHTML</code>, and <code>innerContent</code>.'),
+            ('Walk the tree', 'Count nested blocks and find custom blocks without writing recursive boilerplate everywhere.'),
+            ('Ask editorial questions', 'Detect skipped heading levels, stale embeds, and blocks that need a migration before import.'),
+        ),
+    },
+    'markdown': {
+        'mental_model':
+            '<p>Use Markdown for files that humans edit and block markup for content that WordPress stores. This component translates the supported middle ground: headings, paragraphs, lists, code blocks, links, images, and frontmatter-backed metadata.</p>'
+            '<p>Keep unsupported syntax visible. A migration tool should tell you that a file contains an unsupported table instead of silently dropping it before publishing.</p>',
+        'journey': (
+            ('Convert one document', 'Turn <code>posts/launch.md</code> into block markup and turn supported blocks back into readable Markdown.'),
+            ('Carry metadata beside content', 'Read frontmatter for title, slug, date, tags, and import hints.'),
+            ('Prepare a folder import', 'Map filenames to slugs, audit generated blocks, and hand the result to DataLiberation when you need WXR.'),
+        ),
+    },
+    'xml': {
+        'mental_model':
+            '<p><code>XMLProcessor</code> walks XML as a cursor. It reads the next tag, exposes attributes and text, records edits, and emits updated XML only when you call <code>get_updated_xml()</code>.</p>'
+            '<p>Query namespaces by URI, not by prefix. In WXR, look for <code>http://wordpress.org/export/1.2/</code> even when the source file writes the prefix as <code>wp:</code>.</p>',
+        'journey': (
+            ('Edit one attribute', 'Bump product prices and see how buffered updates keep untouched XML intact.'),
+            ('Read namespaced exports', 'Find WXR status fields and attachment URLs by namespace URI and local name.'),
+            ('Process export-sized files', 'Rewrite staging URLs and parse OPML without building a full in-memory tree.'),
+        ),
+    },
+    'encoding': {
+        'mental_model':
+            '<p>Validate text with the Encoding helpers before a stricter parser sees unfamiliar bytes. A Latin-1 title from an old export, an overlong UTF-8 sequence in an upload, or a Unicode noncharacter can break XML, JSON, or a database write later in the pipeline — and the further downstream the failure happens, the harder it is to trace.</p>'
+            '<p>The component gives the same answer whether PHP has <code>mbstring</code> available or falls back to the pure-PHP scanner.</p>',
+        'journey': (
+            ('Reject invalid bytes', 'Separate clean UTF-8 from Latin-1 bytes, overlong forms, surrogate halves, and incomplete sequences.'),
+            ('Repair when content matters', 'Replace invalid bytes with <code>U+FFFD</code> when keeping the rest of a post title beats stopping the import.'),
+            ('Check downstream limits', 'Detect noncharacters before writing XML or handing text to a system with stricter Unicode rules.'),
+        ),
+    },
+    'dataliberation': {
+        'mental_model':
+            '<p>Model a migration as a stream of WordPress-shaped entities. Read a post, rewrite its content and metadata, write it out, then move to the next entity.</p>'
+            '<p>The useful work happens between readers and writers: rewrite <code>https://staging.example.test</code> inside HTML, block attributes, CSS, GUIDs, and media URLs; download attachments; and keep enough state to resume after a failed request.</p>',
+        'journey': (
+            ('Write one entity', 'Create a WXR post record and read it back before building a site-sized pipeline.'),
+            ('Transform as you stream', 'Rewrite URLs on each entity without loading the whole export.'),
+            ('Compose a migration', 'Convert a Markdown folder, frontload media with HttpClient, and write WXR through XML and ByteStream layers.'),
+        ),
+    },
+    'git': {
+        'mental_model':
+            '<p>Git stores snapshots as objects: blobs hold file bytes, trees hold directory listings, commits point at trees, and refs name commits.</p>'
+            '<p>This component keeps those objects visible. A browser-based editor can commit generated files, move <code>refs/heads/main</code>, expose a commit tree as a filesystem, and merge another branch without running the <code>git</code> binary.</p>',
+        'journey': (
+            ('Create a snapshot', 'Commit files into an in-memory repository and print the resulting object ID.'),
+            ('Read history by name', 'Resolve refs, walk parent commits, and mount a commit tree with <code>GitFilesystem</code>.'),
+            ('Coordinate edits', 'Create branches, merge content, and keep conflicts explicit for the caller.'),
+        ),
+    },
+    'merge': {
+        'mental_model':
+            '<p>A three-way merge needs the common base, your version, and their version. The base tells the merger whether two lines changed independently or collided.</p>'
+            '<p>Start with line merges for Markdown, config files, and generated PHP. Move to a domain-specific differ only when lines hide the real unit of change.</p>',
+        'journey': (
+            ('See the edit', 'Generate a diff and patch so the merge inputs feel concrete.'),
+            ('Auto-merge independent lines', 'Combine two edits that touch different parts of the same file.'),
+            ('Surface conflicts', 'Return conflict records for a UI, CLI prompt, or sync log instead of guessing a winner.'),
+        ),
+    },
+    'httpclient': {
+        'mental_model':
+            '<p>Make the first request boring: <code>GET https://api.wordpress.org/plugins/info/1.2/</code>, then read the response status and body. From there, add the details the workflow actually needs: a POST body, JSON headers, redirects, cache policy, or a chosen transport.</p>'
+            '<p>When the response becomes a file, keep it as a stream. A plugin installer can show progress while downloading a ZIP, resume a partial archive with <code>Range</code>, and hand the remote body to ZipFilesystem without first building a giant string.</p>',
+        'journey': (
+            ('Start with GET and POST', 'Fetch a URL, submit form data, and build a JSON request before touching lower-level objects.'),
+            ('Configure the request path', 'Choose a transport, follow redirects, cache responses, and report failures with useful context.'),
+            ('Scale the transfer', 'Show progress, keep ten media downloads active, resume a partial ZIP, and stream-unzip a remote archive through Filesystem helpers.'),
+        ),
+    },
+    'httpserver': {
+        'mental_model':
+            '<p>Use HttpServer when a PHP tool needs one local endpoint. A CLI command can open <code>http://127.0.0.1:8765/callback</code> for an OAuth flow, serve fixture JSON to HttpClient tests, or expose a tiny status page during an import.</p>'
+            '<p>The server accepts a connection, parses one request, and gives your handler a response writer. Keep the process lifetime and shutdown rule in your command.</p>',
+        'journey': (
+            ('Serve one response', 'Bind to loopback and return text from a handler.'),
+            ('Route a small local API', 'Branch on method and path for <code>/api/status</code> and <code>/api/echo</code>.'),
+            ('Buffer when headers depend on the body', 'Use the buffered writer when the runtime needs the full response before sending headers.'),
+        ),
+    },
+    'corsproxy': {
+        'mental_model':
+            '<p>A browser app cannot read <code>https://api.github.com/repos/WordPress/php-toolkit</code> unless GitHub sends CORS headers the app can use. A PHP proxy can fetch that URL server-side and return a controlled browser-readable response.</p>'
+            '<p>Deploy the proxy as a gate, not as an open tunnel. Allow <code>api.github.com</code> and <code>raw.githubusercontent.com</code> for a docs tool; reject private IP ranges, unknown hosts, oversized responses, and credential-bearing request headers.</p>',
+        'journey': (
+            ('See the proxy URL shape', 'Request <code>/cors-proxy.php/https://api.github.com/repos/WordPress/php-toolkit</code> from a local PHP server.'),
+            ('Lock down deployment', 'Add a rate limiter and a host allowlist before exposing the proxy.'),
+            ('Use it from the browser', 'Wrap <code>fetch()</code> once, then deploy the PHP script behind nginx or another SAPI.'),
+        ),
+    },
+    'cli': {
+        'mental_model':
+            '<p>Define the command-line contract once, then parse <code>argv</code> against it. The parser returns positional arguments and named options; your application validates them and runs the command.</p>'
+            '<p>A command such as <code>toolkit import posts/launch.md --site=demo --dry-run -vv</code> should not need a console framework just to understand flags, values, and positionals.</p>',
+        'journey': (
+            ('Parse the smallest command', 'Read one boolean flag and one positional argument.'),
+            ('Accept normal shell shapes', 'Handle <code>--port=8080</code>, <code>--port 8080</code>, <code>-p 8080</code>, and bundled booleans such as <code>-afv</code>.'),
+            ('Build command behavior', 'Add required options, help output, and subcommand dispatch in application code.'),
+        ),
+    },
+    'polyfill': {
+        'mental_model':
+            '<p>Load Polyfill when toolkit code runs outside WordPress but still calls WordPress-shaped helpers. Standalone tests can call <code>esc_html()</code>, add a filter, or use a translation stub without booting WordPress.</p>'
+            '<p>The component defines only missing functions. If WordPress or the current PHP runtime already provides a function, the polyfill leaves it alone.</p>',
+        'journey': (
+            ('Backfill missing PHP helpers', 'Use PHP 7.2-compatible helpers without dropping support for older runtimes.'),
+            ('Keep familiar WordPress calls', 'Escape output and keep translation-shaped call sites in standalone tools.'),
+            ('Expose extension points', 'Register filters and actions for library code that needs hooks outside WordPress.'),
+        ),
+    },
+    'blueprints': {
+        'mental_model':
+            '<p>A Blueprint is a versioned recipe for a WordPress site. It can install Gutenberg, set permalink structure, import content, copy files, and run WP-CLI steps in a predictable order.</p>'
+            '<p>The runner supplies the environment: site root, site URL, execution mode, and filesystem access. The validator checks user-authored JSON before the runner mutates the target site.</p>',
+        'journey': (
+            ('Configure the target', 'Create a <code>RunnerConfiguration</code> with the site path, URL, and execution mode.'),
+            ('Generate repeatable recipes', 'Build JSON from PHP when tests or docs need a fresh site with the same plugins and options.'),
+            ('Validate before running', 'Catch misspelled step names and missing fields before installing packages or changing options.'),
+        ),
+    },
+    'coding-standards': {
+        'mental_model':
+            '<p>Turn repeat review comments into PHPCS sniffs. If the project always rejects short ternaries, loose comparisons, or a confusing Yoda condition, the tool should report it before a reviewer does.</p>'
+            '<p>Keep each sniff narrow. A useful sniff names the risky pattern and shows the replacement code shape contributors should write.</p>',
+        'journey': (
+            ('Enable the ruleset', 'Point PHPCS at the toolkit standard from a component or CI job.'),
+            ('Read the rule as review guidance', 'Learn why the Yoda and short-ternary sniffs exist instead of treating them as arbitrary style.'),
+            ('Write the explicit form', 'Replace compact syntax with code that stays clear on PHP 7.2 and across WordPress-style projects.'),
+        ),
+    },
+}
+
+
+STARTER_PATHS = (  # each entry: (path title, one-sentence description, component slugs on that path)
+    (
+        'Content and migration',
+        'Start here when you are importing, exporting, rewriting, or auditing WordPress content.',
+        ('html', 'blockparser', 'markdown', 'xml', 'dataliberation'),
+    ),
+    (
+        'Streams and storage',
+        'Use this path for archives, large files, testable storage backends, and pure-PHP file movement.',
+        ('bytestream', 'filesystem', 'zip', 'git', 'merge'),
+    ),
+    (
+        'Networked tools',
+        'Use this path for clients, local fixture servers, browser-facing proxies, and CLI workflows.',
+        ('httpclient', 'httpserver', 'corsproxy', 'cli'),
+    ),
+    (
+        'WordPress runtime support',
+        'Use this path when your code needs WordPress-shaped helpers, repeatable sites, or project-specific review rules.',
+        ('polyfill', 'blueprints', 'coding-standards'),
+    ),
+)  # NOTE(review): 'encoding' has a COMPONENT_GUIDES entry and relations but is in no starter path — confirm that is intentional
+
+
+COMPONENT_RELATIONS = {  # component slug -> ((related slug, display label, one-line reason to pair them), ...)
+    'html': (
+        ('blockparser', 'BlockParser', 'Parse block comments first, then rewrite the HTML inside each block.'),
+        ('markdown', 'Markdown', 'Convert Markdown to blocks before polishing generated HTML.'),
+        ('dataliberation', 'DataLiberation', 'Rewrite URLs and media references during import/export pipelines.'),
+    ),
+    'zip': (
+        ('filesystem', 'Filesystem', 'Treat an archive like a swappable filesystem backend.'),
+        ('bytestream', 'ByteStream', 'Feed readers and writers without whole-file buffers.'),
+        ('httpclient', 'HttpClient', 'Stream downloaded archives into validation or extraction workflows.'),
+    ),
+    'bytestream': (
+        ('filesystem', 'Filesystem', 'Back file reads and writes with the same stream primitives.'),
+        ('zip', 'Zip', 'Read and write archive entries one stream at a time.'),
+        ('httpclient', 'HttpClient', 'Process request and response bodies incrementally.'),
+    ),
+    'filesystem': (
+        ('bytestream', 'ByteStream', 'Open files as readers and writers instead of loading full strings.'),
+        ('zip', 'Zip', 'Mount archives and copy data between archive-backed and normal filesystems.'),
+        ('git', 'Git', 'Expose repository trees through a filesystem-shaped API.'),
+    ),
+    'blockparser': (
+        ('html', 'HTML', 'Inspect or rewrite the HTML carried by parsed blocks.'),
+        ('markdown', 'Markdown', 'Move between author-friendly Markdown and serialized block markup.'),
+        ('dataliberation', 'DataLiberation', 'Audit and transform blocks while migrating content.'),
+    ),
+    'markdown': (
+        ('blockparser', 'BlockParser', 'Understand the block tree created from Markdown output.'),
+        ('html', 'HTML', 'Rewrite rendered HTML fragments without using DOMDocument.'),
+        ('dataliberation', 'DataLiberation', 'Turn Markdown folders into import/export streams.'),
+    ),
+    'xml': (
+        ('dataliberation', 'DataLiberation', 'Read and write WXR-sized WordPress exports as entities.'),
+        ('encoding', 'Encoding', 'Validate and scrub text before strict XML processing.'),
+        ('bytestream', 'ByteStream', 'Keep large XML reads incremental.'),
+    ),
+    'encoding': (
+        ('html', 'HTML', 'Normalize incoming text before HTML tokenization.'),
+        ('xml', 'XML', 'Keep invalid bytes out of XML streams.'),
+        ('dataliberation', 'DataLiberation', 'Clean content before importing it into WordPress.'),
+    ),
+    'dataliberation': (
+        ('markdown', 'Markdown', 'Use Markdown as a source or destination format.'),
+        ('blockparser', 'BlockParser', 'Analyze serialized blocks inside post content.'),
+        ('httpclient', 'HttpClient', 'Download media and remote source data while importing.'),
+    ),
+    'git': (
+        ('filesystem', 'Filesystem', 'Work with repository trees through a storage abstraction.'),
+        ('merge', 'Merge', 'Resolve divergent histories with explicit three-way merge logic.'),
+        ('bytestream', 'ByteStream', 'Read and write object data without accidental buffering.'),
+    ),
+    'merge': (
+        ('git', 'Git', 'Merge file contents discovered through repository history.'),
+        ('markdown', 'Markdown', 'Resolve file-based editorial workflows before converting to blocks.'),
+        ('dataliberation', 'DataLiberation', 'Make content synchronization conflicts visible.'),
+    ),
+    'httpclient': (
+        ('bytestream', 'ByteStream', 'Stream request and response bodies.'),
+        ('filesystem', 'Filesystem', 'Persist large downloads without buffering them in memory.'),
+        ('corsproxy', 'CORSProxy', 'Bridge browser-side tools to servers without CORS headers.'),
+    ),
+    'httpserver': (
+        ('cli', 'CLI', 'Expose a local browser UI from a command-line tool.'),
+        ('httpclient', 'HttpClient', 'Test client code against a small local fixture server.'),
+    ),
+    'corsproxy': (
+        ('httpclient', 'HttpClient', 'Fetch upstream responses from PHP when browser CORS blocks direct access.'),
+        ('httpserver', 'HttpServer', 'Understand the local-server shape before deploying a proxy endpoint.'),
+    ),
+    'cli': (
+        ('filesystem', 'Filesystem', 'Keep command behavior testable with in-memory storage.'),
+        ('blueprints', 'Blueprints', 'Build repeatable site setup commands around parsed options.'),
+        ('httpserver', 'HttpServer', 'Add a local web UI to a CLI workflow.'),
+    ),
+    'polyfill': (
+        ('html', 'HTML', 'Run WordPress-shaped escaping and translation helpers beside HTML processors.'),
+        ('blockparser', 'BlockParser', 'Keep standalone block tooling familiar outside WordPress.'),
+    ),
+    'blueprints': (
+        ('filesystem', 'Filesystem', 'Prepare files and fixtures before applying site setup steps.'),
+        ('httpclient', 'HttpClient', 'Download packages or source data as part of provisioning workflows.'),
+        ('cli', 'CLI', 'Wrap repeatable blueprint operations in a small command.'),
+    ),
+    'coding-standards': (
+        ('polyfill', 'Polyfill', 'Share WordPress-style compatibility expectations across standalone packages.'),
+    ),
+}
+
+
+# ===========================================================================
+# HTML
+# ===========================================================================
+COMPONENTS.append(('html', 'HTML',
+    'A pure-PHP HTML5 parser and tag rewriter mirroring WordPress core\'s HTML API. Treat HTML the way browsers do — without <code>libxml2</code>, <code>DOMDocument</code>, or regex hacks — and rewrite attributes in a single linear pass.',
+    'wp-php-toolkit/html',
+    [
+        ('Why this exists',
+            '<p>WordPress runs HTML fragments through filters every time a request renders: post content, block markup, comments, excerpts, widgets, feeds, imported documents. Those fragments can omit <code>&lt;html&gt;</code> and <code>&lt;body&gt;</code>, close tags implicitly, or mix browser-correct markup with author mistakes that <code>DOMDocument</code> and regular expressions do not model well.</p>'
+            '<p>The HTML component gives WordPress-style code the same parsing model WordPress core uses: a browser-compatible tokenizer and tree-aware processor that run in pure PHP. Choose it for exact-byte rewrites, imperfect fragments, and post-content filters where a full DOM would do too much work.</p>'
+            '<p>The component gives you two processors. <code>WP_HTML_Tag_Processor</code> is a forward-only cursor over tags and tokens — useful for attribute rewriting at scale. <code>WP_HTML_Processor</code> layers HTML5 tree construction on top so you can query by ancestry (breadcrumbs), serialize the parsed document, and trust that <code>&lt;p&gt;one&lt;p&gt;two</code> parses as two paragraphs the way a browser sees it.</p>'
+            '<p><strong>Footgun:</strong> mutations are buffered. Nothing changes in the source string until you call <code>get_updated_html()</code>. If you read <code>get_attribute()</code> after a <code>set_attribute()</code> on the same tag, you see the new value — but downstream tooling reading the original string sees stale HTML until you serialize.</p>',
+            None),
+        ('Add loading="lazy" to every image',
+            '<p>The "hello world" of tag rewriting. One linear pass, no DOM, no reserialization cost beyond the bytes you actually changed.</p>'
+            '<p><strong>Try this:</strong> click <em>Run</em>, then change <code>\'lazy\'</code> to <code>\'eager\'</code> on the first image only by guarding it with <code>$tags-&gt;get_attribute( \'src\' ) === \'hero.jpg\'</code>. Run again and notice that <code>get_updated_html()</code> only rewrites the bytes for that one tag.</p>',
+            ('lazy-load-images.php', php('''$html = '<article>
+\t<img src="hero.jpg" alt="Hero">
+\t<p>Intro copy.</p>
+\t<img src="inline.jpg" alt="Inline">
+</article>';
+
+$tags = new WP_HTML_Tag_Processor( $html );
+while ( $tags->next_tag( 'img' ) ) {
+\t// Don't clobber an explicit eager hint the author already set.
+\tif ( null === $tags->get_attribute( 'loading' ) ) {
+\t\t$tags->set_attribute( 'loading', 'lazy' );
+\t}
+\t$tags->set_attribute( 'decoding', 'async' );
+}
+
+echo $tags->get_updated_html();'''))),
+        ('Rewrite relative links to absolute URLs',
+            '<p>Use this before sending post content to an RSS feed, an email template, or a CDN-backed copy of a site. The processor rewrites only the changed bytes, so untouched markup stays byte-identical.</p>',
+            ('absolute-links.php', php('''$html = '<p>See <a href="/about">about</a>, <a href="https://example.com/x">x</a>, '
+\t. 'and <a href="contact.html">contact</a>.</p>';
+
+$base = 'https://my-site.test/';
+
+$tags = new WP_HTML_Tag_Processor( $html );
+while ( $tags->next_tag( 'a' ) ) {
+\t$href = $tags->get_attribute( 'href' );
+\tif ( null === $href || '' === $href ) {
+\t\tcontinue;
+\t}
+\tif ( preg_match( '#^[a-z][a-z0-9+.-]*:#i', $href ) || 0 === strpos( $href, '//' ) || 0 === strpos( $href, '#' ) ) {
+\t\tcontinue;
+\t}
+\t$tags->set_attribute( 'href', rtrim( $base, '/' ) . '/' . ltrim( $href, '/' ) );
+}
+
+echo $tags->get_updated_html();'''))),
+        ('Strip every script and inline event handler',
+            '<p>A common sanitization step: neutralize untrusted HTML before display. Blank a script\'s body with <code>set_modifiable_text()</code> and strip every <code>on*</code> attribute via <code>get_attribute_names_with_prefix()</code>.</p>',
+            ('sanitize-html.php', php('''$untrusted = '<p>Hi <b onclick="steal()">friend</b>!</p>'
+\t. '<script>alert("xss")</script>'
+\t. '<img src=x onerror="boom()">';
+
+$tags = new WP_HTML_Tag_Processor( $untrusted );
+while ( $tags->next_tag() ) {
+\tif ( 'SCRIPT' === $tags->get_tag() && ! $tags->is_tag_closer() ) {
+\t\t$tags->set_modifiable_text( '' );
+\t}
+\t$on_handlers = $tags->get_attribute_names_with_prefix( 'on' );
+\tif ( $on_handlers ) {
+\t\tforeach ( $on_handlers as $name ) {
+\t\t\t$tags->remove_attribute( $name );
+\t\t}
+\t}
+}
+
+echo $tags->get_updated_html();'''))),
+        ('Stamp a CSP nonce on inline scripts and styles',
+            '<p>Content Security Policy in <code>nonce-</code> mode requires every inline <code>&lt;script&gt;</code> and <code>&lt;style&gt;</code> to carry a matching nonce attribute. Tag-by-tag is exactly the right granularity.</p>',
+            ('csp-nonce.php', php('''$nonce = bin2hex( random_bytes( 8 ) );
+
+$html = '<head><style>body{font:16px sans-serif}</style></head>'
+\t. '<body><script>console.log("hi")</script><script src="vendor.js"></script></body>';
+
+$tags = new WP_HTML_Tag_Processor( $html );
+while ( $tags->next_tag() ) {
+\t$tag = $tags->get_tag();
+\tif ( ( 'SCRIPT' === $tag || 'STYLE' === $tag ) && ! $tags->is_tag_closer() ) {
+\t\t$tags->set_attribute( 'nonce', $nonce );
+\t}
+}
+
+echo "nonce: {$nonce}\\n\\n";
+echo $tags->get_updated_html();'''))),
+        ('Build a srcset from a single src',
+            '<p>Generate responsive image markup at render time without touching the editor data model. Read the existing <code>src</code>, derive a <code>srcset</code> with width descriptors, add a <code>sizes</code> hint.</p>',
+            ('srcset-rewrite.php', php('''$html = '<figure><img src="https://cdn.test/uploads/photo.jpg" alt="Sunset"></figure>';
+$widths = array( 480, 768, 1200 );
+
+$tags = new WP_HTML_Tag_Processor( $html );
+while ( $tags->next_tag( 'img' ) ) {
+\t$src = $tags->get_attribute( 'src' );
+\tif ( null === $src || $tags->get_attribute( 'srcset' ) !== null ) {
+\t\tcontinue;
+\t}
+\t$variants = array();
+\tforeach ( $widths as $w ) {
+\t\t$variants[] = $src . '?w=' . $w . ' ' . $w . 'w';
+\t}
+\t$tags->set_attribute( 'srcset', implode( ', ', $variants ) );
+\t$tags->set_attribute( 'sizes', '(max-width: 768px) 100vw, 768px' );
+}
+
+echo $tags->get_updated_html();'''))),
+        ('Decode HTML entities the way the spec demands',
+            '<p>The HTML5 entity table has roughly 2,200 named references and a long list of edge cases. <code>WP_HTML_Decoder</code> implements the algorithm — don\'t roll your own.</p>',
+            ('decode-entities.php', php('''echo "attribute: " . WP_HTML_Decoder::decode_attribute( 'path?a=1&amp;b=2&amp;copy' ) . "\\n";
+echo "text:      " . WP_HTML_Decoder::decode_text_node( 'AT&amp;T &mdash; 100&percnt; &#x1F600;' ) . "\\n";
+
+// Safe URL prefix check that respects encoded colons (a classic XSS vector).
+$is_javascript = WP_HTML_Decoder::attribute_starts_with(
+\t'java&#x09;script:alert(1)',
+\t'javascript:',
+\t'ascii-case-insensitive'
+);
+var_dump( $is_javascript );'''))),
+        ('Find images by ancestry with breadcrumbs',
+            '<p>The full <code>WP_HTML_Processor</code> understands HTML5 tree construction, so you can ask "find every <code>&lt;img&gt;</code> directly inside a <code>&lt;figure&gt;</code>" without writing your own DOM walker.</p>',
+            ('breadcrumbs.php', php('''$html = '<article>'
+\t. '<figure><img src="hero.jpg" alt="Hero"><figcaption>Hero shot</figcaption></figure>'
+\t. '<p>Body copy <img src="emoji.png" alt=""> mid-paragraph.</p>'
+\t. '<figure><img src="diagram.png" alt="Diagram"></figure>'
+\t. '</article>';
+
+$p = WP_HTML_Processor::create_fragment( $html );
+$figure_images = 0;
+while ( $p->next_tag( array( 'breadcrumbs' => array( 'FIGURE', 'IMG' ) ) ) ) {
+\t$p->add_class( 'figure-image' );
+\t$figure_images++;
+}
+
+echo "found {$figure_images} figure images\\n";
+echo $p->get_updated_html();'''))),
+        ('Outline a document by walking tokens with depth',
+            '<p>The full processor exposes <code>get_current_depth()</code> and <code>get_breadcrumbs()</code>. Combine with <code>next_token()</code> to print a structural outline.</p>',
+            ('outline.php', php('''$html = '<section><h1>Title</h1>'
+\t. '<section><h2>Chapter 1</h2><p>Body</p></section>'
+\t. '<section><h2>Chapter 2</h2><p>More body</p></section>'
+\t. '</section>';
+
+$p = WP_HTML_Processor::create_fragment( $html );
+while ( $p->next_token() ) {
+\tif ( '#tag' !== $p->get_token_type() || $p->is_tag_closer() ) {
+\t\tcontinue;
+\t}
+\t$tag = $p->get_tag();
+\tif ( ! preg_match( '/^H[1-6]$/', $tag ) ) {
+\t\tcontinue;
+\t}
+\t$indent = str_repeat( '  ', max( 0, $p->get_current_depth() - 2 ) );
+\t$text = '';
+\twhile ( $p->next_token() ) {
+\t\tif ( '#text' === $p->get_token_type() ) {
+\t\t\t$text .= $p->get_modifiable_text();
+\t\t\tcontinue;
+\t\t}
+\t\tif ( '#tag' === $p->get_token_type() && $tag === $p->get_tag() && $p->is_tag_closer() ) {
+\t\t\tbreak;
+\t\t}
+\t}
+\techo "{$indent}{$tag}  {$text}\\n";
+}'''))),
+        ('Bookmarks: annotate a parent based on its children',
+            '<p>Bookmarks are the one escape from forward-only scanning. Save a position, scan ahead, decide what to do, then <code>seek()</code> back and rewrite the earlier tag.</p>',
+            ('bookmarks.php', php('''$html = '<ul>'
+\t. '<li><input type="checkbox" checked> Buy milk</li>'
+\t. '<li><input type="checkbox"> Walk the dog</li>'
+\t. '<li><input type="checkbox" checked> Read book</li>'
+\t. '</ul>';
+
+$tags = new WP_HTML_Tag_Processor( $html );
+$tags->next_tag( 'ul' );
+$tags->set_bookmark( 'list' );
+
+$total = 0;
+$done = 0;
+while ( $tags->next_tag( 'input' ) ) {
+\t$total++;
+\tif ( null !== $tags->get_attribute( 'checked' ) ) {
+\t\t$done++;
+\t}
+}
+
+$tags->seek( 'list' );
+$tags->set_attribute( 'data-progress', $done . '/' . $total );
+$tags->release_bookmark( 'list' );
+
+echo $tags->get_updated_html();'''))),
+    ]))
+
+# ===========================================================================
+# Zip
+# ===========================================================================
+# Zip component entry appended to COMPONENTS.
+# Tuple layout as used here: (slug, title, HTML summary, package name, sections).
+# Each section is (heading, HTML body, snippet); snippet is None for prose-only
+# sections, otherwise (filename, php(source)).
+# NOTE(review): field meanings are read off the values below — confirm against
+# the code that consumes COMPONENTS.
+# The PHP sources are ordinary (non-raw) Python strings: a leading \t becomes a
+# real tab, and \\n / \\ reach PHP as \n / \ respectively.
+COMPONENTS.append(('zip', 'Zip',
+    'Read and write ZIP archives in pure PHP — no <code>libzip</code>, no <code>ZipArchive</code>. Streams entries one at a time, so you can build EPUBs, .docx files, and multi-gigabyte plugin bundles without buffering the archive in memory.',
+    'wp-php-toolkit/zip',
+    [
+        # Prose-only introduction: the snippet slot is None.
+        ('Why this exists',
+            '<p>Common PHP ZIP workflows rely on the <code>ZipArchive</code> extension or shelling out to <code>zip</code>. Those are awkward in hosts without libzip, WebAssembly builds, and code paths that need to stream archive data through toolkit byte streams.</p>'
+            '<p>The Zip component reads and writes Stored and Deflate archives in pure PHP. The decoder is pull-based, so listing the central directory of a 2 GB ZIP costs roughly the size of the directory itself. The encoder accepts any <code>ByteWriteStream</code> as a sink and writes one entry at a time.</p>',
+            None),
+        # Snippet writes a one-entry stored archive to a temp path, then reads the
+        # entry back through ZipFilesystem.
+        # NOTE(review): tempnam() itself creates a file; the snippet writes to that
+        # name plus '.zip' and removes neither.
+        ('Read a file out of a ZIP',
+            '<p><code>ZipFilesystem</code> implements this toolkit\'s <code>Filesystem</code> interface, so once you wrap the byte reader you can call <code>get_contents()</code>, <code>ls()</code>, and <code>is_dir()</code> just like the other filesystem backends.</p>'
+            '<p><strong>Try this:</strong> after <em>Run</em>, add a second <code>append_file()</code> call before <code>$enc-&gt;close()</code> for a <code>notes.md</code> entry, then call <code>print_r( $zip-&gt;ls( \'/\' ) )</code> at the end. The directory listing reflects the new entry without re-reading the file.</p>',
+            ('teaser-read.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\ByteStream\\ReadStream\\FileReadStream;
+use WordPress\\ByteStream\\WriteStream\\FileWriteStream;
+use WordPress\\Zip\\FileEntry;
+use WordPress\\Zip\\ZipDecoder;
+use WordPress\\Zip\\ZipEncoder;
+use WordPress\\Zip\\ZipFilesystem;
+
+$path = tempnam( sys_get_temp_dir(), 'demo' ) . '.zip';
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+$enc->append_file( new FileEntry( array(
+\t'path'               => 'readme.txt',
+\t'compression_method' => ZipDecoder::COMPRESSION_NONE,
+\t'body_reader'        => new MemoryPipe( 'Hello from inside the zip.' ),
+) ) );
+$enc->close();
+$out->close_writing();
+
+$zip = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+echo $zip->get_contents( 'readme.txt' );'''))),
+        # Snippet appends `mimetype` first with COMPRESSION_NONE, deflates the
+        # other three entries, then prints the mimetype and the archive size.
+        ('Build an EPUB from scratch',
+            '<p>An EPUB follows one strict ZIP rule: write the <code>mimetype</code> entry first and store it without compression. Deflate the rest of the archive normally.</p>'
+            '<p>Gotcha: e-readers reject EPUBs whose <code>mimetype</code> entry has compression. Use <code>COMPRESSION_NONE</code> for that single entry.</p>',
+            ('epub.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\ByteStream\\ReadStream\\FileReadStream;
+use WordPress\\ByteStream\\WriteStream\\FileWriteStream;
+use WordPress\\Zip\\FileEntry;
+use WordPress\\Zip\\ZipDecoder;
+use WordPress\\Zip\\ZipEncoder;
+use WordPress\\Zip\\ZipFilesystem;
+
+$path = tempnam( sys_get_temp_dir(), 'book' ) . '.epub';
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+
+// 1) The mimetype entry MUST be first and stored uncompressed.
+$enc->append_file( new FileEntry( array(
+\t'path'               => 'mimetype',
+\t'compression_method' => ZipDecoder::COMPRESSION_NONE,
+\t'body_reader'        => new MemoryPipe( 'application/epub+zip' ),
+) ) );
+
+$container = '<?xml version="1.0"?>'
+\t. '<container version="1.0" xmlns="urn:oasis:names:tc:opendocument:xmlns:container">'
+\t. '<rootfiles><rootfile full-path="EPUB/package.opf" media-type="application/oebps-package+xml"/></rootfiles>'
+\t. '</container>';
+
+foreach ( array(
+\t'META-INF/container.xml' => $container,
+\t'EPUB/package.opf'       => '<package version="3.0" xmlns="http://www.idpf.org/2007/opf"><metadata/><manifest/><spine/></package>',
+\t'EPUB/chapter1.xhtml'    => '<html xmlns="http://www.w3.org/1999/xhtml"><body><h1>Chapter 1</h1><p>It was a dark and stormy night.</p></body></html>',
+) as $name => $body ) {
+\t$enc->append_file( new FileEntry( array(
+\t\t'path'               => $name,
+\t\t'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+\t\t'body_reader'        => new MemoryPipe( $body ),
+\t) ) );
+}
+$enc->close();
+$out->close_writing();
+
+$zip = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+printf( "mimetype: %s\\n", $zip->get_contents( 'mimetype' ) );
+printf( "size on disk: %d bytes\\n", filesize( $path ) );'''))),
+        # Snippet pulls the entry in chunks of up to 8192 bytes and counts complete
+        # lines; $tail carries the unfinished last line into the next iteration.
+        ('Stream a large entry without buffering it',
+            '<p>Calling <code>get_contents()</code> on a 500 MB CSV inside a ZIP would eat 500 MB of RAM. Use <code>open_read_stream()</code> instead and inflate-as-you-go.</p>'
+            '<p>Gotcha: only one entry stream open at a time. Drain or finish the previous stream before opening the next.</p>',
+            ('stream-large.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\ByteStream\\ReadStream\\FileReadStream;
+use WordPress\\ByteStream\\WriteStream\\FileWriteStream;
+use WordPress\\Zip\\FileEntry;
+use WordPress\\Zip\\ZipDecoder;
+use WordPress\\Zip\\ZipEncoder;
+use WordPress\\Zip\\ZipFilesystem;
+
+$path = tempnam( sys_get_temp_dir(), 'big' ) . '.zip';
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+$enc->append_file( new FileEntry( array(
+\t'path'               => 'data.csv',
+\t'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+\t'body_reader'        => new MemoryPipe( str_repeat( "id,value,timestamp\\n1,foo,2024\\n2,bar,2024\\n", 5000 ) ),
+) ) );
+$enc->close();
+$out->close_writing();
+
+$zip    = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+$stream = $zip->open_read_stream( 'data.csv' );
+
+$rows  = 0;
+$bytes = 0;
+$tail  = '';
+while ( ! $stream->reached_end_of_data() ) {
+\t$n = $stream->pull( 8192 );
+\tif ( 0 === $n ) break;
+\t$chunk  = $tail . $stream->consume( $n );
+\t$lines  = explode( "\\n", $chunk );
+\t$tail   = array_pop( $lines );
+\t$rows  += count( $lines );
+\t$bytes += $n;
+}
+printf( "Inflated %d bytes in 8 KB chunks, parsed %d rows.\\n", $bytes, $rows );'''))),
+        # Snippet builds a three-file source archive, walks it breadth-first with
+        # ls()/is_dir(), and re-encodes every file into a second archive with new
+        # contents substituted for config.json. Each file body is read whole via
+        # get_contents() before being re-appended.
+        ('Repack: modify one file, copy the rest',
+            '<p>Updating one file in a ZIP without rewriting the others is impossible at the format level — the central directory points at byte offsets. The pragmatic answer is repack: stream the source archive into a new one, swapping the file you care about.</p>',
+            ('repack.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\ByteStream\\ReadStream\\FileReadStream;
+use WordPress\\ByteStream\\WriteStream\\FileWriteStream;
+use WordPress\\Zip\\FileEntry;
+use WordPress\\Zip\\ZipDecoder;
+use WordPress\\Zip\\ZipEncoder;
+use WordPress\\Zip\\ZipFilesystem;
+
+$src_path = tempnam( sys_get_temp_dir(), 'orig' ) . '.zip';
+$src_out  = FileWriteStream::from_path( $src_path, 'truncate' );
+$src_enc  = new ZipEncoder( $src_out );
+foreach ( array(
+\t'config.json'   => '{"debug":false,"version":"1.0"}',
+\t'app/index.php' => '<?php echo "hello";',
+\t'app/style.css' => 'body{color:#333}',
+) as $name => $body ) {
+\t$src_enc->append_file( new FileEntry( array(
+\t\t'path'               => $name,
+\t\t'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+\t\t'body_reader'        => new MemoryPipe( $body ),
+\t) ) );
+}
+$src_enc->close();
+$src_out->close_writing();
+
+$source   = ZipFilesystem::create( FileReadStream::from_path( $src_path ) );
+$dst_path = tempnam( sys_get_temp_dir(), 'repacked' ) . '.zip';
+$dst_out  = FileWriteStream::from_path( $dst_path, 'truncate' );
+$dst_enc  = new ZipEncoder( $dst_out );
+
+$dirs = array( '/' );
+while ( $dirs ) {
+\t$dir = array_shift( $dirs );
+\tforeach ( $source->ls( $dir ) as $name ) {
+\t\t$path = rtrim( $dir, '/' ) . '/' . $name;
+\t\tif ( $source->is_dir( $path ) ) {
+\t\t\t$dirs[] = $path;
+\t\t\tcontinue;
+\t\t}
+\t\t$rel  = ltrim( $path, '/' );
+\t\t$body = ( 'config.json' === $rel )
+\t\t\t? '{"debug":true,"version":"1.0.1"}'
+\t\t\t: $source->get_contents( $rel );
+\t\t$dst_enc->append_file( new FileEntry( array(
+\t\t\t'path'               => $rel,
+\t\t\t'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+\t\t\t'body_reader'        => new MemoryPipe( $body ),
+\t\t) ) );
+\t}
+}
+$dst_enc->close();
+$dst_out->close_writing();
+
+$repacked = ZipFilesystem::create( FileReadStream::from_path( $dst_path ) );
+echo "new config.json: " . $repacked->get_contents( 'config.json' ) . "\\n";
+echo "untouched: " . $repacked->get_contents( 'app/index.php' ) . "\\n";'''))),
+        # Snippet prints each sample name next to ZipDecoder::sanitize_path()'s
+        # result; no archive is created.
+        ('Defend against zip-slip',
+            '<p>A malicious archive can name an entry <code>../../etc/passwd</code> and trick a naive extractor into clobbering files outside the destination. <code>ZipDecoder::sanitize_path()</code> strips leading <code>../</code> segments and collapses internal <code>/../</code> sequences before exposing the path.</p>',
+            ('zip-slip.php', php('''use WordPress\\Zip\\ZipDecoder;
+
+$evil_inputs = array(
+\t'../../etc/passwd',
+\t'./safe/path.txt',
+\t'a/../../b/secret',
+\t'a//b///c.txt',
+\t'../../../../root/.ssh/authorized_keys',
+);
+foreach ( $evil_inputs as $name ) {
+\tprintf( "%-45s => %s\\n", $name, ZipDecoder::sanitize_path( $name ) );
+}'''))),
+        # Snippet copies a four-file archive into an InMemoryFilesystem, adds
+        # /app/VERSION, then prints every file path in sorted order.
+        # NOTE(review): the final foreach reuses $path, overwriting the variable
+        # that held the archive's temp path; nothing reads it afterwards.
+        ('Pipe ZIP entries into an InMemoryFilesystem',
+            '<p>Real-world recipe: take an uploaded plugin ZIP, expand it into an <code>InMemoryFilesystem</code> so you can validate, edit, or scan it before it ever touches disk. Three components compose into something you couldn\'t build with <code>ZipArchive</code> alone.</p>',
+            ('zip-to-memfs.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\ByteStream\\ReadStream\\FileReadStream;
+use WordPress\\ByteStream\\WriteStream\\FileWriteStream;
+use WordPress\\Filesystem\\InMemoryFilesystem;
+use WordPress\\Zip\\FileEntry;
+use WordPress\\Zip\\ZipDecoder;
+use WordPress\\Zip\\ZipEncoder;
+use WordPress\\Zip\\ZipFilesystem;
+use function WordPress\\Filesystem\\copy_between_filesystems;
+
+$path = tempnam( sys_get_temp_dir(), 'app' ) . '.zip';
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+foreach ( array(
+\t'app/index.php'        => '<?php echo "ok";',
+\t'app/lib/util.php'     => '<?php // util',
+\t'app/assets/style.css' => 'body{margin:0}',
+\t'app/README.md'        => '# App',
+) as $name => $body ) {
+\t$enc->append_file( new FileEntry( array(
+\t\t'path'               => $name,
+\t\t'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+\t\t'body_reader'        => new MemoryPipe( $body ),
+\t) ) );
+}
+$enc->close();
+$out->close_writing();
+
+$zip = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+$mem = InMemoryFilesystem::create();
+copy_between_filesystems( array(
+\t'source_filesystem' => $zip,
+\t'source_path'       => '/',
+\t'target_filesystem' => $mem,
+\t'target_path'       => '/',
+) );
+
+$mem->put_contents( '/app/VERSION', '1.0.0' );
+echo "files now in memory:\\n";
+$dirs = array( '/' );
+$files = array();
+while ( $dirs ) {
+\t$dir = array_shift( $dirs );
+\tforeach ( $mem->ls( $dir ) as $name ) {
+\t\t$p = rtrim( $dir, '/' ) . '/' . $name;
+\t\tif ( $mem->is_dir( $p ) ) {
+\t\t\t$dirs[] = $p;
+\t\t\tcontinue;
+\t\t}
+\t\t$files[] = $p;
+\t}
+}
+sort( $files );
+foreach ( $files as $path ) {
+\techo "  " . $path . "\\n";
+}'''))),
+    ]))
+
+# ===========================================================================
+# ByteStream
+# ===========================================================================
+# ByteStream component entry appended to COMPONENTS.
+# Tuple layout as used here: (slug, title, HTML summary, package name, sections).
+# Each section is (heading, HTML body, snippet); snippet is None for prose-only
+# sections, otherwise (filename, php(source)).
+# NOTE(review): field meanings are read off the values below — confirm against
+# the code that consumes COMPONENTS.
+# The PHP sources are ordinary (non-raw) Python strings: a leading \t becomes a
+# real tab, and \\n / \\ reach PHP as \n / \ respectively.
+COMPONENTS.append(('bytestream', 'ByteStream',
+    'Composable streaming primitives for reading, writing, transforming, hashing, and compressing byte data. Pull/peek/consume semantics let parsers backtrack without copying, and deflate, inflate, and checksum filters snap together like Lego.',
+    'wp-php-toolkit/bytestream',
+    [
+        # Prose-only introduction: the snippet slot is None.
+        ('Why this exists',
+            '<p>PHP\'s native streams are powerful but inconsistent. <code>fread</code> on a socket may return short reads with no warning; <code>stream_filter_append</code> is awkward to compose; gzip helpers and file handles expose different APIs. The ByteStream component normalizes these behind one small interface — <code>pull / peek / consume</code> — so a parser, a hash function, and a deflate filter all see the same shape.</p>'
+            '<p>The split between <em>pull</em> (buffer up to N bytes) and <em>consume</em> (advance past N bytes) is the secret. Parsers can <code>peek</code> ahead to detect a record boundary and decide whether to <code>consume</code>, without copying or allocating.</p>',
+            None),
+        # Snippet writes 200 lines to a temp file, drains it with pull( 256 ) /
+        # consume(), and prints the byte total.
+        # NOTE(review): the file created by tempnam() is never removed.
+        ('Read a file in chunks',
+            '<p>The canonical loop. <code>pull(N)</code> reads up to <code>N</code> bytes from the underlying source into an internal buffer and returns how many ended up there; <code>consume(N)</code> reads <code>N</code> bytes from that buffer and advances past them. The buffer never grows beyond the chunk size you ask for.</p>',
+            ('teaser-read.php', php('''use WordPress\\ByteStream\\ReadStream\\FileReadStream;
+
+$path = tempnam( sys_get_temp_dir(), 'demo' );
+file_put_contents( $path, str_repeat( "log line\\n", 200 ) );
+
+$reader = FileReadStream::from_path( $path );
+$total = 0;
+while ( ! $reader->reached_end_of_data() ) {
+\t$n = $reader->pull( 256 );
+\tif ( 0 === $n ) break;
+\t$total += strlen( $reader->consume( $n ) );
+}
+$reader->close_reading();
+echo "Read {$total} bytes in 256-byte chunks.\\n";'''))),
+        # Snippet appends three chunks, closes the write side, then drains the pipe
+        # and echoes whatever each pull returned.
+        ('MemoryPipe as write-then-read buffer',
+            '<p><code>MemoryPipe</code> is bidirectional: you <code>append_bytes()</code> as a writer and <code>pull/consume</code> as a reader. Easiest way to wire one component\'s output into another\'s input.</p>'
+            '<p>Gotcha: a producer must call <code>close_writing()</code> when done — otherwise the consumer eventually throws <code>NotEnoughDataException</code> instead of seeing EOF.</p>',
+            ('memory-pipe.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+
+$pipe = new MemoryPipe();
+$pipe->append_bytes( "first chunk\\n" );
+$pipe->append_bytes( "second chunk\\n" );
+$pipe->append_bytes( "third chunk\\n" );
+$pipe->close_writing();
+
+while ( ! $pipe->reached_end_of_data() ) {
+\t$n = $pipe->pull( 1024 );
+\tif ( 0 === $n ) break;
+\techo "got: " . $pipe->consume( $n );
+}'''))),
+        # Snippet deflates a repeated sentence, inflates the compressed bytes, and
+        # compares the result to the original with ===.
+        ('Compress on the way in, decompress on the way out',
+            '<p>Wrap a stream in <code>DeflateReadStream</code> to get compressed bytes out; wrap it in <code>InflateReadStream</code> to get decompressed bytes out. Both are full <code>ByteReadStream</code> implementations, so they nest into anything else that takes a stream.</p>',
+            ('deflate-roundtrip.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\ByteStream\\ReadStream\\DeflateReadStream;
+use WordPress\\ByteStream\\ReadStream\\InflateReadStream;
+
+$original = str_repeat( "the quick brown fox. ", 50 );
+
+$src        = new MemoryPipe( $original );
+$src->close_writing();
+$deflated   = new DeflateReadStream( $src, ZLIB_ENCODING_DEFLATE );
+$compressed = $deflated->consume_all();
+
+$src2     = new MemoryPipe( $compressed );
+$src2->close_writing();
+$inflated = new InflateReadStream( $src2, ZLIB_ENCODING_DEFLATE );
+$round    = $inflated->consume_all();
+
+printf( "original  : %d bytes\\n", strlen( $original ) );
+printf( "deflated  : %d bytes (%.1f%%)\\n", strlen( $compressed ), 100 * strlen( $compressed ) / strlen( $original ) );
+printf( "round-trip: %s\\n", $round === $original ? 'OK' : 'BROKEN' );'''))),
+        # Snippet pulls up to 8 bytes at a time; $tail carries the unfinished line
+        # into the next iteration and is printed after the loop if non-empty.
+        ('Line-by-line reads from a chunked source',
+            '<p>Reading text by line means handling chunk boundaries that fall mid-line. Keep the trailing partial line and prepend it to the next pull. The rest of the loop pretends the data was always whole.</p>',
+            ('lines.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+
+$pipe = new MemoryPipe();
+$pipe->append_bytes( "alpha\\nbravo\\ncharl" );
+$pipe->append_bytes( "ie\\ndelta\\necho\\n" );
+$pipe->close_writing();
+
+$tail = '';
+$count = 0;
+while ( ! $pipe->reached_end_of_data() ) {
+\t$n = $pipe->pull( 8 );
+\tif ( 0 === $n ) break;
+\t$buf   = $tail . $pipe->consume( $n );
+\t$lines = explode( "\\n", $buf );
+\t$tail  = array_pop( $lines );
+\tforeach ( $lines as $line ) {
+\t\tprintf( "[%d] %s\\n", ++$count, $line );
+\t}
+}
+if ( '' !== $tail ) {
+\tprintf( "[%d] %s\\n", ++$count, $tail );
+}'''))),
+        # Snippet consumes the first 10 bytes ("HEADER:42|"), wraps the source in a
+        # 16-byte limited stream ("BODY:hello there" is 16 bytes), then prints
+        # whatever the source still yields.
+        ('Limit a stream to a fixed window',
+            '<p><code>LimitedByteReadStream</code> exposes only the next N bytes of an underlying stream as if those were the entire stream. This is how the ZIP decoder hands you the body of one entry without letting you read into the next.</p>',
+            ('limited.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\ByteStream\\ReadStream\\LimitedByteReadStream;
+
+$source = new MemoryPipe( "HEADER:42|BODY:hello there|FOOTER:done" );
+$source->close_writing();
+
+$source->pull( 10 );
+$source->consume( 10 );
+
+$body = new LimitedByteReadStream( $source, 16 );
+echo "body sees: " . $body->consume_all() . "\\n";
+echo "remaining in source: " . $source->consume_all() . "\\n";'''))),
+    ]))
+
+# ===========================================================================
+# Filesystem
+# ===========================================================================
+# Filesystem component entry appended to COMPONENTS.
+# Tuple layout as used here: (slug, title, HTML summary, package name, sections).
+# Each section is (heading, HTML body, snippet); snippet is None for prose-only
+# sections, otherwise (filename, php(source)).
+# NOTE(review): field meanings are read off the values below — confirm against
+# the code that consumes COMPONENTS.
+# The PHP sources are ordinary (non-raw) Python strings: a leading \t becomes a
+# real tab, and \\n / \\ reach PHP as \n / \ respectively.
+COMPONENTS.append(('filesystem', 'Filesystem',
+    'One <code>Filesystem</code> interface across local disk, in-memory trees, SQLite databases, and ZIP archives. Forward-slash paths everywhere — even on Windows — so the same code runs in tests, in production, and inside read-only ZIPs.',
+    'wp-php-toolkit/filesystem',
+    [
+        # Prose-only introduction: the snippet slot is None.
+        ('Why this exists',
+            '<p>Code that touches the filesystem is hard to test, hard to port to Windows, and impossible to point at non-disk storage without rewriting it. Swap <code>LocalFilesystem</code> for <code>InMemoryFilesystem</code> in tests and your suite stops touching <code>/tmp</code>; swap it for <code>SQLiteFilesystem</code> and your "files" become rows in a portable database; swap it for <code>ZipFilesystem</code> and you can read inside an archive with the same calls.</p>'
+            '<p>Every backend uses forward slashes regardless of host OS. No <code>DIRECTORY_SEPARATOR</code> juggling, no Windows-only test failures, no surprises when a path moves between backends.</p>',
+            None),
+        # Snippet writes one file into an InMemoryFilesystem and echoes it back.
+        ('In-memory tree',
+            '<p>The fastest backend. No disk I/O, no cleanup, no test-isolation problems.</p>',
+            ('teaser-memory.php', php('''use WordPress\\Filesystem\\InMemoryFilesystem;
+
+$fs = InMemoryFilesystem::create();
+$fs->put_contents( '/hello.txt', 'Hello, world!' );
+echo $fs->get_contents( '/hello.txt' );'''))),
+        # Snippet defines bump_version(), which increments the third dot-separated
+        # part of the JSON "version" field, and runs it against an in-memory file.
+        ('Test code without touching disk',
+            '<p>Code that takes a <code>Filesystem</code> parameter, instead of calling <code>file_get_contents()</code> directly, can be tested against an <code>InMemoryFilesystem</code>. The test sets up files in memory, exercises the function, and asserts on what got written — no temp directories, no cleanup.</p>',
+            ('test-without-disk.php', php('''use WordPress\\Filesystem\\Filesystem;
+use WordPress\\Filesystem\\InMemoryFilesystem;
+
+function bump_version( Filesystem $fs, $path ) {
+\t$json = json_decode( $fs->get_contents( $path ), true );
+\tlist( $maj, $min, $patch ) = explode( '.', $json['version'] );
+\t$json['version'] = $maj . '.' . $min . '.' . ( (int) $patch + 1 );
+\t$fs->put_contents( $path, json_encode( $json ) );
+}
+
+$fs = InMemoryFilesystem::create();
+$fs->put_contents( '/package.json', '{"version":"1.2.3"}' );
+bump_version( $fs, '/package.json' );
+
+echo $fs->get_contents( '/package.json' ) . "\\n";'''))),
+        # Snippet writes a note under a unique temp root, reads it back through a
+        # path containing "..", removes the root recursively, and reports whether
+        # the directory still exists.
+        ('Local disk with a chrooted root',
+            '<p><code>LocalFilesystem::create($root)</code> is implicitly chrooted: every path resolves relative to <code>$root</code> and a <code>../</code> cannot escape. Reach for it when a request path or CLI argument names a file inside one project directory.</p>',
+            ('local-chroot.php', php('''use WordPress\\Filesystem\\LocalFilesystem;
+
+$root = sys_get_temp_dir() . '/toolkit-' . uniqid();
+$fs   = LocalFilesystem::create( $root );
+
+$fs->mkdir( '/uploads', array( 'recursive' => true ) );
+$fs->put_contents( '/uploads/note.txt', 'Hi from local disk.' );
+
+echo $fs->get_contents( '/uploads/../uploads/note.txt' ) . "\\n";
+
+$fs->rmdir( '/', array( 'recursive' => true ) );
+echo "exists after cleanup? " . ( is_dir( $root ) ? 'yes' : 'no' ) . "\\n";'''))),
+        # Snippet opens a ':memory:' database, writes three posts, and prints each
+        # file name with the first line of its contents.
+        ('SQLite as a portable file store',
+            '<p>The whole tree lives in one SQLite database file. Use it for self-contained scratch storage that survives process boundaries without leaving loose files behind.</p>',
+            ('sqlite.php', php('''use WordPress\\Filesystem\\SQLiteFilesystem;
+
+$fs = SQLiteFilesystem::create( ':memory:' );
+$fs->mkdir( '/posts', array( 'recursive' => true ) );
+for ( $i = 1; $i <= 3; $i++ ) {
+\t$fs->put_contents( "/posts/post-{$i}.md", "# Post {$i}\\n\\nBody {$i}." );
+}
+
+foreach ( $fs->ls( '/posts' ) as $name ) {
+\t$first = strtok( $fs->get_contents( '/posts/' . $name ), "\\n" );
+\techo "{$name}: {$first}\\n";
+}'''))),
+        # Snippet copies /site from local disk into SQLite (/snapshot), then from
+        # SQLite into memory (/copy), prints the result, and removes the local root.
+        ('Copy a tree across backends',
+            '<p>The killer composability move: <code>copy_between_filesystems()</code> streams files chunk-by-chunk from any source to any target. Pull a ZIP into SQLite, snapshot SQLite to disk, mirror disk into RAM — all the same call.</p>',
+            ('cross-backend-copy.php', php('''use WordPress\\Filesystem\\InMemoryFilesystem;
+use WordPress\\Filesystem\\LocalFilesystem;
+use WordPress\\Filesystem\\SQLiteFilesystem;
+use function WordPress\\Filesystem\\copy_between_filesystems;
+
+$root  = sys_get_temp_dir() . '/copytree-' . uniqid();
+$local = LocalFilesystem::create( $root );
+$local->mkdir( '/site/posts', array( 'recursive' => true ) );
+$local->put_contents( '/site/posts/2024-01.md', '# Hello 2024' );
+$local->put_contents( '/site/index.html', '<h1>Home</h1>' );
+
+$sqlite = SQLiteFilesystem::create( ':memory:' );
+copy_between_filesystems( array(
+\t'source_filesystem' => $local,
+\t'source_path'       => '/site',
+\t'target_filesystem' => $sqlite,
+\t'target_path'       => '/snapshot',
+) );
+
+$mem = InMemoryFilesystem::create();
+copy_between_filesystems( array(
+\t'source_filesystem' => $sqlite,
+\t'source_path'       => '/snapshot',
+\t'target_filesystem' => $mem,
+\t'target_path'       => '/copy',
+) );
+
+echo "in memory after two copies:\\n";
+echo "  posts: " . implode( ', ', $mem->ls( '/copy/posts' ) ) . "\\n";
+echo "  index: " . $mem->get_contents( '/copy/index.html' ) . "\\n";
+
+$local->rmdir( '/', array( 'recursive' => true ) );'''))),
+        # Snippet defines atomic_put_contents(), which writes to
+        # "<path>.tmp.<8 hex chars>" and then renames that file onto <path>; it then
+        # overwrites /config.json and counts the entries left in the root.
+        ('Atomic write via tempfile rename',
+            '<p>Write to a sibling tempfile, then rename — that\'s how you avoid leaving a half-written file on crash. <code>rename()</code> is atomic within a single filesystem.</p>',
+            ('atomic-write.php', php('''use WordPress\\Filesystem\\Filesystem;
+use WordPress\\Filesystem\\LocalFilesystem;
+
+function atomic_put_contents( Filesystem $fs, $path, $bytes ) {
+\t$tmp = $path . '.tmp.' . bin2hex( random_bytes( 4 ) );
+\t$fs->put_contents( $tmp, $bytes );
+\t$fs->rename( $tmp, $path );
+}
+
+$root = sys_get_temp_dir() . '/atomic-' . uniqid();
+$fs   = LocalFilesystem::create( $root );
+
+$fs->put_contents( '/config.json', '{"v":1}' );
+atomic_put_contents( $fs, '/config.json', '{"v":2}' );
+
+echo "config: " . $fs->get_contents( '/config.json' ) . "\\n";
+echo "no .tmp leftovers: " . count( $fs->ls( '/' ) ) . " entries in root\\n";
+
+$fs->rmdir( '/', array( 'recursive' => true ) );'''))),
+        # Snippet prints the results of the three path helpers on fixed inputs; it
+        # touches no filesystem backend.
+        ('Path helpers that behave the same on Windows',
+            '<p>Unix path semantics apply on every host OS. This matters for abstract paths such as a SQLite key or a ZIP entry name because those paths do not live on a real drive.</p>',
+            ('path-helpers.php', php('''use function WordPress\\Filesystem\\wp_join_unix_paths;
+use function WordPress\\Filesystem\\wp_unix_dirname;
+use function WordPress\\Filesystem\\wp_unix_path_resolve_dots;
+
+echo wp_join_unix_paths( '/var/www', '/site/', '/index.php' ) . "\\n";
+echo wp_unix_dirname( '/a/b/c/d.txt', 2 ) . "\\n";
+echo wp_unix_path_resolve_dots( '/a/b/../c/./d/../e' ) . "\\n";'''))),
+    ]))
+
+# ===========================================================================
+# BlockParser
+# ===========================================================================
+COMPONENTS.append(('blockparser', 'BlockParser',
+    'WordPress core\'s block parser, packaged as a standalone library. Turn block markup into a structured tree, lint posts for common authoring mistakes, and audit block usage — all without booting WordPress.',
+    'wp-php-toolkit/blockparser',
+    [
+        ('Why this exists',
+            '<p>Block markup is not plain HTML. A post can contain HTML comments that identify blocks, JSON attributes inside those comments, freeform HTML between blocks, and nested blocks whose rendered HTML is interleaved with parent markup.</p>'
+            '<p>This component packages WordPress core\'s block parser so importers, linters, migration tools, and static analyzers can understand block content without loading WordPress. It deliberately mirrors core behavior — same array shape, same <code>null</code> blocks for freeform HTML, same core block names such as <code>core/paragraph</code> — so code written against this parser keeps working when run inside WordPress, and vice versa.</p>'
+            '<p>Reach for it when you need answers about the block tree: which blocks a post uses, which attributes they carry, where nested blocks appear, or whether content violates a rule your project cares about.</p>',
+            None),
+        ('What you get back',
+            '<p><code>WP_Block_Parser::parse()</code> returns an array of blocks. Each block is an associative array with five keys: <code>blockName</code>, <code>attrs</code>, <code>innerBlocks</code>, <code>innerHTML</code>, and <code>innerContent</code>.</p>'
+            '<p><code>innerHTML</code> is the HTML inside the block <em>with inner blocks stripped out</em>. <code>innerContent</code> is the interleaved version: an array of HTML strings with <code>null</code> placeholders marking where each inner block belongs.</p>'
+            '<p>Most code starts by checking <code>blockName</code>, then reading <code>attrs</code> or <code>innerHTML</code>. When a post has container blocks such as Group, Columns, or Navigation, look inside <code>innerBlocks</code> too.</p>'
+            '<p><strong>Footgun:</strong> freeform HTML between blocks shows up as a block with <code>blockName === null</code>. Always skip that case before comparing names.</p>',
+            None),
+        ('Parse a document',
+            '<p>The simplest possible use. Pass a string, get back a tree.</p>',
+            ('parse.php', php('''$document = "<!-- wp:heading {\\"level\\":2} -->\\n<h2>Welcome</h2>\\n<!-- /wp:heading -->\\n\\n"
+\t. "<!-- wp:paragraph -->\\n<p>Hello from the block editor.</p>\\n<!-- /wp:paragraph -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+foreach ( $blocks as $block ) {
+\tif ( null === $block['blockName'] ) {
+\t\tcontinue;
+\t}
+\techo $block['blockName'] . ': ' . trim( strip_tags( $block['innerHTML'] ) ) . "\\n";
+}'''))),
+        ('Count every block type in a post',
+            '<p>A common audit task: "How many Paragraph, Image, and Gallery blocks does this post use?" A small queue keeps the example readable while still visiting nested blocks.</p>',
+            ('count-blocks.php', php('''$document = "<!-- wp:group --><div class=\\"wp-block-group\\">"
+\t. "<!-- wp:heading --><h2>Title</h2><!-- /wp:heading -->"
+\t. "<!-- wp:paragraph --><p>One.</p><!-- /wp:paragraph -->"
+\t. "<!-- wp:paragraph --><p>Two.</p><!-- /wp:paragraph -->"
+\t. "<!-- wp:image {\\"id\\":1} --><figure><img src=\\"a.jpg\\"/></figure><!-- /wp:image -->"
+\t. "</div><!-- /wp:group -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+
+$counts = array();
+$queue  = $blocks;
+
+while ( ! empty( $queue ) ) {
+\t$block = array_shift( $queue );
+
+\tif ( null !== $block['blockName'] ) {
+\t\t$name             = $block['blockName'];
+\t\t$counts[ $name ] = isset( $counts[ $name ] ) ? $counts[ $name ] + 1 : 1;
+\t}
+
+\tforeach ( $block['innerBlocks'] as $inner_block ) {
+\t\t$queue[] = $inner_block;
+\t}
+}
+
+arsort( $counts );
+foreach ( $counts as $name => $n ) {
+\techo str_pad( (string) $n, 4, ' ', STR_PAD_LEFT ) . '  ' . $name . "\\n";
+}'''))),
+        ('Check whether a post uses a block',
+            '<p>Useful for templates, audits, and migrations: answer one yes/no question without caring where the block appears in the tree.</p>',
+            ('has-block.php', php('''$document = "<!-- wp:group --><div class=\\"wp-block-group\\">"
+\t. "<!-- wp:buttons --><div class=\\"wp-block-buttons\\">"
+\t. "<!-- wp:button --><div class=\\"wp-block-button\\"><a>Buy now</a></div><!-- /wp:button -->"
+\t. "</div><!-- /wp:buttons -->"
+\t. "</div><!-- /wp:group -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+
+function post_has_block( $blocks, $name ) {
+\t$queue = $blocks;
+
+\twhile ( ! empty( $queue ) ) {
+\t\t$block = array_shift( $queue );
+\t\tif ( $name === $block['blockName'] ) {
+\t\t\treturn true;
+\t\t}
+
+\t\tforeach ( $block['innerBlocks'] as $inner_block ) {
+\t\t\t$queue[] = $inner_block;
+\t\t}
+\t}
+
+\treturn false;
+}
+
+echo post_has_block( $blocks, 'core/button' ) ? "has button\\n" : "missing button\\n";
+echo post_has_block( $blocks, 'core/gallery' ) ? "has gallery\\n" : "missing gallery\\n";'''))),
+        ('Lint headings for hierarchy mistakes',
+            '<p>"Don\'t skip from H2 to H4" is a real accessibility rule. The helper below keeps headings in document order, including headings nested inside Group, Column, and Cover blocks.</p>',
+            ('lint-headings.php', php('''$document = "<!-- wp:heading -->\\n<h2>Intro</h2>\\n<!-- /wp:heading -->"
+\t. "<!-- wp:heading {\\"level\\":4} -->\\n<h4>Subsection</h4>\\n<!-- /wp:heading -->"
+\t. "<!-- wp:heading {\\"level\\":3} -->\\n<h3>Body</h3>\\n<!-- /wp:heading -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+
+function collect_headings( $blocks, &$headings ) {
+\tforeach ( $blocks as $block ) {
+\t\tif ( 'core/heading' === $block['blockName'] ) {
+\t\t\t$headings[] = array(
+\t\t\t\t'level' => isset( $block['attrs']['level'] ) ? (int) $block['attrs']['level'] : 2,
+\t\t\t\t'text'  => trim( strip_tags( $block['innerHTML'] ) ),
+\t\t\t);
+\t\t}
+
+\t\tcollect_headings( $block['innerBlocks'], $headings );
+\t}
+}
+
+$headings = array();
+collect_headings( $blocks, $headings );
+
+$last = 1;
+foreach ( $headings as $heading ) {
+\t$level = $heading['level'];
+\t$label = $heading['text'];
+
+\tif ( $level > $last + 1 ) {
+\t\techo "WARN {$label}: jumped from H{$last} to H{$level}\\n";
+\t} else {
+\t\techo "ok   {$label}: H{$level}\\n";
+\t}
+\t$last = $level;
+}'''))),
+        ('Find all instances of a custom block',
+            '<p>When auditing an export for a block your plugin owns, collect every match and print the fields a human cares about.</p>',
+            ('find-custom-block.php', php('''$document = "<!-- wp:paragraph --><p>Reviews</p><!-- /wp:paragraph -->"
+\t. "<!-- wp:my-plugin/testimonial {\\"author\\":\\"Jane\\",\\"rating\\":5} -->"
+\t. "<blockquote>Loved it.</blockquote>"
+\t. "<!-- /wp:my-plugin/testimonial -->"
+\t. "<!-- wp:my-plugin/testimonial {\\"author\\":\\"Joe\\",\\"rating\\":4} -->"
+\t. "<blockquote>Pretty good.</blockquote>"
+\t. "<!-- /wp:my-plugin/testimonial -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+
+function find_blocks_by_name( $blocks, $name, &$matches ) {
+\tforeach ( $blocks as $block ) {
+\t\tif ( $name === $block['blockName'] ) {
+\t\t\t$matches[] = $block;
+\t\t}
+
+\t\tfind_blocks_by_name( $block['innerBlocks'], $name, $matches );
+\t}
+}
+
+$testimonials = array();
+find_blocks_by_name( $blocks, 'my-plugin/testimonial', $testimonials );
+
+foreach ( $testimonials as $i => $b ) {
+\techo ( $i + 1 ) . '. ' . $b['attrs']['author'] . ' (' . $b['attrs']['rating'] . '/5): '
+\t\t. trim( strip_tags( $b['innerHTML'] ) ) . "\\n";
+}'''))),
+        ('Detect blocks with stale embed URLs',
+            '<p>A real-world content audit: find every <code>core/embed</code> whose URL points at a domain you have retired.</p>',
+            ('audit-embeds.php', php('''$document = '<!-- wp:embed {"url":"https://twitter.com/wordpress/status/1","providerNameSlug":"twitter"} /-->'
+\t. '<!-- wp:embed {"url":"https://youtube.com/watch?v=abc","providerNameSlug":"youtube"} /-->'
+\t. '<!-- wp:embed {"url":"https://vine.co/v/xyz","providerNameSlug":"vine"} /-->';
+
+$retired = array( 'vine.co', 'plus.google.com' );
+
+foreach ( ( new WP_Block_Parser() )->parse( $document ) as $b ) {
+\tif ( 'core/embed' !== $b['blockName'] ) {
+\t\tcontinue;
+\t}
+\t$url  = isset( $b['attrs']['url'] ) ? $b['attrs']['url'] : '';
+\t$host = parse_url( $url, PHP_URL_HOST );
+\t$bad  = $host && in_array( $host, $retired, true );
+\techo ( $bad ? 'STALE  ' : 'ok     ' ) . $url . "\\n";
+}'''))),
+    ]))
+
+# ===========================================================================
+# Markdown
+# ===========================================================================
+COMPONENTS.append(('markdown', 'Markdown',
+    'Bidirectional converter between Markdown and WordPress block markup. Useful for moving content between Markdown files and WordPress while preserving the structures both formats can express.',
+    'wp-php-toolkit/markdown',
+    [
+        ('Why this exists',
+            '<p>Many publishing workflows start in Markdown: documentation sites, static-site generators, Git-backed editorial workflows, Obsidian vaults, and developer notes. WordPress stores editor content as block markup. Moving between those worlds by string replacement loses metadata and quickly breaks on lists, tables, code blocks, and frontmatter.</p>'
+            '<p>The Markdown component provides a structured bridge. <code>MarkdownConsumer</code> turns Markdown plus frontmatter into block markup and metadata; <code>MarkdownProducer</code> turns supported block markup back into Markdown. The conversion is meant for practical content workflows, not byte-identical round-tripping of every custom block attribute.</p>',
+            None),
+        ('Markdown to blocks',
+            '<p>Feed Markdown into <code>MarkdownConsumer</code>, get block markup back. The result is a <code>BlocksWithMetadata</code> object that holds both the rendered blocks and any frontmatter parsed from the document.</p>',
+            ('quickstart.php', php('''use WordPress\\Markdown\\MarkdownConsumer;
+
+$result = ( new MarkdownConsumer( "# Hello\\n\\nWelcome to **WordPress**." ) )->consume();
+echo $result->get_block_markup();'''))),
+        ('Round-trip: blocks back to Markdown',
+            '<p>Pair <code>MarkdownProducer</code> with <code>MarkdownConsumer</code> to convert in either direction. Round-tripping is lossy for block attributes that have no Markdown representation (custom classes, alignment), so do not expect byte-perfect equality.</p>',
+            ('roundtrip.php', php('''use WordPress\\Markdown\\MarkdownConsumer;
+use WordPress\\Markdown\\MarkdownProducer;
+
+$md       = "## Round trip\\n\\n- one\\n- two\\n- three\\n";
+$blocks   = ( new MarkdownConsumer( $md ) )->consume();
+$markdown = ( new MarkdownProducer( $blocks ) )->produce();
+
+echo $markdown;'''))),
+        ('Reading YAML frontmatter as post meta',
+            '<p>Frontmatter values come back as arrays so a single key can hold multiple values. Use <code>get_meta_value()</code> when you only want the first scalar.</p>',
+            ('frontmatter.php', php('''use WordPress\\Markdown\\MarkdownConsumer;
+
+$md = <<<MD
+---
+post_title: "The Name of the Wind"
+post_status: publish
+tags: [fantasy, kingkiller]
+---
+
+Once upon a time...
+MD;
+
+$consumer = new MarkdownConsumer( $md );
+$consumer->consume();
+
+echo 'Title: '   . $consumer->get_meta_value( 'post_title' )  . "\\n";
+echo 'Status: '  . $consumer->get_meta_value( 'post_status' ) . "\\n";
+$metadata = $consumer->get_all_metadata();
+echo 'Tags: ' . implode( ', ', $metadata['tags'][0] ) . "\\n";'''))),
+        ('Migrating an Obsidian or Hugo folder of Markdown',
+            '<p>Walk a directory of <code>.md</code> files (Obsidian vault, Hugo <code>content/</code>, Jekyll <code>_posts</code>) and emit one block-markup record per file.</p>',
+            ('migrate-folder.php', php('''use WordPress\\Markdown\\MarkdownConsumer;
+
+@mkdir( '/tmp/vault', 0777, true );
+file_put_contents( '/tmp/vault/welcome.md', "---\\ntitle: Welcome\\n---\\n\\nHello world." );
+file_put_contents( '/tmp/vault/roadmap.md', "# Roadmap\\n\\n1. Ship\\n2. Iterate" );
+
+foreach ( glob( '/tmp/vault/*.md' ) as $path ) {
+\t$consumer = new MarkdownConsumer( file_get_contents( $path ) );
+\t$consumer->consume();
+\t$title = $consumer->get_meta_value( 'title' );
+\tif ( ! $title ) $title = basename( $path, '.md' );
+\techo "=== $title ($path) ===\\n";
+\techo substr( $consumer->get_block_markup(), 0, 120 ) . "...\\n\\n";
+}'''))),
+        ('Counting blocks produced by a Markdown document',
+            '<p>After conversion, the block markup is plain WordPress block markup, so <code>parse_blocks()</code> works on it directly. This is the standard way to inspect what the converter emitted before saving it to the database.</p>',
+            ('count-blocks.php', php('''use WordPress\\Markdown\\MarkdownConsumer;
+
+$md = <<<MD
+# Title
+
+A paragraph with **bold** and *italics*.
+
+| Col A | Col B |
+|-------|-------|
+| 1     | 2     |
+
+```php
+echo 'hi';
+```
+
+> A quote.
+MD;
+
+$blocks = ( new MarkdownConsumer( $md ) )->consume()->get_block_markup();
+$counts = array();
+$queue  = parse_blocks( $blocks );
+
+while ( $queue ) {
+\t$block = array_shift( $queue );
+\tif ( null !== $block['blockName'] ) {
+\t\t$name             = $block['blockName'];
+\t\t$counts[ $name ] = isset( $counts[ $name ] ) ? $counts[ $name ] + 1 : 1;
+\t}
+\tforeach ( $block['innerBlocks'] as $inner_block ) {
+\t\t$queue[] = $inner_block;
+\t}
+}
+foreach ( $counts as $name => $count ) {
+\techo "{$name}: {$count}\\n";
+}'''))),
+    ]))
+
+# ===========================================================================
+# XML
+# ===========================================================================
+COMPONENTS.append(('xml', 'XML',
+    'A streaming, namespace-aware XML processor in pure PHP. Read and modify huge feeds, WXR exports, ePub manifests, and Office Open XML parts without ever loading the document into memory and without depending on <code>libxml2</code>.',
+    'wp-php-toolkit/xml',
+    [
+        ('Why this exists',
+            '<p><code>SimpleXMLElement</code> and <code>DOMDocument</code> both need <code>libxml2</code> and both build a complete in-memory tree. <code>XMLProcessor</code> walks the document forward as a cursor, keeps modifications in a side buffer, and emits the full updated XML with <code>get_updated_xml()</code> only when you ask for it.</p>'
+            '<p>This design came from WordPress-scale documents such as WXR exports. A migration may only need to rewrite <code>wp:attachment_url</code> values or bump a feed attribute, so the processor optimizes for targeted cursor edits instead of a full validating XML stack.</p>'
+            '<p><strong>Footgun #1:</strong> namespace-aware methods use the namespace name declared in <code>xmlns</code>, not the prefix written in the tag. In WXR, <code>get_attribute( \'wp\', \'status\' )</code> looks for a namespace literally named <code>wp</code>; for the usual WXR declaration you want <code>get_attribute( \'http://wordpress.org/export/1.2/\', \'status\' )</code>.</p>'
+            '<p><strong>Footgun #2:</strong> in streaming mode <code>next_tag()</code> can return false because input ran out, not because the document ended. Check <code>is_paused_at_incomplete_input()</code> before assuming you\'re done.</p>',
+            None),
+        ('Bump every price in a catalog',
+            '<p>Find each <code>&lt;book&gt;</code>, read its price, write a new one, emit the updated document.</p>',
+            ('bump-prices.php', php('''use WordPress\\XML\\XMLProcessor;
+
+$xml = '<catalog>'
+\t. '<book sku="A1" price="29.99"><title>PHP Internals</title></book>'
+\t. '<book sku="A2" price="14.50"><title>WordPress at Scale</title></book>'
+\t. '</catalog>';
+
+$p = XMLProcessor::create_from_string( $xml );
+while ( $p->next_tag( 'book' ) ) {
+\t$old = (float) $p->get_attribute( '', 'price' );
+\t$new = number_format( $old * 1.10, 2, '.', '' );
+\t$p->set_attribute( '', 'price', $new );
+}
+
+echo $p->get_updated_xml();'''))),
+        ('Read namespaced attributes from a WXR export',
+            '<p>WordPress\'s WXR commonly uses <code>wp:</code>, <code>dc:</code>, and <code>content:</code> prefixes bound to namespace names such as <code>http://wordpress.org/export/1.2/</code>. Pass that expanded namespace name, not the prefix; the processor handles whichever prefix the document actually uses.</p>',
+            ('wxr-namespaces.php', php('''use WordPress\\XML\\XMLProcessor;
+
+$wxr = '<?xml version="1.0"?>'
+\t. '<rss xmlns:wp="http://wordpress.org/export/1.2/" xmlns:dc="http://purl.org/dc/elements/1.1/">'
+\t. '<channel><item>'
+\t. '<title>Hello World</title>'
+\t. '<dc:creator>admin</dc:creator>'
+\t. '<wp:post_id>42</wp:post_id>'
+\t. '<wp:status>publish</wp:status>'
+\t. '</item></channel></rss>';
+
+$WP = 'http://wordpress.org/export/1.2/';
+$DC = 'http://purl.org/dc/elements/1.1/';
+
+$p = XMLProcessor::create_from_string( $wxr );
+while ( $p->next_tag( 'item' ) ) {
+\twhile ( $p->next_token() ) {
+\t\tif ( $p->is_tag_closer() && 'item' === $p->get_tag_local_name() ) break;
+\t\tif ( ! $p->is_tag_opener() ) continue;
+\t\t$ns = $p->get_tag_namespace();
+\t\t$local = $p->get_tag_local_name();
+\t\t$prefix = ( $WP === $ns ) ? 'wp/' : ( ( $DC === $ns ) ? 'dc/' : '' );
+\t\techo "{$prefix}{$local}: ";
+\t\twhile ( $p->next_token() && '#text' !== $p->get_token_name() ) {}
+\t\techo trim( $p->get_modifiable_text() ) . "\\n";
+\t}
+}'''))),
+        ('Rewrite URLs across an entire WXR export',
+            '<p>Large WXR exports can hold many URLs in <code>&lt;link&gt;</code>, <code>&lt;guid&gt;</code>, and post content. Streaming the file lets you rewrite large exports without loading the whole XML document into memory.</p>',
+            ('rewrite-wxr-urls.php', php('''use WordPress\\XML\\XMLProcessor;
+
+$wxr = '<?xml version="1.0"?><rss xmlns:wp="http://wordpress.org/export/1.2/"><channel>'
+\t. '<wp:base_site_url>https://old.example.com</wp:base_site_url>'
+\t. '<item><link>https://old.example.com/2024/post-1</link>'
+\t. '<guid>https://old.example.com/?p=1</guid></item>'
+\t. '</channel></rss>';
+
+$from = 'https://old.example.com';
+$to   = 'https://new.example.com';
+
+$p = XMLProcessor::create_from_string( $wxr );
+$rewritten = 0;
+
+while ( $p->next_token() ) {
+\tif ( '#text' !== $p->get_token_name() ) continue;
+\t$text = $p->get_modifiable_text();
+\tif ( false === strpos( $text, $from ) ) continue;
+\t$p->set_modifiable_text( str_replace( $from, $to, $text ) );
+\t$rewritten++;
+}
+
+echo "rewrote {$rewritten} text nodes\\n\\n";
+echo $p->get_updated_xml();'''))),
+        ('Parse OPML to extract feed URLs',
+            '<p>OPML is the format Feedly and many readers use to import/export feed lists. Flat, attribute-heavy XML — exactly what a tag processor handles best.</p>',
+            ('opml.php', php('''use WordPress\\XML\\XMLProcessor;
+
+$opml = '<?xml version="1.0"?><opml version="2.0"><head><title>My Feeds</title></head>'
+\t. '<body>'
+\t. '<outline text="Tech"><outline text="Hacker News" type="rss" xmlUrl="https://news.ycombinator.com/rss"/>'
+\t. '<outline text="LWN" type="rss" xmlUrl="https://lwn.net/headlines/rss"/></outline>'
+\t. '<outline text="WordPress" type="rss" xmlUrl="https://wordpress.org/news/feed/"/>'
+\t. '</body></opml>';
+
+$p = XMLProcessor::create_from_string( $opml );
+while ( $p->next_tag( 'outline' ) ) {
+\t$url = $p->get_attribute( '', 'xmlUrl' );
+\tif ( null === $url ) continue;
+\techo $p->get_attribute( '', 'text' ) . "\\t" . $url . "\\n";
+}'''))),
+    ]))
+
+# ===========================================================================
+# Encoding
+# ===========================================================================
+COMPONENTS.append(('encoding', 'Encoding',
+    'UTF-8 validation and scrubbing with a pure-PHP fallback when <code>mbstring</code> is unavailable. Detects malformed bytes and replaces them per the Unicode maximal-subpart algorithm.',
+    'wp-php-toolkit/encoding',
+    [
+        ('Why this exists',
+            '<p>Every parser in this toolkit eventually has to decide what to do with text bytes. XML rejects malformed UTF-8. JSON and databases can fail late. CSS, HTML, WXR, and Blueprint validation all need consistent answers about whether a string is well-formed Unicode.</p>'
+            '<p>The Encoding component provides the small UTF-8 primitives the rest of the toolkit can share: validate bytes, scrub invalid sequences, scan code points, and detect Unicode noncharacters. When <code>mbstring</code> is available it can delegate to it; when it is not, the component uses its own byte scanner so behavior stays available in restricted PHP environments.</p>'
+            '<p>Historically, this became the common foundation for Blueprint validation and CSS/XML processing, replacing ad hoc Unicode helpers with the WordPress core UTF-8 routines used here.</p>',
+            None),
+        ('Validating UTF-8 before storing it',
+            '<p><code>wp_is_valid_utf8()</code> rejects overlong sequences, surrogate halves, and stray ISO-8859-1 bytes. Use it as a guard in front of any code path that assumes UTF-8 (database, JSON, XML).</p>',
+            ('validate.php', php('''use function WordPress\\Encoding\\wp_is_valid_utf8;
+
+$samples = array(
+\t'ASCII'          => 'just a test',
+\t'UTF-8 pencil'   => "\\xE2\\x9C\\x8F",
+\t'latin-1 byte'   => "B\\xFCch",
+\t'overlong slash' => "\\xC1\\xBF",
+\t'surrogate half' => "\\xED\\xB0\\x80",
+);
+
+foreach ( $samples as $label => $bytes ) {
+\techo sprintf( "%-14s %s\\n", $label . ':', wp_is_valid_utf8( $bytes ) ? 'valid' : 'invalid' );
+}'''))),
+        ('Scrubbing invalid bytes with U+FFFD',
+            '<p>Replace each ill-formed sequence with the Unicode replacement character. Useful right before serializing to XML, JSON, or sending to an LLM that will choke on broken bytes.</p>',
+            ('scrub.php', php('''use function WordPress\\Encoding\\wp_scrub_utf8;
+
+$broken = "the byte \\xC0 should not be here.";
+echo wp_scrub_utf8( $broken ) . "\\n";
+
+echo wp_scrub_utf8( ".\\xE2\\x8C\\xE2\\x8C." ) . "\\n";'''))),
+        ('Detecting noncharacters MySQL/utf8mb4 will reject',
+            '<p>Code points like U+FFFE, U+FFFF, and the U+FDD0–U+FDEF range are Unicode noncharacters: they can appear in well-formed UTF-8, but XML 1.0 forbids U+FFFE and U+FFFF, discourages the rest, and some databases reject them. Check before inserting user-submitted content into a strict <code>utf8mb4</code> column.</p>',
+            ('noncharacters.php', php('''use function WordPress\\Encoding\\wp_has_noncharacters;
+
+$samples = array(
+\t'normal text' => 'normal text',
+\t'U+FFFE'      => "oops \\u{FFFE}",
+\t'U+FDD0'      => "hi \\u{FDD0} bye",
+);
+
+foreach ( $samples as $label => $text ) {
+\techo sprintf( "%-12s %s\\n", $label . ':', wp_has_noncharacters( $text ) ? 'reject' : 'ok' );
+}'''))),
+        ('Three-way pipeline: validate, scrub, then check noncharacters',
+            '<p>Real-world inputs are messy: an old WXR export, a CSV with mixed encodings, a paste from Word. Combining validation, scrubbing, and a noncharacter check covers the three classes of breakage that bite later.</p>',
+            ('pipeline.php', php('''use function WordPress\\Encoding\\wp_is_valid_utf8;
+use function WordPress\\Encoding\\wp_scrub_utf8;
+use function WordPress\\Encoding\\wp_has_noncharacters;
+
+$inputs = array(
+\t'good'      => 'Café',
+\t'latin1'    => "caf\\xE9",
+\t'overlong'  => "x\\xC1\\xBFy",
+\t'noncharac' => "hi \\u{FFFE} there",
+);
+
+foreach ( $inputs as $label => $bytes ) {
+\t$valid    = wp_is_valid_utf8( $bytes );
+\t$cleaned  = wp_scrub_utf8( $bytes );
+\t$weird    = wp_has_noncharacters( $cleaned );
+\techo sprintf( "%-10s valid=%s noncharacter=%s -> %s\\n", $label, $valid ? 'Y' : 'N', $weird ? 'Y' : 'N', $cleaned );
+}'''))),
+        ('Salvaging a legacy ISO-8859-1 column inside a UTF-8 corpus',
+            '<p>Old WordPress databases sometimes mix encodings: most rows are UTF-8 but a few were stored as latin-1. Detect the bad rows with <code>wp_is_valid_utf8()</code> and only re-encode those.</p>',
+            ('mixed-encoding.php', php('''use function WordPress\\Encoding\\wp_is_valid_utf8;
+use function WordPress\\Encoding\\wp_scrub_utf8;
+
+$rows = array(
+\t1 => 'Plain ASCII',
+\t2 => 'Café',
+\t3 => "caf\\xE9",
+\t4 => "weird \\xC0 byte",
+);
+
+foreach ( $rows as $id => $value ) {
+\tif ( wp_is_valid_utf8( $value ) ) {
+\t\techo "#$id ok: $value\\n";
+\t\tcontinue;
+\t}
+\t$converted = @iconv( 'ISO-8859-1', 'UTF-8', $value );
+\tif ( false !== $converted && wp_is_valid_utf8( $converted ) ) {
+\t\techo "#$id recovered as latin1: $converted\\n";
+\t} else {
+\t\techo "#$id unrecoverable, scrubbing: " . wp_scrub_utf8( $value ) . "\\n";
+\t}
+}'''))),
+    ]))
+
+# ===========================================================================
+# DataLiberation
+# ===========================================================================
+COMPONENTS.append(('dataliberation', 'DataLiberation',
+    'Streaming WordPress import/export. WXR, SQL, block markup — without loading whole datasets into memory.',
+    'wp-php-toolkit/data-liberation',
+    [
+        ('Why this exists',
+            '<p>WordPress content should be portable, but real migrations cross several formats. A site export might arrive as WXR, a Markdown folder, or entities from another CMS. URLs can hide in block attributes, HTML, CSS, feeds, GUIDs, and post meta. Importers must also resume after a failed media download or upload.</p>'
+            '<p>The DataLiberation component streams WordPress-shaped data through readers, transformers, and writers. It models posts, terms, comments, attachments, and metadata as <code>ImportEntity</code> objects, then lets a pipeline rewrite each entity without loading the full export into memory.</p>'
+            '<p>The API reflects specific migration bugs: relative URLs in known block attributes, URLs inside inline CSS, self-closing block comments that must keep their shape, and origin-only URLs whose trailing slash style should not change during a rewrite.</p>'
+            '<p>Reach for it when the job combines formats: build WXR from another CMS, rewrite a staging export for production, frontload remote assets, or compose Markdown, XML, HTML, CSS, and URL rewriting into one pipeline.</p>',
+            None),
+        ('Write a WXR file in five lines',
+            '<p>Stream a single post into a WXR document via <code>WXRWriter</code>. The writer holds no buffer beyond what is needed to close currently-open tags, so memory stays flat regardless of input size.</p>',
+            ('wxr-quickstart.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\DataLiberation\\EntityWriter\\WXRWriter;
+use WordPress\\DataLiberation\\ImportEntity;
+
+$pipe   = new MemoryPipe();
+$writer = new WXRWriter( $pipe );
+$writer->append_entity( new ImportEntity( 'post', array(
+\t'post_title' => 'Hello',
+\t'content'    => 'World.',
+\t'post_id'    => '1',
+\t'status'     => 'publish',
+) ) );
+$writer->finalize();
+$writer->close_writing();
+$pipe->close_writing();
+$wxr = $pipe->consume_all();
+
+echo "bytes: " . strlen( $wxr ) . "\\n";
+echo false !== strpos( $wxr, '<title>Hello</title>' ) ? "title exported\\n" : "title missing\\n";
+echo false !== strpos( $wxr, '<wp:status>publish</wp:status>' ) ? "status exported\\n" : "status missing\\n";'''))),
+        ('Build a WXR programmatically from any source',
+            '<p>The writer doesn\'t care where entities come from. Loop over rows from a CMS, a CSV, or a Notion API dump and emit posts plus their meta and comments.</p>',
+            ('build-wxr.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\DataLiberation\\EntityWriter\\WXRWriter;
+use WordPress\\DataLiberation\\ImportEntity;
+
+$rows = array(
+\tarray( 'id' => 10, 'title' => 'About', 'body' => '<p>About us.</p>', 'tags' => array( 'company' ) ),
+\tarray( 'id' => 11, 'title' => 'Blog',  'body' => '<p>Hello world.</p>', 'tags' => array( 'news', 'launch' ) ),
+);
+
+$pipe   = new MemoryPipe();
+$writer = new WXRWriter( $pipe );
+
+foreach ( $rows as $row ) {
+\t$writer->append_entity( new ImportEntity( 'post', array(
+\t\t'post_id'    => (string) $row['id'],
+\t\t'post_title' => $row['title'],
+\t\t'content'    => $row['body'],
+\t\t'status'     => 'publish',
+\t\t'post_type'  => 'post',
+\t) ) );
+\tforeach ( $row['tags'] as $i => $tag ) {
+\t\t$writer->append_entity( new ImportEntity( 'term', array(
+\t\t\t'term_id'  => (string) ( $row['id'] * 100 + $i ),
+\t\t\t'taxonomy' => 'post_tag',
+\t\t\t'slug'     => $tag,
+\t\t\t'parent'   => '0',
+\t\t) ) );
+\t}
+}
+
+$writer->finalize();
+$writer->close_writing();
+$pipe->close_writing();
+
+$wxr = $pipe->consume_all();
+echo "items: " . substr_count( $wxr, '<item>' ) . "\\n";
+echo "terms: " . substr_count( $wxr, '<wp:term>' ) . "\\n";
+echo false !== strpos( $wxr, '<title>Blog</title>' ) ? "Blog post exported\\n" : "Blog post missing\\n";'''))),
+        ('Read entities from a WXR file with constant memory',
+            '<p><code>WXREntityReader</code> emits one entity at a time. A 10 GB WXR uses the same memory as a 10 KB one.</p>',
+            ('wxr-read.php', php('''use WordPress\\DataLiberation\\EntityReader\\WXREntityReader;
+
+$wxr = <<<XML
+<?xml version="1.0" encoding="UTF-8" ?>
+<rss version="2.0" xmlns:wp="http://wordpress.org/export/1.2/" xmlns:content="http://purl.org/rss/1.0/modules/content/">
+<channel>
+<title>Demo</title>
+<item><title>First</title><wp:post_id>1</wp:post_id><wp:post_type>post</wp:post_type><content:encoded>Body 1</content:encoded></item>
+<item><title>Second</title><wp:post_id>2</wp:post_id><wp:post_type>post</wp:post_type><content:encoded>Body 2</content:encoded></item>
+</channel>
+</rss>
+XML;
+
+$reader = WXREntityReader::create();
+$reader->append_bytes( $wxr );
+$reader->input_finished();
+
+while ( $reader->next_entity() ) {
+\t$entity = $reader->get_entity();
+\techo $entity->get_type() . ': ' . json_encode( $entity->get_data() ) . "\\n";
+}'''))),
+        ('Streaming transform: rewrite URLs while copying WXR',
+            '<p>Wire reader to writer to rewrite a WXR file on the fly. This pattern is how you migrate a staging export to production: swap <code>staging.example.com</code> for <code>example.com</code> without ever loading the file into memory.</p>',
+            ('rewrite-urls.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\DataLiberation\\EntityReader\\WXREntityReader;
+use WordPress\\DataLiberation\\EntityWriter\\WXRWriter;
+use WordPress\\DataLiberation\\ImportEntity;
+
+$source_xml = <<<XML
+<?xml version="1.0" encoding="UTF-8" ?>
+<rss version="2.0" xmlns:wp="http://wordpress.org/export/1.2/" xmlns:content="http://purl.org/rss/1.0/modules/content/">
+<channel>
+<item><title>Hello</title><wp:post_id>1</wp:post_id><wp:post_type>post</wp:post_type>
+<content:encoded>Visit https://staging.example.com/about for more.</content:encoded></item>
+</channel>
+</rss>
+XML;
+
+$reader = WXREntityReader::create();
+$reader->append_bytes( $source_xml );
+$reader->input_finished();
+
+$out_pipe = new MemoryPipe();
+$writer   = new WXRWriter( $out_pipe );
+
+while ( $reader->next_entity() ) {
+\t$entity = $reader->get_entity();
+\t$data   = $entity->get_data();
+\tforeach ( array( 'post_content', 'content', 'description' ) as $field ) {
+\t\tif ( isset( $data[ $field ] ) ) {
+\t\t\t$data[ $field ] = str_replace( 'staging.example.com', 'example.com', $data[ $field ] );
+\t\t}
+\t}
+\tif ( 'post' === $entity->get_type() ) {
+\t\t$data['content'] = isset( $data['post_content'] ) ? $data['post_content'] : ( isset( $data['content'] ) ? $data['content'] : '' );
+\t}
+\t$writer->append_entity( new ImportEntity( $entity->get_type(), $data ) );
+}
+
+$writer->finalize();
+$writer->close_writing();
+$out_pipe->close_writing();
+
+$wxr = $out_pipe->consume_all();
+echo false !== strpos( $wxr, 'https://example.com/about' ) ? "new URL present\\n" : "new URL missing\\n";
+echo false === strpos( $wxr, 'staging.example.com' ) ? "old URL removed\\n" : "old URL still present\\n";'''))),
+        ('Render Markdown into a WXR import in one pipeline',
+            '<p>Compose <code>MarkdownConsumer</code> with <code>WXRWriter</code> to publish a folder of Markdown directly as a WordPress import file.</p>',
+            ('md-to-wxr.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\DataLiberation\\EntityWriter\\WXRWriter;
+use WordPress\\DataLiberation\\ImportEntity;
+use WordPress\\Markdown\\MarkdownConsumer;
+
+@mkdir( '/tmp/md-src', 0777, true );
+file_put_contents( '/tmp/md-src/hello.md',  "---\\ntitle: Hello\\n---\\n\\n# Hello\\n\\nFirst post." );
+file_put_contents( '/tmp/md-src/second.md', "---\\ntitle: Second\\n---\\n\\nMore text **here**." );
+
+$pipe   = new MemoryPipe();
+$writer = new WXRWriter( $pipe );
+
+$id = 1;
+foreach ( glob( '/tmp/md-src/*.md' ) as $path ) {
+\t$consumer = new MarkdownConsumer( file_get_contents( $path ) );
+\t$consumer->consume();
+\t$writer->append_entity( new ImportEntity( 'post', array(
+\t\t'post_id'    => (string) $id++,
+\t\t'post_title' => $consumer->get_meta_value( 'title' ) ?: basename( $path, '.md' ),
+\t\t'content'    => $consumer->get_block_markup(),
+\t\t'status'     => 'publish',
+\t\t'post_type'  => 'post',
+\t\t'post_name'  => basename( $path, '.md' ),
+\t) ) );
+}
+
+$writer->finalize();
+$writer->close_writing();
+$pipe->close_writing();
+
+$wxr = $pipe->consume_all();
+echo "posts: " . substr_count( $wxr, '<item>' ) . "\\n";
+echo false !== strpos( $wxr, '&lt;!-- wp:heading' ) ? "block markup exported\\n" : "block markup missing\\n";
+echo false !== strpos( $wxr, '<title>Second</title>' ) ? "frontmatter title exported\\n" : "frontmatter title missing\\n";'''))),
+    ]))
+
+# ===========================================================================
+# Git
+# ===========================================================================
+COMPONENTS.append(('git', 'Git',  # Registers the Git docs entry: key, display name, summary HTML, package string, section list (field meanings inferred from the values — confirm against the code that consumes COMPONENTS).
+    'A pure-PHP Git client and server. Commits, branches, diffs, HTTP push/pull — all without shelling out to <code>git</code>.',
+    'wp-php-toolkit/git',  # NOTE(review): presumably the Composer package name — confirm.
+    [  # Each section is (heading, body HTML, snippet); snippet is None or (filename, php(<PHP source>)). The PHP sources are non-raw Python strings: a doubled backslash reaches PHP as a single one, and \t becomes a real tab.
+        ('Why this exists',
+            '<p>Git is a useful storage model even when a server cannot run the <code>git</code> binary: snapshots, branches, object-addressed files, diffs, merges, and sync over HTTP. That matters for WordPress tools that want revision history for generated files, content snapshots, site state, or collaborative edits in constrained runtimes.</p>'
+            '<p>The Git component implements the core repository operations in PHP and stores objects through the toolkit <code>Filesystem</code> interface. That means the same repository can live on disk, in memory, or in another backend, and higher-level code can commit files without knowing where objects are stored.</p>'
+            '<p>The docs start with simple commits because that mental model scales: a repository is just objects plus refs. From there, branches, history walking, root commits, and merges become details you can reason about instead of magic shell behavior.</p>'
+            '<p>Choose it for tests, browser-like sandboxes, hosted WordPress environments, and applications that need Git behavior through PHP APIs instead of shell commands.</p>',
+            None),  # None in the snippet slot: this section is prose only.
+        ('Commit files into an in-memory repo',
+            '<p>The simplest possible repository: an <code>InMemoryFilesystem</code> as object storage and one <code>commit()</code> call. Reach for this in tests, in WP-CLI snapshots, or any place you want versioning without touching disk.</p>',
+            ('commit-in-memory.php', php('''use WordPress\\Filesystem\\InMemoryFilesystem;
+use WordPress\\Git\\GitRepository;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+
+$oid = $repo->commit( array(
+\t'updates' => array(
+\t\t'README.md'           => "# My Project\\n",
+\t\t'src/hello-world.php' => '<?php echo "Hello!";',
+\t),
+) );
+
+echo "commit: {$oid}\\n";
+echo "HEAD:   " . $repo->get_branch_tip( 'HEAD' ) . "\\n";
+echo "README: " . $repo->read_object_by_path( '/README.md' )->consume_all();'''))),
+        ('Walk the commit history',
+            '<p>Follow the parent chain from <code>HEAD</code> backwards. Building block for a WP-CLI "post revisions" log or a "what changed since release X" report.</p>',
+            ('walk-history.php', php('''use WordPress\\Filesystem\\InMemoryFilesystem;
+use WordPress\\Git\\GitRepository;
+use WordPress\\Git\\Model\\Commit;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+foreach ( array( 'add intro', 'fix typo', 'expand examples' ) as $i => $msg ) {
+\t$repo->commit( array(
+\t\t'updates' => array( 'post.md' => "# Draft {$i}" ),
+\t\t'commit'  => array( 'message' => $msg ),
+\t) );
+}
+
+$oid = $repo->get_branch_tip( 'HEAD' );
+while ( ! Commit::is_null_hash( $oid ) ) {
+\t$c = $repo->read_object( $oid )->as_commit();
+\techo substr( $c->hash, 0, 7 ) . '  ' . trim( $c->message ) . "\\n";
+\t$oid = $c->get_first_parent_hash();
+\tif ( ! $oid || ! $repo->has_object( $oid ) ) break;
+}'''))),
+        ('Treat a repository like a filesystem',
+            '<p><code>GitFilesystem</code> wraps a repository in this toolkit\'s <code>Filesystem</code> interface. With the default options, each <code>put_contents()</code> records a new commit.</p>',
+            ('git-filesystem.php', php('''use WordPress\\Filesystem\\InMemoryFilesystem;
+use WordPress\\Git\\GitFilesystem;
+use WordPress\\Git\\GitRepository;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+$fs   = GitFilesystem::create( $repo );
+
+$fs->put_contents( '/posts/hello.md', "# Hello\\nFirst draft." );
+$fs->put_contents( '/posts/about.md', "# About\\nWho we are." );
+$fs->put_contents( '/posts/hello.md', "# Hello\\nSecond draft." );
+
+echo "tree:\\n";
+foreach ( $fs->ls( '/posts' ) as $name ) {
+\techo "  /posts/{$name}\\n";
+}
+echo "\\nhello.md now:\\n" . $fs->get_contents( '/posts/hello.md' ) . "\\n";'''))),
+        ('Branch, edit, and switch back',
+            '<p>Create a feature branch off the current commit, change files, flip <code>HEAD</code> back. Useful for experimental edits in collaborative tools.</p>',
+            ('branches.php', php('''use WordPress\\Filesystem\\InMemoryFilesystem;
+use WordPress\\Git\\GitRepository;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+$base = $repo->commit( array(
+\t'updates' => array( 'config.json' => '{"flag":false}' ),
+\t'commit'  => array( 'message' => 'baseline' ),
+) );
+
+$repo->create_branch( 'refs/heads/experiment', $base );
+$repo->checkout( 'refs/heads/experiment' );
+$repo->commit( array(
+\t'updates' => array( 'config.json' => '{"flag":true}' ),
+\t'commit'  => array( 'message' => 'flip the flag' ),
+) );
+
+echo "on experiment: " . $repo->read_object_by_path( '/config.json' )->consume_all() . "\\n";
+
+$repo->checkout( 'refs/heads/trunk' );
+echo "on trunk:      " . $repo->read_object_by_path( '/config.json' )->consume_all() . "\\n";'''))),
+        ('Three-way merge two branches',
+            '<p>The classic Git workflow: branch off, edit on each side, merge. <code>$repo-&gt;merge()</code> finds the common ancestor, three-way-merges every file, and creates a merge commit.</p>',
+            ('merge-branches.php', php('''use WordPress\\Filesystem\\InMemoryFilesystem;
+use WordPress\\Git\\GitRepository;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+$base = $repo->commit( array( 'updates' => array(
+\t'todo.txt' => "buy milk\\nwalk dog\\nread book\\n",
+) ) );
+
+$repo->commit( array( 'updates' => array(
+\t'todo.txt' => "buy oat milk\\nwalk dog\\nread book\\n",
+) ) );
+
+$repo->create_branch( 'refs/heads/feature', $base );
+$repo->checkout( 'refs/heads/feature' );
+$repo->commit( array( 'updates' => array(
+\t'todo.txt' => "buy milk\\nwalk dog\\nread book\\nwrite blog post\\n",
+) ) );
+
+$repo->checkout( 'refs/heads/trunk' );
+$result = $repo->merge( 'refs/heads/feature' );
+
+echo "merge head: {$result['new_head']}\\n";
+echo "conflicts:  " . ( $result['conflicts'] ? implode( ',', $result['conflicts'] ) : 'none' ) . "\\n";
+echo "result:\\n" . $repo->read_object_by_path( '/todo.txt' )->consume_all();'''))),
+        ('Snapshot WordPress options into a repo',
+            '<p>Serialize a chunk of WP state (options, post meta, a theme config) on every save and commit it. You get free history, diffs between snapshots, and a "rollback to last week" button.</p>',
+            ('options-snapshot.php', php('''use WordPress\\Filesystem\\InMemoryFilesystem;
+use WordPress\\Git\\GitRepository;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+
+$snapshots = array(
+\tarray( 'blogname' => 'My Site',  'posts_per_page' => 10, 'timezone_string' => 'UTC' ),
+\tarray( 'blogname' => 'My Site',  'posts_per_page' => 20, 'timezone_string' => 'UTC' ),
+\tarray( 'blogname' => 'New Name', 'posts_per_page' => 20, 'timezone_string' => 'Europe/Warsaw' ),
+);
+
+foreach ( $snapshots as $i => $options ) {
+\t$repo->commit( array(
+\t\t'updates' => array( 'options.json' => json_encode( $options, JSON_PRETTY_PRINT ) ),
+\t\t'commit'  => array( 'message' => "snapshot #{$i}" ),
+\t) );
+}
+
+$head    = $repo->get_branch_tip( 'HEAD' );
+$parent  = $repo->read_object( $head )->as_commit()->get_first_parent_hash();
+$diff    = $repo->diff_commits( $head, $parent );
+
+echo "Files changed in last snapshot:\\n";
+foreach ( $diff as $name => $entry ) {
+\techo "  {$name}\\n";
+}'''))),
+    ]))
+
+# ===========================================================================
+# Merge
+# ===========================================================================
+COMPONENTS.append(('merge', 'Merge',  # Registers the Merge docs entry: key, display name, summary HTML, package string, section list (field meanings inferred from the values — confirm against the code that consumes COMPONENTS).
+    'Three-way merge and diff. Pluggable differ + merger + optional validator.',
+    'wp-php-toolkit/merge',  # NOTE(review): presumably the Composer package name — confirm.
+    [  # Each section is (heading, body HTML, snippet); snippet is None or (filename, php(<PHP source>)). The PHP sources are non-raw Python strings: a doubled backslash reaches PHP as a single one, and \t becomes a real tab.
+        ('Why this exists',
+            '<p>Content synchronization needs more than "last write wins." A Markdown file changes in Git while the same post changes in WordPress. A generated config changes through both a CLI tool and a UI. In those cases you need a common ancestor, two edited versions, and a way to explain conflicts to a human.</p>'
+            '<p>The Merge component provides the diff and three-way merge primitives used by those workflows. The default examples are line-oriented because that is the most familiar shape, but the strategy is intentionally pluggable: choose the differ, choose the merger, and optionally validate the merged result before accepting it.</p>'
+            '<p>Use the merge result to auto-accept independent edits and to show structured conflicts when a person must decide.</p>',
+            None),  # None in the snippet slot: this section is prose only.
+        ('Diff two strings line by line',
+            '<p>Feed two strings to <code>LineDiffer</code> and inspect the operations. Every <code>get_changes()</code> entry is a <code>[op, text]</code> pair.</p>',
+            ('line-diff.php', php('''use WordPress\\Merge\\Diff\\Diff;
+use WordPress\\Merge\\Diff\\LineDiffer;
+
+$diff = ( new LineDiffer() )->diff(
+\t"alpha\\nbeta\\ngamma\\n",
+\t"alpha\\nBETA\\ngamma\\ndelta\\n"
+);
+
+$labels = array( Diff::DIFF_EQUAL => '=', Diff::DIFF_DELETE => '-', Diff::DIFF_INSERT => '+' );
+foreach ( $diff->get_changes() as $change ) {
+\techo $labels[ $change[0] ] . ' ' . rtrim( $change[1] ) . "\\n";
+}'''))),
+        ('Render a unified patch',
+            '<p><code>format_as_git_patch()</code> produces output that mirrors <code>git diff</code>, including hunk headers — handy for emails, CI annotations, or a "what changed?" panel.</p>',
+            ('git-patch.php', php('''use WordPress\\Merge\\Diff\\LineDiffer;
+
+$old = "title: Hello\\nauthor: Alice\\nstatus: draft\\n";
+$new = "title: Hello, world\\nauthor: Alice\\nstatus: published\\ntags: greeting\\n";
+
+$diff = ( new LineDiffer() )->diff( $old, $new );
+echo $diff->format_as_git_patch( array(
+\t'a_source' => 'a/post.yml',
+\t'b_source' => 'b/post.yml',
+) );'''))),
+        ('Three-way merge with no conflicts',
+            '<p>The classic case: each branch changes a different region. Pass the common ancestor plus both edits to <code>MergeStrategy::merge()</code> and read the merged result.</p>',
+            ('three-way.php', php('''use WordPress\\Merge\\Diff\\LineDiffer;
+use WordPress\\Merge\\Merge\\LineMerger;
+use WordPress\\Merge\\MergeStrategy;
+
+$strategy = new MergeStrategy( new LineDiffer(), new LineMerger() );
+
+$result = $strategy->merge(
+\t"intro\\nbody\\noutro\\n",
+\t"intro updated\\nbody\\noutro\\n",
+\t"intro\\nbody\\noutro\\nappendix\\n"
+);
+
+echo $result->has_conflicts() ? "conflicts!\\n" : "clean merge:\\n";
+echo $result->get_merged_content();'''))),
+        ('Inspect and surface conflicts',
+            '<p>When both sides edit the same region, the merger produces a <code>MergeConflict</code>. The merged content carries Git-style markers, but the structured <code>get_conflicts()</code> output is what you want for a UI that lets the user pick a side.</p>',
+            ('conflicts.php', php('''use WordPress\\Merge\\Diff\\LineDiffer;
+use WordPress\\Merge\\Merge\\LineMerger;
+use WordPress\\Merge\\MergeStrategy;
+
+$strategy = new MergeStrategy( new LineDiffer(), new LineMerger() );
+$result = $strategy->merge(
+\t"line 1\\nline 2\\n",
+\t"line 1\\nline 2 from Alice\\n",
+\t"line 1\\nline 2 from Bob\\n"
+);
+
+if ( $result->has_conflicts() ) {
+\tforeach ( $result->get_conflicts() as $c ) {
+\t\techo "ours:   " . trim( $c->ours ) . "\\n";
+\t\techo "theirs: " . trim( $c->theirs ) . "\\n";
+\t}
+}
+echo "\\n--- merged content with markers ---\\n";
+echo $result->get_merged_content();'''))),
+        ('Sync a Markdown folder against an edited DB copy',
+            '<p>A real-world scenario: posts live both in a Git-tracked Markdown folder and in WordPress, and someone edits each. Three-way-merge each post against its common ancestor.</p>',
+            ('sync-folder-vs-db.php', php('''use WordPress\\Merge\\Diff\\LineDiffer;
+use WordPress\\Merge\\Merge\\LineMerger;
+use WordPress\\Merge\\MergeStrategy;
+
+$strategy = new MergeStrategy( new LineDiffer(), new LineMerger() );
+
+$posts = array(
+\t'hello.md' => array(
+\t\t'base' => "# Hello\\nDraft body.\\n",
+\t\t'disk' => "# Hello\\nDraft body, expanded on disk.\\n",
+\t\t'db'   => "# Hello\\nDraft body.\\nNew section from the editor.\\n",
+\t),
+\t'about.md' => array(
+\t\t'base' => "# About\\nWho we are.\\n",
+\t\t'disk' => "# About\\nWho *they* are.\\n",
+\t\t'db'   => "# About\\nWho we really are.\\n",
+\t),
+);
+
+foreach ( $posts as $name => $sides ) {
+\t$result = $strategy->merge( $sides['base'], $sides['disk'], $sides['db'] );
+\techo "=== {$name} ===\\n";
+\techo $result->has_conflicts() ? "(conflict — needs review)\\n" : "(auto-merged)\\n";
+\techo $result->get_merged_content() . "\\n";
+}'''))),
+    ]))
+
+# ===========================================================================
+# HttpClient
+# ===========================================================================
+COMPONENTS.append(('httpclient', 'HttpClient',
+    'Async HTTP client without <code>curl</code> required. Uses sockets when curl is missing, supports concurrent requests and streaming responses.',
+    'wp-php-toolkit/http-client',
+    [
+        ('Why this exists',
+            '<p>A plugin installer starts with one request to download <code>plugin.zip</code>. A migration then adds progress reporting, a ten-request media window, resumable downloads, and a remote ZIP reader that feeds ZipFilesystem directly. Those workflows need the same request API from the first GET to the final streamed archive.</p>'
+            '<p>The HttpClient component gives the toolkit a small request/response model, middleware for redirects and caching, concurrent fetches, and response bodies exposed as byte streams. It runs through curl when PHP provides curl and through pure PHP sockets when it does not. Callers keep the same code path.</p>'
+            '<p>Use it to fetch plugin metadata, submit import callbacks, mirror a media library, read a WXR export, or pipe a remote archive into Zip and Filesystem code.</p>',
+            None),
+        ('GET a URL',
+            '<p class="callout"><strong>Network access in the demo runtime.</strong> Live request examples show the real API, but outbound HTTP in browser sandboxes may require a CORS proxy.</p>'
+            '<p>The smallest flow has three steps: create a request, wait until headers arrive, then consume the body stream. This is intentionally close to the Fetch API shape, but the body is a toolkit byte stream instead of a buffered string.</p>',
+            ('get.php', php('''use WordPress\\HttpClient\\Client;
+use WordPress\\HttpClient\\Request;
+
+$client  = new Client();
+$stream  = $client->fetch( new Request( 'https://example.com/' ) );
+
+$response = $stream->await_response();
+echo "status: " . $response->status_code . "\\n";
+echo "first 80 bytes: " . substr( $stream->consume_all(), 0, 80 ) . "\\n";'''))),
+        ('POST to a URL',
+            '<p>Uploads use the same shape. The only difference is that the request declares a method, request headers, and an upload body stream. Here the body is form-encoded text wrapped in <code>MemoryPipe</code>; a file upload could provide a file-backed read stream instead.</p>',
+            ('post.php', php('''use WordPress\\HttpClient\\Client;
+use WordPress\\HttpClient\\Request;
+use WordPress\\ByteStream\\MemoryPipe;
+
+$payload = http_build_query(
+\tarray(
+\t\t'title' => 'Hello',
+\t\t'tags'  => 'http,php',
+\t),
+\t'',
+\t'&'
+);
+
+$client  = new Client();
+$request = new Request( 'https://httpbin.org/post', array(
+\t'method'      => 'POST',
+\t'headers'     => array(
+\t\t'content-type'   => 'application/x-www-form-urlencoded',
+\t\t'content-length' => (string) strlen( $payload ),
+\t),
+\t'body_stream' => new MemoryPipe( $payload ),
+) );
+
+$response = $client->fetch( $request )->json();
+echo "Server saw form title: " . $response['form']['title'] . "\\n";'''))),
+        ('Build a JSON request object',
+            '<p>A <code>Request</code> is just data until a client enqueues it. That makes it easy to test request construction without network access. The constructor normalizes headers, calculates <code>content-length</code> when the body stream has a known length, and moves URL credentials into an Authorization header.</p>',
+            ('request-object.php', php('''use WordPress\\ByteStream\\MemoryPipe;
+use WordPress\\HttpClient\\Request;
+
+$body = new MemoryPipe( json_encode( array(
+\t'title' => 'Hello',
+\t'tags'  => array( 'docs', 'php' ),
+) ) );
+$body->close_writing();
+
+$request = new Request( 'https://user:secret@api.example.test/posts', array(
+\t'method'      => 'POST',
+\t'headers'     => array( 'content-type' => 'application/json' ),
+\t'body_stream' => $body,
+) );
+
+echo $request->method . ' ' . $request->url . "\\n";
+echo "content-type: " . $request->get_header( 'content-type' ) . "\\n";
+echo "content-length: " . $request->get_header( 'content-length' ) . "\\n";
+echo "authorization: " . substr( $request->get_header( 'authorization' ), 0, 10 ) . "...\\n";'''))),
+        ('Parse response headers',
+            '<p>Most applications receive <code>Response</code> objects from <code>await_response()</code>. Transports, middleware, and tests sometimes need the lower-level parser: <code>Response::from_http_headers()</code> turns raw HTTP header bytes into normalized status and case-insensitive headers.</p>',
+            ('parse-response.php', php('''use WordPress\\HttpClient\\Request;
+use WordPress\\HttpClient\\Response;
+
+$request = new Request( 'https://api.example.test/posts/42' );
+$raw = "HTTP/1.1 201 Created\\r\\n"
+\t. "Content-Type: application/json\\r\\n"
+\t. "Location: /posts/42\\r\\n"
+\t. "Content-Length: 27\\r\\n\\r\\n";
+
+$response = Response::from_http_headers( $raw, $request );
+
+echo "status: " . $response->status_code . ' ' . $response->get_reason_phrase() . "\\n";
+echo "ok:     " . ( $response->ok() ? 'yes' : 'no' ) . "\\n";
+echo "type:   " . $response->get_header( 'CONTENT-TYPE' ) . "\\n";
+echo "size:   " . $response->total_bytes . " bytes\\n";'''))),
+        ('Pick the right reading style',
+            '<p>There are three common ways to consume a response. Start simple, then move down the table only when the workflow demands it.</p>'
+            '<table><thead><tr><th>Style</th><th>Use when</th><th>Tradeoff</th></tr></thead><tbody>'
+            '<tr><td><code>consume_all()</code> or <code>json()</code></td><td>Small HTML, JSON, or API responses.</td><td>Buffers the full body.</td></tr>'
+            '<tr><td><code>Client::await_next_event()</code></td><td>Progress bars, streaming to disk, queues, failure handling.</td><td>You own the event loop.</td></tr>'
+            '<tr><td>Filesystem and parser composition</td><td>Remote ZIPs, WXR files, import pipelines.</td><td>Requires a stream-aware consumer.</td></tr>'
+            '</tbody></table>',
+            None),
+        ('Choose a transport',
+            '<p>The transport is the I/O backend. It should not change your request, response, redirect, cache, or stream code; it only changes how bytes move across the network.</p>'
+            '<table><thead><tr><th>Transport</th><th>What it does</th><th>When to choose it</th></tr></thead><tbody>'
+            '<tr><td><code>auto</code></td><td>Uses curl when loaded, otherwise sockets.</td><td>Application default. Best when you want portability and the fastest available backend.</td></tr>'
+            '<tr><td><code>sockets</code></td><td>Uses PHP stream sockets, no curl extension.</td><td>Tests, Playground-style runtimes, hosts where curl is unavailable, or proving the dependency-free path works.</td></tr>'
+            '<tr><td><code>curl</code></td><td>Uses the curl extension.</td><td>Hosts where curl is available and you want to compare behavior or performance explicitly.</td></tr>'
+            '</tbody></table>'
+            '<p><code>concurrency</code>, <code>timeout_ms</code>, <code>cache_dir</code>, redirects, and response streaming sit above the transport, so the examples later on work with either backend.</p>',
+            ('transports.php', php('''use WordPress\\HttpClient\\Client;
+
+$default = new Client(); // Same as array( 'transport' => 'auto' ).
+
+$portable = new Client( array(
+\t'transport' => 'sockets',
+) );
+
+if ( extension_loaded( 'curl' ) ) {
+\t$curl = new Client( array(
+\t\t'transport' => 'curl',
+\t) );
+}'''), False)),
+        ('Follow redirects and inspect the final request',
+            '<p>Redirects are middleware, not transport behavior. The client follows up to five redirects by default. The original <code>Request</code> keeps a chain to the final request, so importers can log where a source URL actually landed.</p>',
+            ('redirects.php', php('''use WordPress\\HttpClient\\Client;
+use WordPress\\HttpClient\\Request;
+
+$client   = new Client();
+$request  = new Request( 'https://httpbin.org/redirect-to?url=https://example.com/' );
+$stream   = $client->fetch( $request );
+$response = $stream->await_response();
+$stream->consume_all();
+
+$final = $request->latest_redirect();
+echo "original: " . $request->url . "\\n";
+echo "final:    " . $final->url . "\\n";
+echo "status:   " . $response->status_code . "\\n";'''), False)),
+        ('Cache repeatable GET responses',
+            '<p>Pass <code>cache_dir</code> to add disk caching for cacheable GET and HEAD responses. Fresh cached responses replay the same header/body events as a network response, so crawlers and importers do not need a separate cache code path. Non-GET requests invalidate matching cache entries instead of being cached.</p>',
+            ('cache.php', php('''use WordPress\\HttpClient\\Client;
+use WordPress\\HttpClient\\Request;
+
+$cache_dir = sys_get_temp_dir() . '/http-cache-' . uniqid();
+mkdir( $cache_dir );
+
+$client = new Client( array( 'cache_dir' => $cache_dir ) );
+$url    = 'https://httpbin.org/cache/60';
+
+for ( $i = 1; $i <= 2; $i++ ) {
+\t$stream   = $client->fetch( new Request( $url ) );
+\t$response = $stream->await_response();
+\t$body     = $stream->consume_all();
+\techo "request {$i}: HTTP " . $response->status_code . ', body=' . strlen( $body ) . " bytes\\n";
+}
+
+echo "cache files: " . count( glob( $cache_dir . '/*' ) ) . "\\n";'''), False)),
+        ('Handle failures without losing the queue',
+            '<p>Failures arrive as events. That lets a crawler, importer, package installer, or media frontloader log one bad URL and keep processing the rest of the queue. Treat failure handling as part of the event loop, not as one global try/catch around the whole batch.</p>',
+            ('failures.php', php('''use WordPress\\HttpClient\\Client;
+use WordPress\\HttpClient\\Request;
+
+$client = new Client( array( 'timeout_ms' => 5000 ) );
+$client->enqueue( array(
+\tnew Request( 'https://example.com/', array( 'method' => 'HEAD' ) ),
+\tnew Request( 'https://example.invalid/missing' ),
+) );
+
+while ( $client->await_next_event() ) {
+\t$request = $client->get_request();
+\t$event   = $client->get_event();
+
+\tif ( Client::EVENT_GOT_HEADERS === $event ) {
+\t\techo "ok: " . $request->url . " HTTP " . $request->response->status_code . "\\n";
+\t} elseif ( Client::EVENT_FAILED === $event ) {
+\t\techo "failed: " . $request->url . "\\n";
+\t} elseif ( Client::EVENT_FINISHED === $event ) {
+\t\techo "finished: " . $request->url . "\\n";
+\t}
+}'''), False)),
+        ('Monitor download progress',
+            '<p>When you care about progress, use the event loop directly. Count bytes from each <code>EVENT_BODY_CHUNK_AVAILABLE</code> event and compare them with <code>Content-Length</code> when the server provides one.</p>',
+            ('progress.php', php('''use WordPress\\HttpClient\\Client;
+use WordPress\\HttpClient\\Request;
+
+$url  = 'https://raw.githubusercontent.com/WordPress/php-toolkit/trunk/components/Zip/Tests/fixtures/childrens-literature.zip';
+$dest = sys_get_temp_dir() . '/progress-' . uniqid() . '.zip';
+
+$client  = new Client();
+$request = new Request( $url );
+$client->enqueue( array( $request ) );
+
+$downloaded = 0;
+$last_step  = -1;
+@unlink( $dest );
+
+while ( $client->await_next_event() ) {
+\t$event   = $client->get_event();
+\t$request = $client->get_request();
+
+\tif ( Client::EVENT_GOT_HEADERS === $event ) {
+\t\techo "status: " . $request->response->status_code . "\\n";
+\t\tcontinue;
+\t}
+
+\tif ( Client::EVENT_BODY_CHUNK_AVAILABLE === $event ) {
+\t\t$chunk       = $client->get_response_body_chunk();
+\t\t$downloaded += strlen( $chunk );
+\t\tfile_put_contents( $dest, $chunk, FILE_APPEND );
+
+\t\t$total = $request->response->total_bytes;
+\t\tif ( $total ) {
+\t\t\t$step = min( 100, (int) floor( $downloaded / $total * 100 ) );
+\t\t\tif ( $step >= $last_step + 25 || 100 === $step ) {
+\t\t\t\techo "progress: {$step}% ({$downloaded}/{$total} bytes)\\n";
+\t\t\t\t$last_step = $step;
+\t\t\t}
+\t\t} else {
+\t\t\techo "downloaded: {$downloaded} bytes\\n";
+\t\t}
+\t\tcontinue;
+\t}
+
+\tif ( Client::EVENT_FINISHED === $event ) {
+\t\techo "saved: {$dest}\\n";
+\t} elseif ( Client::EVENT_FAILED === $event ) {
+\t\techo "failed: " . $request->error->message . "\\n";
+\t}
+}'''))),
+        ('Keep a sliding window of 10 requests',
+            '<p>For large queues, do not enqueue everything at once. Keep at most ten active requests, enqueue another as each one finishes, and let the client multiplex only that window.</p>',
+            ('sliding-window.php', php('''use WordPress\\HttpClient\\Client;
+use WordPress\\HttpClient\\Request;
+
+$urls = array();
+for ( $i = 1; $i <= 25; $i++ ) {
+\t$urls[] = 'https://example.com/?request=' . $i;
+}
+
+$client  = new Client( array( 'concurrency' => 10 ) );
+$pending = $urls;
+$active  = array();
+$done    = 0;
+
+$enqueue_next = function () use ( &$pending, &$active, $client ) {
+\tif ( ! $pending ) {
+\t\treturn;
+\t}
+\t$url     = array_shift( $pending );
+\t$request = new Request( $url, array( 'method' => 'HEAD' ) );
+\t$active[ $request->id ] = $request;
+\t$client->enqueue( array( $request ) );
+};
+
+for ( $i = 0; $i < 10; $i++ ) {
+\t$enqueue_next();
+}
+
+while ( $active && $client->await_next_event() ) {
+\t$request = $client->get_request();
+\t$event   = $client->get_event();
+
+\tif ( Client::EVENT_GOT_HEADERS === $event ) {
+\t\techo "headers {$request->id}: " . $request->response->status_code . "\\n";
+\t\tcontinue;
+\t}
+
+\tif ( Client::EVENT_FINISHED === $event || Client::EVENT_FAILED === $event ) {
+\t\tunset( $active[ $request->id ] );
+\t\t$done++;
+\t\techo "finished {$done}/25, active=" . count( $active ) . "\\n";
+\t\t$enqueue_next();
+\t}
+}'''))),
+        ('Resume a partial download',
+            '<p>Resuming is an HTTP contract between you and the server. Save what you already have, send a <code>Range</code> request for the remaining bytes, and append only if the server returns <code>206 Partial Content</code>.</p>',
+            ('resume-download.php', php('''use WordPress\\HttpClient\\Client;
+use WordPress\\HttpClient\\Request;
+
+$url  = 'https://raw.githubusercontent.com/WordPress/php-toolkit/trunk/components/Zip/Tests/fixtures/childrens-literature.zip';
+$dest = sys_get_temp_dir() . '/resume-' . uniqid() . '.zip';
+
+$client = new Client();
+
+// Simulate an interrupted first attempt by downloading only the first 32 KB.
+$first = new Request( $url, array(
+\t'headers' => array( 'range' => 'bytes=0-32767' ),
+) );
+$stream   = $client->fetch( $first );
+$response = $stream->await_response();
+file_put_contents( $dest, $stream->consume_all() );
+
+if ( 206 !== $response->status_code ) {
+\techo "Server did not honor Range; start over with a full download.\\n";
+\texit;
+}
+
+$downloaded = filesize( $dest );
+echo "partial file: {$downloaded} bytes\\n";
+
+$resume = new Request( $url, array(
+\t'headers' => array( 'range' => 'bytes=' . $downloaded . '-' ),
+) );
+$stream   = $client->fetch( $resume );
+$response = $stream->await_response();
+
+if ( 206 !== $response->status_code ) {
+\techo "Server did not resume; discard partial file and retry from byte 0.\\n";
+\texit;
+}
+
+while ( ! $stream->reached_end_of_data() ) {
+\t$n = $stream->pull( 8192 );
+\tif ( 0 === $n ) {
+\t\tbreak;
+\t}
+\tfile_put_contents( $dest, $stream->consume( $n ), FILE_APPEND );
+}
+
+echo "complete file: " . filesize( $dest ) . " bytes\\n";
+echo "saved: {$dest}\\n";'''))),
+        ('Stream-unzip a remote archive',
+            '<p>Mount the remote archive with <code>ZipFilesystem</code>, then copy it into any writable filesystem. <code>SeekableRequestReadStream</code> caches received bytes to a temporary file so <code>ZipFilesystem</code> can read the central directory and seek to entries without first writing the ZIP yourself.</p>',
+            ('stream-unzip.php', php('''use WordPress\\HttpClient\\Client;
+use WordPress\\HttpClient\\ByteStream\\SeekableRequestReadStream;
+use WordPress\\HttpClient\\Request;
+use WordPress\\Filesystem\\LocalFilesystem;
+use WordPress\\Zip\\ZipFilesystem;
+use function WordPress\\Filesystem\\copy_between_filesystems;
+use function WordPress\\Filesystem\\ls_recursive;
+
+$url  = 'https://raw.githubusercontent.com/WordPress/php-toolkit/trunk/components/Zip/Tests/fixtures/childrens-literature.zip';
+$root = sys_get_temp_dir() . '/remote-zip-' . uniqid();
+mkdir( $root );
+
+$client = new Client();
+$reader = new SeekableRequestReadStream(
+\tnew Request( $url ),
+\tarray( 'client' => $client )
+);
+
+$response = $reader->await_response();
+if ( ! $response->ok() ) {
+\techo "HTTP " . $response->status_code . "\\n";
+\texit;
+}
+
+$zip   = ZipFilesystem::create( $reader );
+$local = LocalFilesystem::create( $root );
+
+copy_between_filesystems( array(
+\t'source_filesystem' => $zip,
+\t'source_path'       => '/',
+\t'target_filesystem' => $local,
+\t'target_path'       => '/',
+) );
+
+$tree  = ls_recursive( $local, '/' );
+$files = 0;
+array_walk_recursive( $tree, function ( $value, $key ) use ( &$files ) {
+\tif ( 'type' === $key && 'file' === $value ) {
+\t\t$files++;
+\t}
+} );
+
+echo "extracted {$files} files\\n";
+echo "root: {$root}\\n";'''))),
+        ('Parallel fan-out: fetch many URLs at once',
+            '<p>Enqueue a batch of requests and react to events as they fire. The client multiplexes them — total wall time is roughly the slowest request, not the sum.</p>',
+            ('fan-out.php', php('''use WordPress\\HttpClient\\Client;
+use WordPress\\HttpClient\\Request;
+
+$urls = array(
+\t'https://wordpress.org/',
+\t'https://make.wordpress.org/',
+\t'https://developer.wordpress.org/',
+);
+
+$client = new Client();
+$client->enqueue( array_map( function ( $url ) {
+\treturn new Request( $url, array( 'method' => 'HEAD' ) );
+}, $urls ) );
+
+$results = array();
+while ( $client->await_next_event() ) {
+\t$request = $client->get_request();
+\tif ( Client::EVENT_GOT_HEADERS === $client->get_event() ) {
+\t\t$results[ $request->url ] = $request->response->status_code;
+\t} elseif ( Client::EVENT_FAILED === $client->get_event() ) {
+\t\t$results[ $request->url ] = 'ERR ' . $request->error->message;
+\t}
+}
+
+foreach ( $results as $url => $status ) {
+\tprintf( "%-40s %s\\n", $url, $status );
+}'''))),
+        ('Stream a download to disk without OOM',
+            '<p>Process the body chunk-by-chunk via the event loop. Memory stays flat regardless of file size.</p>',
+            ('stream-to-disk.php', php('''use WordPress\\HttpClient\\Client;
+use WordPress\\HttpClient\\Request;
+
+$dest   = sys_get_temp_dir() . '/wp-readme.html';
+$client = new Client();
+$client->enqueue( array( new Request( 'https://wordpress.org/' ) ) );
+
+$bytes = 0;
+@unlink( $dest );
+
+while ( $client->await_next_event() ) {
+\tswitch ( $client->get_event() ) {
+\t\tcase Client::EVENT_BODY_CHUNK_AVAILABLE:
+\t\t\t$chunk  = $client->get_response_body_chunk();
+\t\t\t$bytes += strlen( $chunk );
+\t\t\tfile_put_contents( $dest, $chunk, FILE_APPEND );
+\t\t\tbreak;
+\t\tcase Client::EVENT_FINISHED:
+\t\t\techo "Wrote {$bytes} bytes to {$dest}\\n";
+\t\t\tbreak;
+\t}
+}
+
+echo "Peak memory: " . round( memory_get_peak_usage( true ) / 1024 / 1024, 2 ) . " MB\\n";'''))),
+    ]))
+
+# ===========================================================================
+# HttpServer
+# ===========================================================================
+COMPONENTS.append(('httpserver', 'HttpServer',
+    'A minimal blocking TCP HTTP server in pure PHP. For CLI tools and tests, not for production traffic.',
+    'wp-php-toolkit/http-server',
+    [
+        ('Why this exists',
+            '<p>Sometimes a PHP tool needs a tiny local HTTP surface: a test fixture server, a webhook receiver during development, a CLI tool with a browser UI, or a demo endpoint for another component. Pulling in a production web framework would obscure the example and add dependencies the toolkit avoids.</p>'
+            '<p>The HttpServer component is intentionally small: a blocking TCP server, incoming request objects, and response writers. It is useful for local tools and tests. It is not a replacement for nginx, Apache, php-fpm, RoadRunner, Swoole, or a production application server.</p>',
+            None),
+        ('Hello world on port 8080',
+            '<p class="callout"><strong>Run on your machine:</strong> the Playground sandbox does not allow processes to bind listening TCP ports. Save this snippet locally and run <code>php hello-server.php</code>.</p>',
+            ('hello-server.php', '''<?php
+require __DIR__ . '/vendor/autoload.php';
+
+use WordPress\\HttpServer\\TcpServer;
+use WordPress\\HttpServer\\IncomingRequest;
+use WordPress\\HttpServer\\Response\\ResponseWriteStream;
+
+$server = new TcpServer( '127.0.0.1', 8080 );
+
+$server->set_handler( function ( IncomingRequest $request, ResponseWriteStream $response ) {
+\t$response->send_http_code( 200 );
+\t$response->send_header( 'Content-Type', 'text/plain' );
+\t$response->append_bytes( "Hello from " . $request->method . " " . $request->url . "\\n" );
+} );
+
+$server->serve( function ( $host, $port ) {
+\techo "Listening on http://{$host}:{$port}\\n";
+} );''', False)),
+        ('A tiny JSON router',
+            '<p class="callout"><strong>Run on your machine:</strong> needs a listening port. Once running, try <code>curl localhost:8080/api/status</code>.</p>'
+            '<p>Build a CLI tool with a web UI by switching on the parsed path and method.</p>',
+            ('mini-router.php', '''<?php
+require __DIR__ . '/vendor/autoload.php';
+
+use WordPress\\HttpServer\\TcpServer;
+use WordPress\\HttpServer\\IncomingRequest;
+use WordPress\\HttpServer\\Response\\ResponseWriteStream;
+
+$server = new TcpServer( '127.0.0.1', 8080 );
+
+$server->set_handler( function ( IncomingRequest $request, ResponseWriteStream $response ) {
+\t$path = $request->get_parsed_url()->pathname;
+
+\tif ( '/api/status' === $path ) {
+\t\t$response->send_http_code( 200 );
+\t\t$response->send_header( 'Content-Type', 'application/json' );
+\t\t$response->append_bytes( json_encode( array(
+\t\t\t'ok'     => true,
+\t\t\t'pid'    => getmypid(),
+\t\t\t'memory' => memory_get_usage( true ),
+\t\t) ) );
+\t\treturn;
+\t}
+
+\tif ( '/api/echo' === $path && 'POST' === $request->method ) {
+\t\t$body = '';
+\t\twhile ( ! $request->body_stream->reached_end_of_data() ) {
+\t\t\t$n = $request->body_stream->pull( 4096 );
+\t\t\tif ( $n > 0 ) $body .= $request->body_stream->consume( $n );
+\t\t}
+\t\t$response->send_http_code( 200 );
+\t\t$response->send_header( 'Content-Type', 'text/plain' );
+\t\t$response->append_bytes( $body );
+\t\treturn;
+\t}
+
+\t$response->send_http_code( 404 );
+\t$response->append_bytes( "Not found\\n" );
+} );
+
+$server->serve();''', False)),
+        ('Buffered response with auto Content-Length',
+            '<p>Use <code>BufferingResponseWriter</code> when you want the framework to compute <code>Content-Length</code> for you, or when the runtime is CGI-shaped and expects the full body up front. This one runs anywhere — no socket required.</p>',
+            ('buffered-writer.php', php('''use WordPress\\HttpServer\\Response\\BufferingResponseWriter;
+
+$writer = new BufferingResponseWriter();
+$writer->send_http_code( 200 );
+$writer->send_header( 'Content-Type', 'text/html' );
+$writer->append_bytes( '<!doctype html><title>Hi</title><h1>Hello</h1>' );
+$writer->append_bytes( '<p>Buffered body, sent at the end.</p>' );
+
+ob_start();
+$writer->close_writing();
+$response_body = ob_get_clean();
+
+echo "headers before send:\\n";
+foreach ( $writer->get_buffered_headers() as $name => $value ) {
+\techo "{$name}: {$value}\\n";
+}
+echo "\\nbody:\\n" . $response_body;'''))),
+    ]))
+
+# ===========================================================================
+# CORSProxy
+# ===========================================================================
+COMPONENTS.append(('corsproxy', 'CORSProxy',
+    'A small PHP CORS proxy intended for browser-side code that needs to reach servers without CORS headers.',
+    'wp-php-toolkit/corsproxy',
+    [
+        ('Why this exists',
+            '<p>A Playground-style browser tool reads <code>https://api.github.com/repos/WordPress/php-toolkit</code>, a plugin ZIP from <code>downloads.wordpress.org</code>, or a raw fixture from GitHub. The browser blocks the response when the upstream server does not send the required CORS headers, even though PHP can fetch the same public URL server-side.</p>'
+            '<p>The CORSProxy component is that server-side bridge. It accepts a target URL, fetches it from PHP, and returns a browser-readable response. Because an open proxy is a security and abuse risk, real deployments should add host allowlists, rate limits, header controls, and private-network protections appropriate to their environment.</p>',
+            None),
+        ('Run the proxy locally',
+            '<p class="callout"><strong>Run on your machine:</strong> the proxy needs to listen on a port. Start PHP\'s built-in server and request any HTTPS URL through it.</p>'
+            '<pre><code>PLAYGROUND_CORS_PROXY_DISABLE_RATE_LIMIT=1 \\\n  php -S 127.0.0.1:5263 vendor/wp-php-toolkit/corsproxy/cors-proxy.php\n\n# In another terminal:\ncurl -s "http://127.0.0.1:5263/cors-proxy.php/https://api.github.com/repos/WordPress/php-toolkit" | head\n</code></pre>',
+            None),
+        ('Production rate limiting',
+            '<p>Drop a <code>cors-proxy-config.php</code> next to <code>cors-proxy.php</code>. If that file defines a <code>playground_cors_proxy_maybe_rate_limit()</code> function, the proxy calls it before forwarding any request — your one chance to reject early. Without the file, the proxy applies its default rate limiter, which is fine for development but should be replaced for any deployment that gets real traffic.</p>'
+            '<p>This example keeps a per-IP sliding-window log of request timestamps on disk: each IP gets at most 30 requests per 60 seconds. Replace the file storage with Redis or memcached for multi-host deployments.</p>',
+            ('cors-proxy-config.php', '''<?php
+// cors-proxy-config.php — placed next to cors-proxy.php. This file must not print anything.
+// Sliding-window limiter: answers 429 and exits once an IP reaches $max_req requests within $window seconds.
+function playground_cors_proxy_maybe_rate_limit() {
+\t$ip      = isset( $_SERVER['REMOTE_ADDR'] ) ? $_SERVER['REMOTE_ADDR'] : '0.0.0.0';
+\t$bucket  = sys_get_temp_dir() . '/cors-rl-' . md5( $ip ); // One timestamp file per client IP.
+\t$now     = time();
+\t$window  = 60; // Window length in seconds.
+\t$max_req = 30; // Requests allowed per IP per window.
+
+\t$hits = array();
+\tif ( file_exists( $bucket ) ) {
+\t\t$hits = json_decode( file_get_contents( $bucket ), true );
+\t\tif ( ! is_array( $hits ) ) $hits = array(); // Corrupt or empty file: start over.
+\t}
+\t$hits = array_filter( $hits, function ( $t ) use ( $now, $window ) {
+\t\treturn $t > $now - $window; // Keep only hits that are still inside the window.
+\t} );
+
+\tif ( count( $hits ) >= $max_req ) {
+\t\theader( 'Retry-After: ' . $window );
+\t\thttp_response_code( 429 );
+\t\techo 'Rate limit exceeded';
+\t\texit;
+\t}
+
+\t$hits[] = $now;
+\tfile_put_contents( $bucket, json_encode( array_values( $hits ) ), LOCK_EX ); // Serialize concurrent writers.
+}
+
+// No echo at file level: the proxy includes this file on every request, so output would precede its headers.''', False)),
+        ('Allowlist upstream hosts',
+            '<p>Out of the box the proxy will fetch any public URL. Most real deployments want a fixed list of upstreams — GitHub, Packagist, wp.org. Both the rate-limit logic and the allowlist live in the same hook, since <code>cors-proxy.php</code> only calls <code>playground_cors_proxy_maybe_rate_limit()</code> once. The example below shows just the allowlist concern; in practice you stack both in one function inside <code>cors-proxy-config.php</code>.</p>',
+            ('cors-proxy-config-allowlist.php', '''<?php
+// cors-proxy-config.php — combine with the rate-limit example above. This file must not print anything.
+// Allowlist check: answers 403 and exits unless the requested upstream host is in $allow.
+function playground_cors_proxy_maybe_rate_limit() {
+\t$allow = array(
+\t\t'api.github.com',
+\t\t'raw.githubusercontent.com',
+\t\t'codeload.github.com',
+\t\t'repo.packagist.org',
+\t\t'downloads.wordpress.org',
+\t\t'api.wordpress.org',
+\t);
+
+\t$target = isset( $_SERVER['PATH_INFO'] ) ? $_SERVER['PATH_INFO'] : ( '/' . ( isset( $_SERVER['QUERY_STRING'] ) ? $_SERVER['QUERY_STRING'] : '' ) );
+\t$target = ltrim( $target, '/' ); // Drop the leading slash so the target URL can be parsed.
+\t$host   = parse_url( $target, PHP_URL_HOST );
+
+\tif ( ! $host || ! in_array( strtolower( $host ), $allow, true ) ) {
+\t\thttp_response_code( 403 );
+\t\theader( 'Content-Type: text/plain' );
+\t\techo "Upstream not allowed: " . ( $host ? $host : '(none)' );
+\t\texit;
+\t}
+}
+
+// No echo at file level: the proxy includes this file on every request, so output would precede its headers.''', False)),
+        ('Browser-side fetch through the proxy',
+            '<p>Once deployed, the client side is just <code>fetch()</code> with the proxy URL. Drop this into any HTML page.</p>'
+            '<pre><code>const PROXY = "https://cors.example.com/cors-proxy.php";\n\nasync function viaProxy(url, init = {}) {\n  const res = await fetch(`${PROXY}/${url}`, {\n    ...init,\n    headers: {\n      ...(init.headers || {}),\n      "X-Cors-Proxy-Allowed-Request-Headers": "Authorization",\n    },\n  });\n  if (!res.ok) throw new Error(`Proxy returned ${res.status}`);\n  return res;\n}\n\nconst repo = await viaProxy("https://api.github.com/repos/WordPress/php-toolkit").then(r =&gt; r.json());\nconsole.log(repo.full_name, repo.stargazers_count);\n</code></pre>',
+            None),
+        ('Deploy behind nginx',
+            '<p>The proxy is a single PHP script — any SAPI works. nginx + php-fpm is a common production setup. <code>PATH_INFO</code> is what the proxy reads to learn the target URL.</p>'
+            '<pre><code>server {\n  listen 443 ssl http2;\n  server_name cors.example.com;\n\n  root /var/www/cors-proxy;\n  index cors-proxy.php;\n\n  location ~ ^/cors-proxy\\.php(/.*)?$ {\n    fastcgi_pass unix:/run/php/php8.1-fpm.sock;\n    fastcgi_split_path_info ^(.+\\.php)(/.*)$;\n    fastcgi_param SCRIPT_FILENAME $document_root/cors-proxy.php;\n    fastcgi_param PATH_INFO $fastcgi_path_info;\n    include fastcgi_params;\n  }\n}\n</code></pre>',
+            None),
+    ]))
+
+# ===========================================================================
+# CLI
+# ===========================================================================
+COMPONENTS.append(('cli', 'CLI',
+    'POSIX-style argument parser. Long options, short bundles, inline values, positional args — one static call.',
+    'wp-php-toolkit/cli',
+    [
+        ('Why this exists',
+            '<p>Real CLI tools in PHP usually mean either pulling in <code>symfony/console</code> (and the transitive dependencies that come with it) or hand-rolling argv parsing that breaks the first time someone writes <code>-vvv</code> or <code>--port=8080</code>. The toolkit\'s <code>CLI</code> class is one static method, no dependencies, and handles the POSIX shapes you actually see.</p>',
+            None),
+        ('Parse a single flag',
+            '<p>The smallest useful invocation: one boolean flag, one positional. Each option is a four-tuple of <code>[ short, has_value, default, description ]</code>.</p>',
+            ('parse-flag.php', php('''use WordPress\\CLI\\CLI;
+
+$option_defs = array(
+\t'verbose' => array( 'v', false, false, 'Enable verbose output' ),
+);
+
+list( $positionals, $options ) = CLI::parse_command_args_and_options(
+\tarray( '-v', 'input.txt' ),
+\t$option_defs
+);
+
+echo "verbose: " . ( $options['verbose'] ? 'yes' : 'no' ) . "\\n";
+echo "input:   " . $positionals[0] . "\\n";'''))),
+        ('Mix values, flags, and bundles',
+            '<p>The parser accepts <code>--port 8080</code>, <code>--port=8080</code>, <code>-p 8080</code>, and <code>-p=8080</code>. It also expands bundled boolean shorts such as <code>-afv</code>.</p>',
+            ('mix-shapes.php', php('''use WordPress\\CLI\\CLI;
+
+$option_defs = array(
+\t'all'     => array( 'a', false, false, 'Process everything' ),
+\t'force'   => array( 'f', false, false, 'Overwrite existing files' ),
+\t'verbose' => array( 'v', false, false, 'Verbose output' ),
+\t'output'  => array( 'o', true,  null,  'Output path' ),
+\t'port'    => array( 'p', true,  '3000', 'Server port' ),
+);
+
+$argv = array( '-afv', '--port=8080', '-o', '/tmp/result.txt', 'input.json' );
+list( $positionals, $options ) = CLI::parse_command_args_and_options( $argv, $option_defs );
+
+echo "input:   " . $positionals[0] . "\\n";
+echo "flags:   " . implode( ', ', array_keys( array_filter( array(
+\t'all'     => $options['all'],
+\t'force'   => $options['force'],
+\t'verbose' => $options['verbose'],
+) ) ) ) . "\\n";
+echo "output:  " . $options['output'] . "\\n";
+echo "port:    " . $options['port'] . "\\n";'''))),
+        ('Validate required options',
+            '<p>The parser fills in defaults but never enforces "required". Check for <code>null</code> yourself after parsing, which leaves you in full control of the error message.</p>',
+            ('require-options.php', php('''use WordPress\\CLI\\CLI;
+
+$option_defs = array(
+\t'site-url'  => array( 'u', true, null, 'Public site URL (required)' ),
+\t'site-path' => array( null, true, null, 'Target directory (required)' ),
+);
+
+$argv = array( '--site-url', 'https://mysite.test' );
+
+try {
+\tlist( , $options ) = CLI::parse_command_args_and_options( $argv, $option_defs );
+\tforeach ( array( 'site-url', 'site-path' ) as $name ) {
+\t\tif ( null === $options[ $name ] ) {
+\t\t\tthrow new RuntimeException( "Missing required option --{$name}" );
+\t\t}
+\t}
+\techo "All good.\\n";
+} catch ( Exception $e ) {
+\techo "error: " . $e->getMessage() . "\\n";
+}'''))),
+        ('Generate --help from definitions',
+            '<p>Because each option carries its own description, you can render help text by walking the same definitions you parse with. No second source of truth.</p>',
+            ('help-text.php', php('''use WordPress\\CLI\\CLI;
+
+$option_defs = array(
+\t'output'  => array( 'o', true,  null,  'Write result to FILE' ),
+\t'force'   => array( 'f', false, false, 'Overwrite existing files' ),
+\t'verbose' => array( 'v', false, false, 'Verbose output' ),
+\t'help'    => array( 'h', false, false, 'Show this help and exit' ),
+);
+
+function render_help( array $defs ) {
+\techo "Usage: mytool [options] <input>\\n\\nOptions:\\n";
+\tforeach ( $defs as $long => $def ) {
+\t\tlist( $short, $has_value, $default, $desc ) = $def;
+\t\t$flag = ( $short ? "-{$short}, " : '    ' ) . "--{$long}";
+\t\tif ( $has_value ) $flag .= '=VALUE';
+\t\techo sprintf( "  %-28s %s\\n", $flag, $desc );
+\t}
+}
+
+list( , $options ) = CLI::parse_command_args_and_options( array( '-h' ), $option_defs );
+if ( $options['help'] ) render_help( $option_defs );'''))),
+        ('Git-style subcommands',
+            '<p>To build a tool with subcommands like <code>mytool deploy</code>, peel the first positional off <code>argv</code>, dispatch, and parse the rest with a per-command option set.</p>',
+            ('subcommands.php', php('''use WordPress\\CLI\\CLI;
+
+$commands = array(
+\t'deploy' => array(
+\t\t'env'     => array( 'e', true, 'staging', 'Target environment' ),
+\t\t'dry-run' => array( 'n', false, false, 'Preview without applying' ),
+\t),
+\t'rollback' => array(
+\t\t'to' => array( 't', true, null, 'Revision to roll back to' ),
+\t),
+);
+
+function run( array $argv, array $commands ) {
+\tif ( empty( $argv ) ) {
+\t\techo "Usage: mytool <command> [options]\\nCommands: " . implode( ', ', array_keys( $commands ) ) . "\\n";
+\t\treturn;
+\t}
+\t$command = array_shift( $argv );
+\tif ( ! isset( $commands[ $command ] ) ) {
+\t\techo "Unknown command: {$command}\\n";
+\t\treturn;
+\t}
+\tlist( $positionals, $options ) = CLI::parse_command_args_and_options( $argv, $commands[ $command ] );
+\techo "command={$command}\\n";
+\techo "options: " . json_encode( $options ) . "\\n";
+\techo "positionals: " . json_encode( $positionals ) . "\\n";
+}
+
+run( array( 'deploy', '--env=production', '-n', 'web-01', 'web-02' ), $commands );
+echo "---\\n";
+run( array( 'rollback', '-t', 'abc123' ), $commands );'''))),
+    ]))
+
+# ===========================================================================
+# Polyfill
+# ===========================================================================
+COMPONENTS.append(('polyfill', 'Polyfill',
+    'PHP 8 string functions on PHP 7.2+, WordPress hook stubs, and translation/escaping passthroughs so toolkit code runs without WordPress.',
+    'wp-php-toolkit/polyfill',
+    [
+        ('Why this exists',
+            '<p>A lot of WordPress-adjacent code wants to call <code>esc_html()</code>, <code>__()</code>, or <code>apply_filters()</code> without booting WordPress. The polyfill component provides minimal but real implementations so that code runs unchanged outside WordPress, and stays out of the way when WordPress is loaded (every function uses <code>function_exists()</code> guards).</p>',
+            None),
+        ('PHP 8 string functions on PHP 7.2',
+            '<p>The polyfills define the PHP 8 string functions <code>str_contains</code>, <code>str_starts_with</code>, and <code>str_ends_with</code>, plus <code>array_key_first</code> (added in PHP 7.3), only when the running PHP lacks them.</p>',
+            ('php8-strings.php', php('''var_dump( str_starts_with( '/var/www/html', '/var' ) );
+var_dump( str_ends_with( 'image.png', '.png' ) );
+var_dump( str_contains( 'WordPress Toolkit', 'Toolkit' ) );
+
+$first_key = array_key_first( array( 'alpha' => 1, 'beta' => 2 ) );
+echo "first key: {$first_key}\\n";'''))),
+        ('Escaping and translation stubs',
+            '<p>Pass-through implementations let you write code that looks WordPressy and runs anywhere.</p>',
+            ('wp-stubs.php', php('''echo __( 'Hello, world' ) . "\\n";
+echo esc_html( '<script>alert("xss")</script>' ) . "\\n";
+echo esc_attr( 'a "quoted" value' ) . "\\n";
+echo esc_url( 'https://example.com/?a=1&b=2' ) . "\\n";'''))),
+        ('A simple filter chain',
+            '<p>The hook system is a real implementation of the WordPress filter API: registered callbacks get applied in priority order, and each one transforms the running value.</p>',
+            ('filter-chain.php', php('''add_filter( 'sanitize_title', 'trim' );
+add_filter( 'sanitize_title', 'strtolower' );
+add_filter( 'sanitize_title', function ( $title ) {
+\treturn preg_replace( '/\\s+/', '-', $title );
+} );
+
+echo apply_filters( 'sanitize_title', '  My Post Title  ' ) . "\\n";'''))),
+        ('Priority ordering and multi-arg passing',
+            '<p>Lower priority numbers run first. The fourth argument to <code>add_filter</code> sets how many arguments the callback receives in total: the filtered value plus any extra context values passed to <code>apply_filters</code>.</p>',
+            ('priority-args.php', php('''add_filter( 'render_price', function ( $html, $price, $currency ) {
+\treturn $html . " ({$currency} markup)";
+}, 30, 3 );
+
+add_filter( 'render_price', function ( $html, $price ) {
+\treturn "<strong>{$html}</strong>";
+}, 10, 2 );
+
+add_filter( 'render_price', function ( $html, $price, $currency ) {
+\tif ( 'EUR' === $currency ) return $html . ' EUR';
+\treturn $html . " {$currency}";
+}, 20, 3 );
+
+echo apply_filters( 'render_price', '19.99', 19.99, 'EUR' ) . "\\n";'''))),
+        ('Hook-based extension points in standalone libraries',
+            '<p>Use <code>do_action</code> and <code>apply_filters</code> as cheap extension points in your own code, without depending on WordPress.</p>',
+            ('library-hooks.php', php('''class ImportPipeline {
+\tpublic function process( array $row ) {
+\t\t$row = apply_filters( 'import_pipeline_normalize', $row );
+\t\tdo_action( 'import_pipeline_row_processed', $row );
+\t\treturn $row;
+\t}
+}
+
+add_filter( 'import_pipeline_normalize', function ( $row ) {
+\t$row['email'] = strtolower( trim( $row['email'] ) );
+\treturn $row;
+} );
+
+$log = array();
+add_action( 'import_pipeline_row_processed', function ( $row ) use ( &$log ) {
+\t$log[] = $row['email'];
+} );
+
+$pipeline = new ImportPipeline();
+$pipeline->process( array( 'email' => '  USER@EXAMPLE.COM  ' ) );
+$pipeline->process( array( 'email' => 'OTHER@example.com' ) );
+
+echo implode( "\\n", $log ) . "\\n";'''))),
+    ]))
+
+# ===========================================================================
+# Blueprints
+# ===========================================================================
+COMPONENTS.append(('blueprints', 'Blueprints',
+    'Declarative WordPress site provisioning. Write a JSON description of plugins, options, and content; let the runner execute it.',
+    'wp-php-toolkit/blueprints',
+    [
+        ('Why this exists',
+            '<p>A WordPress environment is more than a database dump. It can require a specific core version, plugins, themes, site options, uploaded files, content, and setup steps. Rebuilding that by hand makes demos, tests, bug reports, workshops, and CI fixtures drift over time.</p>'
+            '<p>The Blueprints component treats site setup as data. A blueprint JSON document describes the desired steps, and the runner applies them to either a new WordPress install or an existing one. The validator exists because user-authored JSON needs clear, path-specific errors rather than generic schema failures.</p>'
+            '<p><code>RunnerConfiguration</code> separates the web root from the WordPress core directory, since real hosts often put them in different places. Both paths are explicit on the runner, never inferred.</p>'
+            '<p>Blueprints can <em>create</em> a new WordPress install (download core, set up the database, apply steps) or <em>apply to an existing</em> site. Creating a fresh install needs filesystem access this in-browser runtime doesn\'t have, so the runnable snippets focus on <code>APPLY_TO_EXISTING_SITE</code>.</p>',
+            None),
+        ('Configure a runner for an existing site',
+            '<p><code>RunnerConfiguration</code> is a fluent builder. The minimum: target site root, target site URL, execution mode.</p>',
+            ('configure.php', php('''use WordPress\\Blueprints\\Runner;
+use WordPress\\Blueprints\\RunnerConfiguration;
+
+$config = ( new RunnerConfiguration() )
+\t->set_execution_mode( Runner::EXECUTION_MODE_APPLY_TO_EXISTING_SITE )
+\t->set_target_site_root( '/wordpress' )
+\t->set_target_site_url( 'http://playground.test/' );
+
+echo "mode: " . $config->get_execution_mode() . "\\n";
+echo "root: " . $config->get_target_site_root() . "\\n";
+echo "url:  " . $config->get_target_site_url() . "\\n";'''))),
+        ('Generate blueprint JSON from PHP',
+            '<p>CI jobs and tests stay clearer when PHP builds the blueprint from data instead of hand-writing JSON. Keep the structure plain: <code>version</code>, then a list of step arrays.</p>',
+            ('build-json.php', php('''$site_name = 'Demo Site';
+$plugins   = array( 'gutenberg', 'classic-editor' );
+
+$blueprint = array(
+\t'version' => 2,
+\t'steps'   => array(
+\t\tarray(
+\t\t\t'step'    => 'setSiteOptions',
+\t\t\t'options' => array(
+\t\t\t\t'blogname'              => $site_name,
+\t\t\t\t'permalink_structure'   => '/%postname%/',
+\t\t\t\t'show_on_front'         => 'page',
+\t\t\t),
+\t\t),
+\t),
+);
+
+foreach ( $plugins as $slug ) {
+\t$blueprint['steps'][] = array(
+\t\t'step'       => 'installPlugin',
+\t\t'pluginData' => "https://downloads.wordpress.org/plugin/{$slug}.zip",
+\t);
+\t$blueprint['steps'][] = array(
+\t\t'step'   => 'activatePlugin',
+\t\t'plugin' => "{$slug}/{$slug}.php",
+\t);
+}
+
+echo json_encode( $blueprint, JSON_PRETTY_PRINT | JSON_UNESCAPED_SLASHES ) . "\\n";'''))),
+        ('Validate before running',
+            '<p>The schema validator returns a human-readable <code>ValidationError</code> instead of a generic "does not match schema" failure. Use it before handing user-authored JSON to a runner.</p>',
+            ('validate.php', php('''use WordPress\\Blueprints\\Validator\\HumanFriendlySchemaValidator;
+
+$schema = array(
+\t'type'       => 'object',
+\t'required'   => array( 'version', 'steps' ),
+\t'properties' => array(
+\t\t'version' => array( 'type' => 'integer' ),
+\t\t'steps'   => array(
+\t\t\t'type'  => 'array',
+\t\t\t'items' => array(
+\t\t\t\t'type'       => 'object',
+\t\t\t\t'required'   => array( 'step' ),
+\t\t\t\t'properties' => array(
+\t\t\t\t\t'step' => array( 'type' => 'string' ),
+\t\t\t\t),
+\t\t\t),
+\t\t),
+\t),
+);
+
+$blueprint = array(
+\t'version' => 2,
+\t'steps'   => array(
+\t\tarray( 'pluginData' => 'https://downloads.wordpress.org/plugin/gutenberg.zip' ),
+\t),
+);
+
+$error = ( new HumanFriendlySchemaValidator( $schema ) )->validate( $blueprint );
+if ( null === $error ) {
+\techo "valid\\n";
+} else {
+\techo $error->get_pretty_path() . ": " . $error->message . "\\n";
+}'''))),
+        ('The Blueprint JSON shape',
+            '<p>A blueprint is a JSON document with a <code>version</code> field and a <code>steps</code> array. Each step has a <code>"step"</code> discriminator and step-specific fields. This is the same shape used by <a href="https://playground.wordpress.net/">WordPress Playground</a>.</p>'
+            '<pre><code>{\n  "version": 2,\n  "steps": [\n    { "step": "setSiteOptions",\n      "options": {\n        "blogname": "Demo Site",\n        "permalink_structure": "/%postname%/"\n      } },\n    { "step": "installPlugin",\n      "pluginData": "https://downloads.wordpress.org/plugin/gutenberg.zip" },\n    { "step": "activatePlugin",\n      "plugin": "gutenberg/gutenberg.php" }\n  ]\n}</code></pre>',
+            None),
+    ]))
+
+# ===========================================================================
+# ToolkitCodingStandards
+# ===========================================================================
+COMPONENTS.append(('coding-standards', 'ToolkitCodingStandards',
+    'PHP_CodeSniffer sniffs used by this project: enforce Yoda comparisons and ban the short ternary where it hides falsy-value bugs.',
+    'wp-php-toolkit/toolkit-coding-standards',
+    [
+        ('Why this exists',
+            '<p>This package is not a general-purpose style guide. It holds project-specific PHP_CodeSniffer rules for review comments the toolkit wants automated: comparisons should follow the WordPress Yoda style, and short ternaries should not hide whether a fallback is meant for <code>null</code> only or for all falsy values.</p>'
+            '<p>Use it in this monorepo, or in a project that intentionally wants the same review tradeoffs. If your project does not follow WordPress-style comparisons, the Yoda sniff is probably the wrong rule for you.</p>',
+            None),
+        ('Reference the standard from your phpcs.xml',
+            '<p>The component is a PHPCS ruleset, so the useful examples are configuration and before/after code rather than runtime snippets. Activate both sniffs at once by referencing <code>WordPressToolkitCodingStandards</code>:</p>'
+            '<pre><code>&lt;?xml version="1.0"?&gt;\n&lt;ruleset name="My Project"&gt;\n  &lt;file&gt;src/&lt;/file&gt;\n\n  &lt;!-- Activate both toolkit sniffs --&gt;\n  &lt;rule ref="WordPressToolkitCodingStandards"/&gt;\n\n  &lt;!-- Or pick them individually --&gt;\n  &lt;!-- &lt;rule ref="WordPressToolkitCodingStandards.PHP.EnforceYodaComparison"/&gt; --&gt;\n  &lt;!-- &lt;rule ref="WordPressToolkitCodingStandards.PHP.DisallowShortTernary"/&gt; --&gt;\n&lt;/ruleset&gt;</code></pre>'
+            '<p>Then run phpcs and phpcbf the usual way:</p>'
+            '<pre><code>vendor/bin/phpcs --standard=phpcs.xml .\nvendor/bin/phpcbf --standard=phpcs.xml .</code></pre>',
+            None),
+        ('EnforceYodaComparison: catches accidental assignment',
+            '<p>Yoda comparisons (<code>true === $x</code>) make typo-induced assignments easier to catch and match the WordPress style used throughout the toolkit:</p>'
+            '<pre><code>// Bug: single = inside a condition. Always truthy, mutates $status.\nif ( $status = \'published\' ) {\n    publish_post( $post );\n}\n\n// Yoda style: writing this typo would be a parse error.\nif ( \'published\' === $status ) {\n    publish_post( $post );\n}</code></pre>'
+            '<p>The sniff covers <code>===</code>, <code>!==</code>, <code>==</code>, and <code>!=</code>, and stays quiet when both sides are dynamic.</p>',
+            None),
+        ('Why ban the short ternary',
+            '<p>Developers confuse the short ternary (<code>$a ?: $b</code>) with the null-coalescing operator (<code>$a ?? $b</code>). They differ on falsy-but-not-null values: <code>0 ?: \'fallback\'</code> returns <code>\'fallback\'</code>, but <code>0 ?? \'fallback\'</code> returns <code>0</code>. The sniff bans <code>?:</code> entirely so reviewers don\'t have to relitigate this on every PR.</p>',
+            None),
+        ('Review-friendly replacements',
+            '<p>When the fallback should apply only to <code>null</code>, use <code>??</code>. When the fallback should apply to every falsy value, write the full ternary so the intent is visible in review.</p>'
+            '<pre><code>// Only missing values fall back. 0 and "" are preserved.\n$limit = $request_limit ?? 20;\n\n// Any falsy value falls back. The duplicated condition is intentional.\n$title = $raw_title ? $raw_title : \'Untitled\';</code></pre>',
+            None),
+    ]))
diff --git a/bin/_expected_outputs.json b/bin/_expected_outputs.json
new file mode 100644
index 000000000..d63c37235
--- /dev/null
+++ b/bin/_expected_outputs.json
@@ -0,0 +1,81 @@
+{
+  "blockparser::audit-embeds.php": "ok     https://twitter.com/wordpress/status/1\nok     https://youtube.com/watch?v=abc\nSTALE  https://vine.co/v/xyz\n",
+  "blockparser::count-blocks.php": "   2  core/paragraph\n   1  core/group\n   1  core/heading\n   1  core/image\n",
+  "blockparser::find-custom-block.php": "1. Jane (5/5): Loved it.\n2. Joe (4/5): Pretty good.\n",
+  "blockparser::has-block.php": "has button\nmissing gallery\n",
+  "blockparser::lint-headings.php": "ok   Intro: H2\nWARN Subsection: jumped from H2 to H4\nok   Body: H3\n",
+  "blockparser::parse.php": "core/heading: Welcome\ncore/paragraph: Hello from the block editor.\n",
+  "blueprints::build-json.php": "{\n    \"version\": 2,\n    \"steps\": [\n        {\n            \"step\": \"setSiteOptions\",\n            \"options\": {\n                \"blogname\": \"Demo Site\",\n                \"permalink_structure\": \"/%postname%/\",\n                \"show_on_front\": \"page\"\n            }\n        },\n        {\n            \"step\": \"installPlugin\",\n            \"pluginData\": \"https://downloads.wordpress.org/plugin/gutenberg.zip\"\n        },\n        {\n            \"step\": \"activatePlugin\",\n            \"plugin\": \"gutenberg/gutenberg.php\"\n        },\n        {\n            \"step\": \"installPlugin\",\n            \"pluginData\": \"https://downloads.wordpress.org/plugin/classic-editor.zip\"\n        },\n        {\n            \"step\": \"activatePlugin\",\n            \"plugin\": \"classic-editor/classic-editor.php\"\n        }\n    ]\n}\n",
+  "blueprints::configure.php": "mode: apply-to-existing-site\nroot: /wordpress\nurl:  http://playground.test/\n",
+  "blueprints::validate.php": "Blueprint root[\"steps\"][0]: Missing required field: step.\n",
+  "bytestream::deflate-roundtrip.php": "original  : 1050 bytes\ndeflated  : 45 bytes (4.3%)\nround-trip: OK\n",
+  "bytestream::limited.php": "body sees: BODY:hello there\nremaining in source: |FOOTER:done\n",
+  "bytestream::lines.php": "[1] alpha\n[2] bravo\n[3] charlie\n[4] delta\n[5] echo\n",
+  "bytestream::memory-pipe.php": "got: first chunk\nsecond chunk\nthird chunk\n",
+  "bytestream::teaser-read.php": "Read 1800 bytes in 256-byte chunks.\n",
+  "cli::help-text.php": "Usage: mytool [options] <input>\n\nOptions:\n  -o, --output=VALUE           Write result to FILE\n  -f, --force                  Overwrite existing files\n  -v, --verbose                Verbose output\n  -h, --help                   Show this help and exit\n",
+  "cli::mix-shapes.php": "input:   input.json\nflags:   all, force, verbose\noutput:  /tmp/<tempfile>.txt\nport:    8080\n",
+  "cli::parse-flag.php": "verbose: yes\ninput:   input.txt\n",
+  "cli::require-options.php": "error: Missing required option --site-path\n",
+  "cli::subcommands.php": "command=deploy\noptions: {\"env\":\"production\",\"dry-run\":true}\npositionals: [\"web-01\",\"web-02\"]\n---\ncommand=rollback\noptions: {\"to\":\"abc123\"}\npositionals: []\n",
+  "dataliberation::build-wxr.php": "items: 2\nterms: 3\nBlog post exported\n",
+  "dataliberation::md-to-wxr.php": "posts: 2\nblock markup exported\nfrontmatter title exported\n",
+  "dataliberation::rewrite-urls.php": "new URL present\nold URL removed\n",
+  "dataliberation::wxr-quickstart.php": "bytes: 475\ntitle exported\nstatus exported\n",
+  "dataliberation::wxr-read.php": "site_option: {\"option_name\":\"blogname\",\"option_value\":\"Demo\"}\npost: {\"post_title\":\"First\",\"post_id\":\"1\",\"post_type\":\"post\",\"post_content\":\"Body 1\"}\npost: {\"post_title\":\"Second\",\"post_id\":\"2\",\"post_type\":\"post\",\"post_content\":\"Body 2\"}\n",
+  "encoding::mixed-encoding.php": "#1 ok: Plain ASCII\n#2 ok: Caf\u00e9\n#3 recovered as latin1: caf\u00e9\n#4 recovered as latin1: weird \u00c0 byte\n",
+  "encoding::noncharacters.php": "normal text: ok\nU+FFFE:      reject\nU+FDD0:      reject\n",
+  "encoding::pipeline.php": "good       valid=Y noncharacter=N -> Caf\u00e9\nlatin1     valid=N noncharacter=N -> caf\ufffd\noverlong   valid=N noncharacter=N -> x\ufffd\ufffdy\nnoncharac  valid=Y noncharacter=Y -> hi \ufffe there\n",
+  "encoding::scrub.php": "the byte \ufffd should not be here.\n.\ufffd\ufffd.\n",
+  "encoding::validate.php": "ASCII:         valid\nUTF-8 pencil:  valid\nlatin-1 byte:  invalid\noverlong slash: invalid\nsurrogate half: invalid\n",
+  "filesystem::atomic-write.php": "config: {\"v\":2}\nno .tmp leftovers: 1 entries in root\n",
+  "filesystem::cross-backend-copy.php": "in memory after two copies:\n  posts: 2024-01.md\n  index: <h1>Home</h1>\n",
+  "filesystem::local-chroot.php": "Hi from local disk.\nexists after cleanup? no\n",
+  "filesystem::path-helpers.php": "/var/www/site/index.php\n/a/b\na/c/e\n",
+  "filesystem::sqlite.php": "post-1.md: # Post 1\npost-2.md: # Post 2\npost-3.md: # Post 3\n",
+  "filesystem::teaser-memory.php": "Hello, world!",
+  "filesystem::test-without-disk.php": "{\"version\":\"1.2.4\"}\n",
+  "git::branches.php": "on experiment: {\"flag\":true}\non trunk:      {\"flag\":false}\n",
+  "git::commit-in-memory.php": "commit: <oid>\nHEAD: <oid>\nREADME: # My Project\n",
+  "git::git-filesystem.php": "tree:\n  /posts/about.md\n  /posts/hello.md\n\nhello.md now:\n# Hello\nSecond draft.\n",
+  "git::merge-branches.php": "merge head: <oid>\nconflicts:  none\nresult:\nbuy oat milk\nwalk dog\nread book\nwrite blog post\n",
+  "git::options-snapshot.php": "Files changed in last snapshot:\n  options.json\n",
+  "git::walk-history.php": "<hash>  expand examples\n<hash>  fix typo\n<hash>  add intro\n",
+  "html::absolute-links.php": "<p>See <a href=\"https://my-site.test/about\">about</a>, <a href=\"https://example.com/x\">x</a>, and <a href=\"https://my-site.test/contact.html\">contact</a>.</p>",
+  "html::bookmarks.php": "<ul data-progress=\"2/3\"><li><input type=\"checkbox\" checked> Buy milk</li><li><input type=\"checkbox\"> Walk the dog</li><li><input type=\"checkbox\" checked> Read book</li></ul>",
+  "html::breadcrumbs.php": "found 2 figure images\n<article><figure><img class=\"figure-image\" src=\"hero.jpg\" alt=\"Hero\"><figcaption>Hero shot</figcaption></figure><p>Body copy <img src=\"emoji.png\" alt=\"\"> mid-paragraph.</p><figure><img class=\"figure-image\" src=\"diagram.png\" alt=\"Diagram\"></figure></article>",
+  "html::csp-nonce.php": "nonce: <random>\n\n<head><style nonce=\"<random>\">body{font:16px sans-serif}</style></head><body><script nonce=\"<random>\">console.log(\"hi\")</script><script nonce=\"<random>\" src=\"vendor.js\"></script></body>",
+  "html::decode-entities.php": "attribute: path?a=1&b=2&copy\ntext:      AT&T \u2014 100% \ud83d\ude00\nbool(false)\n",
+  "html::lazy-load-images.php": "<article>\n\t<img decoding=\"async\" loading=\"lazy\" src=\"hero.jpg\" alt=\"Hero\">\n\t<p>Intro copy.</p>\n\t<img decoding=\"async\" loading=\"lazy\" src=\"inline.jpg\" alt=\"Inline\">\n</article>",
+  "html::outline.php": "    H1  Title\n      H2  Chapter 1\n      H2  Chapter 2\n",
+  "html::sanitize-html.php": "<p>Hi <b >friend</b>!</p><script></script><img src=x >",
+  "html::srcset-rewrite.php": "<figure><img sizes=\"(max-width: 768px) 100vw, 768px\" srcset=\"https://cdn.test/uploads/photo.jpg?w=480 480w, https://cdn.test/uploads/photo.jpg?w=768 768w, https://cdn.test/uploads/photo.jpg?w=1200 1200w\" src=\"https://cdn.test/uploads/photo.jpg\" alt=\"Sunset\"></figure>",
+  "httpclient::parse-response.php": "status: 201 Created\nok:     yes\ntype:   application/json\nsize:   27 bytes\n",
+  "httpclient::request-object.php": "POST https://api.example.test/posts\ncontent-type: application/json\ncontent-length: 39\nauthorization: Basic dXNl...\n",
+  "httpserver::buffered-writer.php": "headers before send:\nContent-Type: text/html\n\nbody:\n<!doctype html><title>Hi</title><h1>Hello</h1><p>Buffered body, sent at the end.</p>",
+  "markdown::count-blocks.php": "core/heading: 1\ncore/paragraph: 2\ncore/table: 1\ncore/code: 1\ncore/quote: 1\n",
+  "markdown::frontmatter.php": "Title: The Name of the Wind\nStatus: publish\nTags: fantasy, kingkiller\n",
+  "markdown::migrate-folder.php": "=== roadmap (/tmp/<tempfile>/roadmap.md) ===\n<!-- wp:heading {\"level\":1} -->\n<h1 class=\"wp-block-heading\" id=\"roadmap\">Roadmap</h1>\n<!-- /wp:heading -->\n\n<!-- wp:lis...\n\n=== Welcome (/tmp/<tempfile>/welcome.md) ===\n<!-- wp:paragraph -->\n<p>Hello world.</p>\n<!-- /wp:paragraph -->\n\n...\n\n",
+  "markdown::quickstart.php": "<!-- wp:heading {\"level\":1} -->\n<h1 class=\"wp-block-heading\" id=\"hello\">Hello</h1>\n<!-- /wp:heading -->\n\n<!-- wp:paragraph -->\n<p>Welcome to <b>WordPress</b>.</p>\n<!-- /wp:paragraph -->\n\n",
+  "markdown::roundtrip.php": "## Round trip\n\n- one\n- two\n- three\n\n",
+  "merge::conflicts.php": "ours:   line 2 from Alice\ntheirs: line 2 from Bob\n\n--- merged content with markers ---\nline 1\n\n<<<<<<< HEAD\nline 2 from Alice\n\n=======\nline 2 from Bob\n\n>>>>>>> incoming \n\n",
+  "merge::git-patch.php": "diff --git a/post.yml b/post.yml\n--- a/post.yml\n+++ b/post.yml\n@@ -1,4 +1,5 @@- title: Hello\n+ title: Hello, world\n  author: Alice\n- status: draft\n+ status: published\n+ tags: greeting\n  \n",
+  "merge::line-diff.php": "= alpha\n- beta\n+ BETA\n= gamma\n+ delta\n= \n",
+  "merge::sync-folder-vs-db.php": "=== hello.md ===\n(conflict \u2014 needs review)\n# Hello\n\n<<<<<<< HEAD\nDraft body, expanded on disk.\n\n=======\nNew section from the editor.\n\n>>>>>>> incoming \n\n\n=== about.md ===\n(conflict \u2014 needs review)\n# About\n\n<<<<<<< HEAD\nWho *they* are.\n\n=======\nWho we really are.\n\n>>>>>>> incoming \n\n\n",
+  "merge::three-way.php": "clean merge:\nintro updated\nbody\noutro\nappendix\n\n",
+  "polyfill::filter-chain.php": "my-post-title\n",
+  "polyfill::library-hooks.php": "user@example.com\nother@example.com\n",
+  "polyfill::php8-strings.php": "bool(true)\nbool(true)\nbool(true)\nfirst key: alpha\n",
+  "polyfill::priority-args.php": "<strong>19.99</strong> EUR (EUR markup)\n",
+  "polyfill::wp-stubs.php": "Hello, world\n&lt;script&gt;alert(&quot;xss&quot;)&lt;/script&gt;\na &quot;quoted&quot; value\nhttps://example.com/?a=1&amp;b=2\n",
+  "xml::bump-prices.php": "<catalog><book sku=\"A1\" price=\"32.99\"><title>PHP Internals</title></book><book sku=\"A2\" price=\"15.95\"><title>WordPress at Scale</title></book></catalog>",
+  "xml::opml.php": "Hacker News\thttps://news.ycombinator.com/rss\nLWN\thttps://lwn.net/headlines/rss\nWordPress\thttps://wordpress.org/news/feed/\n",
+  "xml::rewrite-wxr-urls.php": "rewrote 3 text nodes\n\n<?xml version=\"1.0\"?><rss xmlns:wp=\"http://wordpress.org/export/1.2/\"><channel><wp:base_site_url>https://new.example.com</wp:base_site_url><item><link>https://new.example.com/2024/post-1</link><guid>https://new.example.com/?p=1</guid></item></channel></rss>",
+  "xml::wxr-namespaces.php": "title: Hello World\ndc/creator: admin\nwp/post_id: 42\nwp/status: publish\n",
+  "zip::epub.php": "mimetype: application/epub+zip\nsize on disk: 839 bytes\n",
+  "zip::repack.php": "new config.json: {\"debug\":true,\"version\":\"1.0.1\"}\nuntouched: <?php echo \"hello\";\n",
+  "zip::stream-large.php": "Inflated 205000 bytes in 8 KB chunks, parsed 15000 rows.\n",
+  "zip::teaser-read.php": "Hello from inside the zip.",
+  "zip::zip-slip.php": "../../etc/passwd                              => etc/passwd\n./safe/path.txt                               => ./safe/path.txt\na/../../b/secret                              => a/../b/secret\na//b///c.txt                                  => a/b/c.txt\n../../../../root/.ssh/authorized_keys         => root/.ssh/authorized_keys\n",
+  "zip::zip-to-memfs.php": "files now in memory:\n  /app/README.md\n  /app/VERSION\n  /app/assets/style.css\n  /app/index.php\n  /app/lib/util.php\n"
+}
diff --git a/bin/build-docs-bundle.sh b/bin/build-docs-bundle.sh
new file mode 100755
index 000000000..ce6eb195d
--- /dev/null
+++ b/bin/build-docs-bundle.sh
@@ -0,0 +1,23 @@
+#!/usr/bin/env bash
+# Rebuilds docs/assets/php-toolkit.zip and regenerates the docs HTML pages.
+# Run this whenever components/ or a docs generator (bin/build-docs.py, bin/build-reference.py) changes.
+set -euo pipefail
+
+cd "$(dirname "$0")/.."
+
+echo "==> composer install --no-dev --optimize-autoloader"
+composer install --no-dev --optimize-autoloader --quiet
+
+echo "==> bundling docs/assets/php-toolkit.zip"
+mkdir -p docs/assets  # zip does not create missing parent directories
+rm -f docs/assets/php-toolkit.zip
+zip -qr docs/assets/php-toolkit.zip components vendor bootstrap.php composer.json \
+  -x "*/Tests/*" "*/tests/*" "*/.git/*" "*/.github/*" "*/node_modules/*"
+
+echo "==> regenerating legacy docs/_legacy/*/index.html"
+python3 bin/build-docs.py
+
+echo "==> regenerating docs/reference/*.html"
+python3 bin/build-reference.py
+
+echo "Done. docs/assets/php-toolkit.zip = $(du -h docs/assets/php-toolkit.zip | cut -f1)"
diff --git a/bin/build-docs.py b/bin/build-docs.py
new file mode 100755
index 000000000..ede776442
--- /dev/null
+++ b/bin/build-docs.py
@@ -0,0 +1,263 @@
+#!/usr/bin/env python3
+"""
+Generates docs/_legacy/<component>/index.html for every component plus the
+docs/_legacy/index.html landing page. The component catalog lives in
+bin/_docs_components.py so that content and orchestration stay separate.
+"""
+
+import json
+import os
+import re
+import sys
+from html import escape as h
+
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+from _docs_components import (
+    COMPONENTS,
+    COMPONENT_GUIDES,
+    COMPONENT_RELATIONS,
+    STARTER_PATHS,
+)
+
+DOCS = os.path.join(os.path.dirname(os.path.abspath(__file__)), '..', 'docs', '_legacy')  # output root
+EXPECTED_PATH = os.path.join(os.path.dirname(os.path.abspath(__file__)), '_expected_outputs.json')
+ASSET_VERSION = '20260429-concept-guide'  # appended as ?v= to the style.css and page.js URLs
+
+EXPECTED = {}  # (slug, snippet name) -> expected output text; stays empty when the JSON file is absent
+if os.path.exists(EXPECTED_PATH):
+    with open(EXPECTED_PATH) as f:
+        EXPECTED = {tuple(k.split('::')): v for k, v in json.load(f).items()}  # 'slug::name' -> tuple key
+
+PAGE_HEAD = '''<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>{title} — PHP Toolkit</title>
+<meta name="description" content="{description}">
+<link rel="stylesheet" href="../assets/style.css?v={asset_version}">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v={asset_version}" defer></script>
+</head>
+<body>
+<header class="site">
+\t<a class="brand" href="../">PHP Toolkit</a>
+\t<nav>
+\t\t<a href="../">Components</a>
+\t\t<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+\t</nav>
+</header>
+'''
+
+PAGE_FOOT = '''<footer class="site">
+\t<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
+'''
+
+
+def snippet_block(slug, name, code, runnable=True):
+    """Return a <php-snippet> element holding the PHP source and any recorded output.
+
+    <script type="application/x-php"> content is raw text (no entity decoding), so
+    the PHP is inserted verbatim; only the literal closing-tag string is guarded.
+    """
+    php_source = code.rstrip().replace('</script', '<\\/script')
+    attrs = f'blueprint="toolkit-setup" name="{h(name)}"'
+    if not runnable:
+        attrs += ' runnable="false"'
+    pieces = [
+        f'<php-snippet {attrs}>\n',
+        f'<script type="application/x-php">\n{php_source}\n</script>\n',
+    ]
+    recorded = EXPECTED.get((slug, name)) if runnable else None
+    if recorded is not None:
+        # Pre-rendered output: <php-snippet> reads this child and skips booting Playground.
+        guarded = recorded.rstrip().replace('</script', '<\\/script')
+        pieces.append(f'<script type="text/expected-output">\n{guarded}\n</script>\n')
+    pieces.append('</php-snippet>\n')
+    return ''.join(pieces)
+
+
+def render_example(slug, snippet):
+    """Render a catalog snippet tuple (name, code[, runnable]) as a <php-snippet> element."""
+    name, code = snippet[0], snippet[1]
+    # A missing third element means the snippet is runnable; otherwise use its truthiness.
+    is_runnable = bool(snippet[2]) if len(snippet) >= 3 else True
+    return snippet_block(slug, name, code, is_runnable)
+
+
+def slugify(text):  # heading text -> id: lowercase, drop chars that are not word/space/hyphen, spaces to '-'
+    return re.sub(r'[^\w\s-]', '', text.lower()).strip().replace(' ', '-')
+
+
+def render_component(slug, title, lede, install, sections):  # returns one component page as an HTML string
+    nav_items = []
+    for s, t, _, _, _ in COMPONENTS:
+        cls = ' class="current"' if s == slug else ''
+        nav_items.append(f'\t\t\t<li{cls}><a href="../{s}/">{h(t)}</a></li>')
+    sidebar = (
+        '\t<aside class="sidebar" aria-label="Component navigation">\n'
+        '\t\t<button class="sidebar-toggle" type="button" aria-expanded="false">'
+        'On this page ▾</button>\n'
+        '\t\t<nav class="toc" aria-label="Table of contents"></nav>\n'
+        '\t\t<details class="components-nav" open>\n'
+        '\t\t\t<summary>All components</summary>\n'
+        '\t\t\t<ol>\n'
+        + '\n'.join(nav_items) + '\n'
+        '\t\t\t</ol>\n'
+        '\t\t</details>\n'
+        '\t</aside>\n'
+    )
+    # Page head first; the meta description is the lede with its tags stripped, then escaped.
+    out = [PAGE_HEAD.format(
+        title=h(title),
+        description=h(re.sub(r'<[^>]+>', '', lede)),
+        asset_version=ASSET_VERSION,
+    )]
+    out.append('<div class="layout">\n')
+    out.append(sidebar)
+    out.append('\t<article class="content">\n')
+    out.append(f'\t\t<h1>{h(title)}</h1>\n')
+    out.append(f'\t\t<p class="lede">{lede}</p>\n')
+    if install:
+        out.append(f'\t\t<code class="install">composer require {h(install)}</code>\n')
+    # A leading 'Why this exists' section is treated as the intro and gets no <h2>.
+    purpose = None
+    usage_sections = sections
+    if sections and sections[0][0].lower() == 'why this exists':
+        purpose = sections[0]
+        usage_sections = sections[1:]
+    # Intro body HTML is emitted as-is (not escaped), followed by its optional example.
+    if purpose:
+        _, body_html, snippet = purpose
+        if body_html:
+            out.append(f'\t\t{body_html}\n')
+        if snippet:
+            out.append(render_example(slug, snippet))
+    # Optional guide: mental-model HTML plus a "You will learn to" list built from journey labels only.
+    guide = COMPONENT_GUIDES.get(slug, {})
+    if guide:
+        mental_model = guide.get('mental_model')
+        journey = guide.get('journey', ())
+        if mental_model:
+            out.append(f'\t\t{mental_model}\n')
+        if journey:
+            out.append('\t\t<p class="you-will-learn-label">You will learn to:</p>\n')
+            out.append('\t\t<ul class="you-will-learn">\n')
+            for label, _text in journey:
+                out.append(f'\t\t\t<li>{h(label)}</li>\n')
+            out.append('\t\t</ul>\n')
+    # The runtime note is emitted only when the component has an install value.
+    if install:
+        out.append(
+            '\t\t<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. '
+            'Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. '
+            'Static snippets show config or shell commands that need a real local environment.</p>\n'
+        )
+    # Remaining sections: an <h2> whose id is the slugified heading, optional body HTML, optional example.
+    for heading, body_html, snippet in usage_sections:
+        out.append(f'\t\t<h2 id="{slugify(heading)}">{h(heading)}</h2>\n')
+        if body_html:
+            out.append(f'\t\t{body_html}\n')
+        if snippet:
+            out.append(render_example(slug, snippet))
+    # "See also" links from COMPONENT_RELATIONS; the reason text is inserted unescaped.
+    related = COMPONENT_RELATIONS.get(slug, ())
+    if related:
+        out.append('\t\t<h2 id="see-also">See also</h2>\n')
+        out.append('\t\t<ul class="related-components">\n')
+        for related_slug, related_title, reason in related:
+            out.append(
+                f'\t\t\t<li><a href="../{related_slug}/">{h(related_title)}</a>'
+                f'<span>{reason}</span></li>\n'
+            )
+        out.append('\t\t</ul>\n')
+    out.append('\t</article>\n</div>\n')
+    out.append(PAGE_FOOT)
+    return ''.join(out)
+
+
+def render_index():  # returns the landing page HTML: starter-path cards plus one card per component
+    title_by_slug = {slug: title for slug, title, _, _, _ in COMPONENTS}
+    cards = []
+    for slug, title, lede, _, _ in COMPONENTS:
+        clean = re.sub(r'<[^>]+>', '', lede)  # lede with tags stripped
+        first = clean.split('.')[0]  # text before the first period
+        if len(first) > 110:  # too long for a card: cut at 107 chars, back up to a space, add an ellipsis
+            first = first[:107].rsplit(' ', 1)[0] + '…'
+        suffix = '' if first.endswith(('…', '.')) else '.'
+        cards.append(
+            f'\t\t<li><a href="{slug}/"><strong>{h(title)}</strong>'
+            f'<span>{h(first)}{suffix}</span></a></li>'
+        )
+    cards_html = '\n'.join(cards)
+    path_cards = []
+    for title, description, slugs in STARTER_PATHS:
+        links = ' '.join(
+            f'<a href="{slug}/">{h(title_by_slug[slug])}</a>' for slug in slugs  # KeyError on a slug not in COMPONENTS
+        )
+        path_cards.append(
+            f'\t\t<li><strong>{h(title)}</strong><span>{h(description)}</span>'
+            f'<nav aria-label="{h(title)} path">{links}</nav></li>'
+        )
+    paths_html = '\n'.join(path_cards)
+    return f'''<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>PHP Toolkit — runnable docs</title>
+<meta name="description" content="Guided docs for eighteen pure-PHP libraries for WordPress and general PHP, with runnable examples powered by WordPress Playground.">
+<link rel="stylesheet" href="assets/style.css?v={ASSET_VERSION}">
+</head>
+<body>
+<header class="site">
+\t<a class="brand" href="./">PHP Toolkit</a>
+\t<nav>
+\t\t<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+\t</nav>
+</header>
+<main class="landing">
+\t<h1>PHP Toolkit</h1>
+\t<p class="lede">Eighteen standalone pure-PHP libraries for WordPress and general PHP, with no extension or Composer dependencies. Each guide starts with the story for that component, outlines the route through the page, names the main APIs, and then uses examples only where code clarifies the idea.</p>
+
+\t<h2>Choose a Path</h2>
+\t<ul class="starter-paths">
+{paths_html}
+\t</ul>
+
+\t<h2>Components</h2>
+\t<ul class="components">
+{cards_html}
+\t</ul>
+
+\t<h2>How these examples work</h2>
+\t<p>Most PHP examples embed <code>&lt;php-snippet&gt;</code> elements from <a href="https://playground.wordpress.net/">WordPress Playground</a>. The first <em>Run</em> click on a page boots a single shared PHP+WordPress runtime in your browser via WebAssembly and unzips the toolkit into it. Subsequent snippets reuse the same runtime, so only the first run pays the boot cost.</p>
+\t<p>Examples that need a local listening port, a web server, or deployment-specific config are presented as static code blocks so the page does not imply they can run in the browser sandbox.</p>
+\t<p>The toolkit bundle (<code>docs/assets/php-toolkit.zip</code>, ≈1.8&nbsp;MB) ships with the docs, so no third-party CDN is involved.</p>
+</main>
+<footer class="site">
+\t<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
+'''
+
+
+def main():
+    """Write the landing page and one page per component under DOCS as UTF-8 (pages declare charset=utf-8)."""
+    os.makedirs(DOCS, exist_ok=True)  # the landing page is written before any component directory exists
+    with open(os.path.join(DOCS, 'index.html'), 'w', encoding='utf-8') as f:
+        f.write(render_index())
+    for slug, title, lede, install, sections in COMPONENTS:
+        os.makedirs(os.path.join(DOCS, slug), exist_ok=True)
+        with open(os.path.join(DOCS, slug, 'index.html'), 'w', encoding='utf-8') as f:
+            f.write(render_component(slug, title, lede, install, sections))
+        print(f'  wrote {slug}/index.html')
+
+
+if __name__ == '__main__':
+    main()
diff --git a/bin/build-reference.py b/bin/build-reference.py
new file mode 100644
index 000000000..bc95c8991
--- /dev/null
+++ b/bin/build-reference.py
@@ -0,0 +1,223 @@
+#!/usr/bin/env python3
+"""Generates docs/reference/<slug>.html for components not already hand-written.
+Pulls catalog data from _docs_components.py and emits the concept-guide shape:
+lede + install + context paragraphs + minimal example + refinements + pitfalls + see also.
+
+The hand-written reference pages (html, zip) are skipped — they live as
+authored HTML files and we don't overwrite them.
+"""
+
+import json
+import os
+import re
+import sys
+from html import escape as h, unescape
+
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+from _docs_components import COMPONENTS, COMPONENT_RELATIONS, CREDITS
+
+DOCS = os.path.join(os.path.dirname(os.path.abspath(__file__)), '..', 'docs', 'reference')
+EXPECTED_PATH = os.path.join(os.path.dirname(os.path.abspath(__file__)), '_expected_outputs.json')
+ASSET_VERSION = '20260429-rewrite'
+
+EXPECTED = {}
+if os.path.exists(EXPECTED_PATH):
+    with open(EXPECTED_PATH) as f:
+        EXPECTED = {tuple(k.split('::')): v for k, v in json.load(f).items()}
+
+# Skip the hand-written ones.
+SKIP = {'html', 'zip'}
+
+PAGE_HEAD = '''<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>{title} — PHP Toolkit reference</title>
+<meta name="description" content="{description}">
+<link rel="stylesheet" href="../assets/style.css?v={asset_version}">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v={asset_version}" defer></script>
+</head>
+<body>
+<header class="site">
+\t<a class="brand" href="../">PHP Toolkit</a>
+\t<nav>
+\t\t<a href="../learn/">Learn</a>
+\t\t<a href="./">Reference</a>
+\t\t<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+\t</nav>
+</header>
+
+<div class="layout">
+'''
+
+PAGE_FOOT = '''\t</article>
+</div>
+
+<footer class="site">
+\t<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
+'''
+
+
+def slugify(text):  # heading text -> id: lowercase, drop chars that are not word/space/hyphen, spaces to '-'
+    return re.sub(r'[^\w\s-]', '', text.lower()).strip().replace(' ', '-')
+
+
+def split_pitfalls(body_html):
+    """Pull out <p> paragraphs that begin with 'Footgun' or 'Gotcha' as pitfall callouts; every
+    other piece of markup is kept, in order. Return (rest_html, [pitfall_html, ...])."""
+    pitfalls = []
+    rest = []
+    # re.split with a capture group alternates non-<p> markup (even index) and <p> blocks (odd index).
+    for i, chunk in enumerate(re.split(r'(<p>.*?</p>)', body_html, flags=re.DOTALL)):
+        plain = re.sub(r'<[^>]+>', '', chunk).strip()
+        if i % 2 and plain.lower().startswith(('footgun', 'gotcha')):
+            inner = chunk[3:-4]  # strip <p>...</p>
+            inner = re.sub(r'^<strong>(Footgun|Gotcha)[^<]*</strong>\s*[—:.\s]*', '', inner)
+            pitfalls.append(re.sub(r'^(Footgun|Gotcha)[\s—–:.-]*', '', inner).strip())
+        else:
+            rest.append(chunk)
+    return ''.join(rest), pitfalls
+
+
+def snippet_block(slug, name, code, runnable=True):
+    """Wrap PHP code (and any recorded output for a runnable snippet) in a <php-snippet> element."""
+    def guard(text):
+        # Keep a literal closing tag in the payload from ending the <script> element early.
+        return text.rstrip().replace('</script', '<\\/script')
+
+    parts = [f'<php-snippet blueprint="toolkit-setup" name="{h(name)}"']
+    parts.append('>\n' if runnable else ' runnable="false">\n')
+    parts.append(f'<script type="application/x-php">\n{guard(code)}\n</script>\n')
+    recorded = EXPECTED.get((slug, name)) if runnable else None
+    if recorded is not None:
+        parts.append(
+            f'<script type="text/expected-output">\n{guard(recorded)}\n</script>\n'
+        )
+    parts.append('</php-snippet>\n')
+    return ''.join(parts)
+
+
+def render_example(slug, snippet):
+    # snippet is (name, code[, runnable]); a missing third item means runnable.
+    flag = snippet[2] if len(snippet) >= 3 else True
+    return snippet_block(slug, snippet[0], snippet[1], flag)
+
+
+def sidebar(current_slug):
+    """Build the reference sidebar: an empty TOC <nav> plus links to all components.
+
+    Every component links to '<slug>.html' in the same directory, both the pages
+    generated by this script and the hand-written ones listed in SKIP. The entry
+    whose slug equals current_slug gets class="current".
+    """
+    items = []
+    for slug, title, _, _, _ in COMPONENTS:
+        href = f'{slug}.html'
+        cls = ' class="current"' if slug == current_slug else ''
+        items.append(f'\t\t\t<li{cls}><a href="{href}">{h(title)}</a></li>')
+    return (
+        '\t<aside class="sidebar" aria-label="Reference navigation">\n'
+        '\t\t<button class="sidebar-toggle" type="button" aria-expanded="false">'
+        'On this page ▾</button>\n'
+        '\t\t<nav class="toc" aria-label="Table of contents"></nav>\n'
+        '\t\t<details class="components-nav" open>\n'
+        '\t\t\t<summary>All components</summary>\n'
+        '\t\t\t<ol>\n'
+        + '\n'.join(items) + '\n'
+        '\t\t\t</ol>\n'
+        '\t\t</details>\n'
+        '\t</aside>\n'
+    )
+
+
+def render_component(slug, title, lede, install, sections):
+    """Render one reference page; a leading 'Why this exists' section becomes the untitled intro."""
+    purpose_html = ''
+    pitfalls_from_purpose = []
+    usage = sections
+    if sections and sections[0][0].lower() == 'why this exists':
+        _, body, _ = sections[0]
+        purpose_html, pitfalls_from_purpose = split_pitfalls(body or '')
+        usage = sections[1:]
+
+    out = [PAGE_HEAD.format(
+        title=h(title),
+        description=h(re.sub(r'<[^>]+>', '', lede)),
+        asset_version=ASSET_VERSION,
+    )]
+    out.append(sidebar(slug))
+    out.append('\t<article class="content">\n\n')
+    out.append(f'<h1>{h(title)}</h1>\n\n')
+    out.append(f'<p class="lede">{lede}</p>\n\n')
+    if install:
+        out.append(f'<pre><code class="install">composer require {h(install)}</code></pre>\n\n')
+    if slug in CREDITS:
+        title_credit, body_credit = CREDITS[slug]
+        out.append(
+            '<aside class="callout credit">\n'
+            f'\t<strong>{h(title_credit)}.</strong> {body_credit}\n'
+            '</aside>\n\n'
+        )
+    if purpose_html:
+        out.append(purpose_html + '\n\n')
+
+    # Worked examples + accumulated pitfalls.
+    pitfalls = list(pitfalls_from_purpose)
+    minimal_emitted = False
+    for heading, body_html, snippet in usage:
+        # Bodies are already HTML: pass them through as-is so &lt;tag&gt; stays escaped text.
+        rest, found = split_pitfalls(body_html or '')
+        pitfalls.extend(found)
+        h2 = heading
+        if not minimal_emitted and snippet:
+            h2 = 'A minimal example'
+            minimal_emitted = True
+        elif snippet:
+            h2 = f'Refinement: {heading[0].lower() + heading[1:]}' if heading else heading
+        out.append(f'<h2 id="{slugify(h2)}">{h(h2)}</h2>\n\n')
+        if rest:
+            out.append(rest + '\n\n')
+        if snippet:
+            out.append(render_example(slug, snippet) + '\n')
+
+    if pitfalls:
+        out.append('<h2 id="pitfalls">Pitfalls</h2>\n\n')
+        for p in pitfalls:
+            out.append(f'<aside class="callout pitfall">{p}</aside>\n\n')
+
+    related = COMPONENT_RELATIONS.get(slug, ())
+    if related:
+        out.append('<h2 id="see-also">See also</h2>\n\n')
+        out.append('<ul class="related-components">\n')
+        for rel_slug, rel_title, reason in related:
+            href = f'{rel_slug}.html'
+            out.append(
+                f'\t<li><a href="{href}"><strong>{h(rel_title)}</strong></a>'
+                f'<span>{reason}</span></li>\n'
+            )
+        out.append('</ul>\n\n')
+
+    out.append(PAGE_FOOT)
+    return ''.join(out)
+
+
+def main():
+    """Write docs/reference/<slug>.html as UTF-8 for every component not listed in SKIP."""
+    os.makedirs(DOCS, exist_ok=True)
+    for slug, title, lede, install, sections in COMPONENTS:
+        if slug in SKIP:
+            continue
+        out = render_component(slug, title, lede, install, sections)
+        with open(os.path.join(DOCS, f'{slug}.html'), 'w', encoding='utf-8') as f:  # page declares utf-8
+            f.write(out)
+        print(f'wrote reference/{slug}.html')
+
+
+if __name__ == '__main__':
+    main()
diff --git a/bin/run-snippets.py b/bin/run-snippets.py
new file mode 100755
index 000000000..950f37747
--- /dev/null
+++ b/bin/run-snippets.py
@@ -0,0 +1,199 @@
+#!/usr/bin/env python3
+"""
+Runs every PHP snippet in bin/_docs_components.py against the local
+toolkit (`composer install` first, so vendor/autoload.php exists) and
+captures stdout. Used in two ways:
+
+    bin/run-snippets.py --update     Regenerate bin/_expected_outputs.json
+                                     from the snippets that ran successfully.
+    bin/run-snippets.py --check      Run every snippet, compare against the
+                                     committed JSON. Exit nonzero on drift.
+                                     Used by .github/workflows/snippet-tests.yml.
+
+Snippets reference '/wordpress/wp-content/php-toolkit/vendor/autoload.php' —
+the path that exists inside Playground. The runner rewrites that to the
+repo's local vendor/autoload.php before executing.
+
+Snippets marked non-runnable in the catalog are skipped. Snippets that need
+WordPress, network access, or a listening TCP port may still run locally, but
+their expected output is not committed because their stdout is environment-dependent.
+"""
+
+import argparse
+import json
+import os
+import re
+import subprocess
+import sys
+import tempfile
+
+THIS = os.path.dirname(os.path.abspath(__file__))  # directory containing this script
+ROOT = os.path.dirname(THIS)  # parent of that directory
+sys.path.insert(0, THIS)  # lets the sibling-module import below resolve
+from _docs_components import COMPONENTS  # noqa: E402
+
+VENDOR_AUTOLOAD = os.path.join(ROOT, 'vendor', 'autoload.php')  # local autoloader the snippets get pointed at
+EXPECTED_PATH = os.path.join(THIS, '_expected_outputs.json')  # expected-output JSON read and written by main()
+
+# Snippets that can run but whose output isn't stable (real network, timestamps,
+# host-specific values). They are still executed, but a nonzero exit is only listed
+# as a skip and stdout is never stored, so the docs page boots Playground at click time.
+NO_EXPECTED = {
+    ('httpclient', 'get.php'),
+    ('httpclient', 'post.php'),
+    ('httpclient', 'progress.php'),
+    ('httpclient', 'sliding-window.php'),
+    ('httpclient', 'resume-download.php'),
+    ('httpclient', 'stream-unzip.php'),
+    ('httpclient', 'fan-out.php'),
+    ('httpclient', 'stream-to-disk.php'),
+}
+
+PLAYGROUND_AUTOLOAD = "/wordpress/wp-content/php-toolkit/vendor/autoload.php"
+
+# Tiny polyfill so WordPress-only globals don't break local runs.
+# Injected after the autoload require so WP_Block_Parser exists.
+LOCAL_PRELUDE = """
+if ( ! function_exists( 'parse_blocks' ) ) {
+\tfunction parse_blocks( $content ) {
+\t\treturn ( new WP_Block_Parser() )->parse( $content );
+\t}
+}
+"""
+
+
+def rewrite(code):
+    """Swap the Playground autoload path for the local one and inject LOCAL_PRELUDE after the require."""
+    local = code.replace(PLAYGROUND_AUTOLOAD, VENDOR_AUTOLOAD)
+    hit = re.search(r"require\s+'[^']*vendor/autoload\.php';", local)
+    if hit is None:
+        return local  # no autoload require found, so there is nowhere to anchor the prelude
+    return local[:hit.end()] + LOCAL_PRELUDE + local[hit.end():]
+
+
+def run_one(code, timeout=15):
+    """Run a snippet through the php CLI; return (returncode, stdout, stderr), with -1 on timeout."""
+    # UTF-8 is pinned on both sides so non-ASCII snippets and output don't hinge on the locale.
+    with tempfile.NamedTemporaryFile(suffix='.php', mode='w', encoding='utf-8', delete=False) as f:
+        f.write(rewrite(code))
+        path = f.name
+    try:
+        proc = subprocess.run(['php', '-d', 'display_errors=stderr', path], capture_output=True,
+                              text=True, encoding='utf-8', timeout=timeout)
+        return proc.returncode, proc.stdout, proc.stderr
+    except subprocess.TimeoutExpired:
+        return -1, '', f'TIMEOUT after {timeout}s'
+    finally:
+        try:
+            os.unlink(path)  # delete=False above, so cleanup is done here
+        except OSError:
+            pass
+
+
+def normalize(text):
+    """Replace run-dependent output (temp paths, hex suffixes, nonces, commit ids, peak memory) with placeholders."""
+    substitutions = (
+        (r'/tmp/\w+\.zip', '/tmp/<tempfile>.zip'),
+        (r'(/tmp/\w+)(\.epub|\.tmp\.[a-f0-9]+)?', r'/tmp/<tempfile>\2'),
+        (r'sys_get_temp_dir\(\) \. \'/[^\']+', "sys_get_temp_dir() . '/<demo>"),
+        (r'/(toolkit|atomic|copytree|big|orig|repacked|app|book|demo|sample|hash|gz|dl)-[a-f0-9]+', r'/\1-XXXXXX'),
+        (r'\bnonce(?:: |=")([0-9a-f]{16})"?', lambda m: m.group(0).replace(m.group(1), '<random>')),
+        (r'\bcommit: [0-9a-f]{40}\b', 'commit: <oid>'),
+        (r'\bHEAD:\s+[0-9a-f]{40}', 'HEAD: <oid>'),
+        (r'\boid: [0-9a-f]{40}\b', 'oid: <oid>'),
+        (r'merge head: [0-9a-f]{40}', 'merge head: <oid>'),
+        (r'\b[a-f0-9]{7}  ', '<hash>  '),
+        (r'Peak memory: [\d.]+ MB', 'Peak memory: <N> MB'),
+    )
+    for pattern, replacement in substitutions:
+        text = re.sub(pattern, replacement, text)
+    return text
+
+
+def main():
+    """Run every runnable catalog snippet, then verify (default) or regenerate the expected outputs.
+
+    Exits 2 when vendor/autoload.php is missing and 1 when --check finds drift,
+    which includes a snippet that has committed output but no longer runs.
+    """
+    ap = argparse.ArgumentParser()
+    ap.add_argument('--update', action='store_true', help='Regenerate _expected_outputs.json')
+    ap.add_argument('--check', action='store_true', help='Verify against _expected_outputs.json')
+    ap.add_argument('--filter', default=None, help='Only run snippets whose slug or filename match this substring')
+    args = ap.parse_args()
+
+    args.check = args.check or not args.update  # neither flag given: act like --check
+
+    if not os.path.exists(VENDOR_AUTOLOAD):
+        print(f'ERROR: {VENDOR_AUTOLOAD} not found. Run `composer install` first.', file=sys.stderr)
+        sys.exit(2)
+
+    existing = {}
+    if os.path.exists(EXPECTED_PATH):
+        with open(EXPECTED_PATH) as f:
+            existing = {tuple(k.split('::')): v for k, v in json.load(f).items()}
+
+    # A filtered --update re-runs only a subset, so seed it with the committed
+    # entries; otherwise everything the filter excluded would be erased.
+    new = dict(existing) if args.filter else {}
+    failures, drift = [], []
+    ran = 0
+
+    for slug, _, _, _, sections in COMPONENTS:
+        for heading, _, snippet in sections:
+            if not snippet:
+                continue
+            filename, code = snippet[0], snippet[1]
+            if len(snippet) >= 3 and not snippet[2]:
+                continue  # explicitly marked non-runnable
+            if args.filter and args.filter not in slug and args.filter not in filename:
+                continue
+            key = (slug, filename)
+            new.pop(key, None)  # re-running it, so a seeded entry must be re-earned
+            rc, stdout, stderr = run_one(code)
+            if rc != 0:
+                # Snippet can't run locally — leave it out of JSON. The docs
+                # site will boot Playground for it at click time.
+                failures.append((slug, filename, stderr.strip().splitlines()[:2]))
+                if args.check and key in existing:
+                    # Committed output exists for it, so failing now is a regression.
+                    drift.append((slug, filename, 'FAILED TO RUN'))
+                continue
+
+            ran += 1
+            if key in NO_EXPECTED:
+                continue  # ran fine, but its output is neither compared nor stored
+
+            normalized = normalize(stdout)
+            new[key] = normalized
+            if not args.check:
+                continue
+            expected = existing.get(key)
+            if expected is None:
+                drift.append((slug, filename, 'NEW (run --update to add)'))
+            elif normalize(expected) != normalized:
+                drift.append((slug, filename, 'OUTPUT CHANGED'))
+
+    print(f'\nRan {ran} snippets; {len(failures)} couldn\'t run locally.')
+    for slug, filename, why in failures:
+        why_text = ' '.join(why) if why else '(no stderr)'
+        print(f'  skip   {slug}/{filename:<32} {why_text[:80]}')
+    for slug, filename, kind in drift:  # only ever populated under --check
+        print(f'  DRIFT  {slug}/{filename:<32} {kind}')
+
+    if args.update:
+        joined = {'::'.join(k): v for k, v in sorted(new.items())}
+        with open(EXPECTED_PATH, 'w') as f:
+            json.dump(joined, f, indent=2, sort_keys=True)
+            f.write('\n')
+        print(f'\nWrote {len(joined)} expected outputs to {EXPECTED_PATH}')
+        sys.exit(0)
+
+    if drift:
+        print(f'\n{len(drift)} snippet(s) drifted. Run `bin/run-snippets.py --update` to refresh.')
+        sys.exit(1)
+    print('\nAll snippets match expected outputs.')
+
+
+if __name__ == '__main__':
+    main()
diff --git a/bin/serve-docs.py b/bin/serve-docs.py
new file mode 100755
index 000000000..da64cc89c
--- /dev/null
+++ b/bin/serve-docs.py
@@ -0,0 +1,30 @@
+#!/usr/bin/env python3
+"""
+Local dev server for docs/. Adds CORS headers so the WordPress Playground
+iframe can fetch docs/assets/php-toolkit.zip across origins.
+
+GitHub Pages serves Access-Control-Allow-Origin: * by default, so this
+server is only needed for `python3 -m http.server`-equivalent local previews.
+
+Usage:
+    python3 bin/serve-docs.py [port]
+"""
+
+import http.server
+import os
+import sys
+
+PORT = int(sys.argv[1]) if len(sys.argv) > 1 else 8787
+DOCS = os.path.join(os.path.dirname(os.path.abspath(__file__)), '..', 'docs')
+
+
+class CorsHandler(http.server.SimpleHTTPRequestHandler):
+    def end_headers(self):  # tack wildcard CORS headers onto every response
+        for cors_header in ('Access-Control-Allow-Origin', 'Access-Control-Allow-Headers'):
+            self.send_header(cors_header, '*')
+        super().end_headers()
+
+
+os.chdir(DOCS)
+print(f'Serving {DOCS} on http://localhost:{PORT}/')
+http.server.ThreadingHTTPServer(('', PORT), CorsHandler).serve_forever()
diff --git a/components/BlockParser/README.md b/components/BlockParser/README.md
index 2cf95fb97..fa0d7b2b6 100644
--- a/components/BlockParser/README.md
+++ b/components/BlockParser/README.md
@@ -1,218 +1,137 @@
 # BlockParser
 
-A standalone extraction of WordPress core's block parser. It takes a document containing WordPress block markup (`<!-- wp:name -->...<!-- /wp:name -->`) and returns a structured array of parsed blocks with their attributes, inner HTML, inner blocks, and content interleaving. This is the same parser that powers `parse_blocks()` in WordPress core, packaged as an independent library with no WordPress dependency.
+## Why this exists
 
-## Installation
-
-```
-composer require wp-php-toolkit/blockparser
-```
-
-## Quick Start
-
-```php
-$document = <<<HTML
-<!-- wp:heading {"level":2} -->
-<h2>Welcome</h2>
-<!-- /wp:heading -->
+WordPress stores post content as annotated HTML. Instead of inventing a separate file format, it embeds block boundaries directly inside HTML comments:
 
+```html
 <!-- wp:paragraph -->
-<p>Hello from the block editor.</p>
+<p>Hello, world.</p>
 <!-- /wp:paragraph -->
-HTML;
 
-$parser = new WP_Block_Parser();
-$blocks = $parser->parse( $document );
-
-foreach ( $blocks as $block ) {
-    if ( 'core/heading' === $block['blockName'] ) {
-        echo 'Found heading: ' . strip_tags( $block['innerHTML'] );
-        // "Found heading: Welcome"
-    }
-}
+<!-- wp:image {"align":"center","sizeSlug":"large"} -->
+<figure class="wp-block-image aligncenter"><img src="photo.jpg" /></figure>
+<!-- /wp:image -->
 ```
 
-## Usage
-
-### Parsing a Document
+Every WordPress editor, REST API response, and block renderer needs to turn that serialized markup into a structured tree. WordPress core ships `WP_Block_Parser` to do exactly that — but it's buried inside WordPress itself, tied to the full WordPress load. This component extracts it so you can parse block markup anywhere: CLI tools, build scripts, data-migration pipelines, standalone PHP apps — without booting WordPress.
 
-Call `parse()` with any string containing block markup. It returns an array of block arrays, each with the following keys:
+## How it works
 
-```php
-$parser = new WP_Block_Parser();
-$blocks = $parser->parse( $document );
-
-// Each element in $blocks is an array:
-// array(
-//     'blockName'    => 'core/paragraph',   // Fully-qualified block name, or null for freeform HTML.
-//     'attrs'        => array(),             // Attributes from the block comment delimiter.
-//     'innerBlocks'  => array(),             // Nested blocks (same structure, recursive).
-//     'innerHTML'    => '<p>Text</p>',       // The HTML inside the block, with inner blocks removed.
-//     'innerContent' => array( '<p>Text</p>' ), // Interleaved HTML strings and null markers for inner block positions.
-// )
-```
+The parser is a single-pass, stack-based scanner. It moves forward through the document looking for HTML comments that follow the block annotation pattern. When it finds an opening comment like `<!-- wp:image {"align":"center"} -->`, it:
 
-### Block Types
+1. Decodes the JSON attributes from the comment body.
+2. Pushes a frame onto a stack, recording the block name, attributes, and the byte offset where the block started.
+3. Keeps scanning, collecting the raw HTML between the opening and closing comments as `innerHTML`.
+4. If it encounters another `<!-- wp:... -->` before the closing comment, it recurses — pushing a new frame for the inner block.
+5. When it finds a closing comment (`<!-- /wp:image -->`), it pops the frame, attaches any collected inner blocks, and appends the completed block to its parent.
 
-The parser recognizes three kinds of block tokens:
+Freeform content between blocks — plain HTML with no block annotations — becomes a "classic block" with `blockName` set to `null`.
 
-**Standard blocks** have an opener and closer:
+The `innerContent` array is the most subtle part of the output. It interleaves child block positions with raw HTML chunks, letting renderers reconstruct the exact original layout. This is how the columns block describes which raw HTML wraps each inner column.
 
-```php
-$blocks = ( new WP_Block_Parser() )->parse(
-    '<!-- wp:paragraph --><p>Hello</p><!-- /wp:paragraph -->'
-);
-// $blocks[0]['blockName'] === 'core/paragraph'
-// $blocks[0]['innerHTML'] === '<p>Hello</p>'
-```
+## Usage
 
-**Self-closing (void) blocks** end with `/-→`:
+### Parse a post's block content
 
 ```php
-$blocks = ( new WP_Block_Parser() )->parse(
-    '<!-- wp:spacer {"height":"50px"} /-->'
-);
-// $blocks[0]['blockName'] === 'core/spacer'
-// $blocks[0]['attrs']     === array( 'height' => '50px' )
-// $blocks[0]['innerHTML'] === ''
-```
+use WordPress\BlockParser\WP_Block_Parser;
 
-**Freeform HTML** is any content outside of block delimiters:
+$parser = new WP_Block_Parser();
+$blocks = $parser->parse( $post_content );
 
-```php
-$blocks = ( new WP_Block_Parser() )->parse(
-    '<p>Just some HTML, no blocks here.</p>'
-);
-// $blocks[0]['blockName'] === null
-// $blocks[0]['innerHTML'] === '<p>Just some HTML, no blocks here.</p>'
+foreach ( $blocks as $block ) {
+    echo $block['blockName'];   // e.g. "core/paragraph"
+    echo $block['innerHTML'];   // the raw HTML inside the block
+    // $block['attrs']          — decoded JSON attributes
+    // $block['innerBlocks']    — nested blocks (same structure, recursive)
+    // $block['innerContent']   — interleaved HTML chunks + child-block slots
+}
 ```
 
-### Block Attributes
+### Inspect block attributes
 
-Attributes are encoded as JSON inside the block comment delimiter. The parser decodes them into a PHP associative array:
+Attributes are encoded as JSON in the opening comment and decoded automatically:
 
 ```php
-$blocks = ( new WP_Block_Parser() )->parse(
-    '<!-- wp:image {"id":123,"sizeSlug":"large","linkDestination":"none"} -->' .
-    '<figure class="wp-block-image size-large"><img src="photo.jpg" class="wp-image-123"/></figure>' .
-    '<!-- /wp:image -->'
-);
-
-$attrs = $blocks[0]['attrs'];
-// array(
-//     'id'              => 123,
-//     'sizeSlug'        => 'large',
-//     'linkDestination' => 'none',
-// )
+$markup = '<!-- wp:image {"sizeSlug":"large","linkDestination":"none"} -->'
+        . '<figure>...</figure>'
+        . '<!-- /wp:image -->';
+
+$blocks = $parser->parse( $markup );
+echo $blocks[0]['attrs']['sizeSlug'];  // "large"
 ```
 
-### Nested Blocks
+### Walk a nested block tree
 
-Blocks can contain other blocks. Inner blocks appear in the `innerBlocks` array, and `innerContent` interleaves the HTML fragments with `null` markers showing where each inner block was located:
+Blocks can contain other blocks. The `innerBlocks` key holds them recursively:
 
 ```php
-$document = <<<HTML
-<!-- wp:columns -->
-<div class="wp-block-columns">
-<!-- wp:column -->
-<div class="wp-block-column">
-<!-- wp:paragraph -->
-<p>Left column</p>
-<!-- /wp:paragraph -->
-</div>
-<!-- /wp:column -->
-<!-- wp:column -->
-<div class="wp-block-column">
-<!-- wp:paragraph -->
-<p>Right column</p>
-<!-- /wp:paragraph -->
-</div>
-<!-- /wp:column -->
-</div>
-<!-- /wp:columns -->
-HTML;
+function walk( array $blocks, int $depth = 0 ): void {
+    foreach ( $blocks as $block ) {
+        if ( $block['blockName'] === null ) {
+            continue; // skip freeform HTML between blocks
+        }
+        echo str_repeat( '  ', $depth ) . $block['blockName'] . "\n";
+        walk( $block['innerBlocks'], $depth + 1 );
+    }
+}
 
-$parser = new WP_Block_Parser();
-$blocks = $parser->parse( $document );
-
-$columns = $blocks[0];
-// $columns['blockName']   === 'core/columns'
-// count( $columns['innerBlocks'] ) === 2
-
-$left_column = $columns['innerBlocks'][0];
-// $left_column['blockName'] === 'core/column'
-// $left_column['innerBlocks'][0]['blockName'] === 'core/paragraph'
-
-// innerContent shows the interleaving of HTML and inner block positions:
-// array(
-//     '<div class="wp-block-columns">\n',  // HTML before first inner block
-//     null,                                 // Position of first inner block (core/column)
-//     '\n',                                 // HTML between inner blocks
-//     null,                                 // Position of second inner block (core/column)
-//     '\n</div>\n',                         // HTML after last inner block
-// )
+walk( $parser->parse( $post_content ) );
+// core/columns
+//   core/column
+//     core/paragraph
+//   core/column
+//     core/image
 ```
 
-### Namespaced Blocks
+### Reconstruct output using innerContent
 
-The parser handles both core blocks (`wp:paragraph`) and namespaced third-party blocks (`wp:my-plugin/custom-block`). Block names without an explicit namespace are prefixed with `core/`:
+The `innerContent` array lets you rebuild the original markup while swapping in rendered child blocks:
 
 ```php
-$blocks = ( new WP_Block_Parser() )->parse(
-    '<!-- wp:my-plugin/testimonial {"author":"Jane"} -->' .
-    '<blockquote>Great product!</blockquote>' .
-    '<!-- /wp:my-plugin/testimonial -->'
-);
-// $blocks[0]['blockName'] === 'my-plugin/testimonial'
-// $blocks[0]['attrs']     === array( 'author' => 'Jane' )
-```
+function render_block( array $block ): string {
+    $output      = '';
+    $child_index = 0;
+
+    foreach ( $block['innerContent'] as $chunk ) {
+        if ( is_string( $chunk ) ) {
+            $output .= $chunk;
+        } else {
+            // null = "insert rendered child block here"
+            $output .= render_block( $block['innerBlocks'][ $child_index++ ] );
+        }
+    }
 
-### Error Recovery
+    return $output;
+}
+```
 
-The parser is designed to never fail. When it encounters malformed markup such as missing closers or mismatched block names, it produces a best-effort parse rather than returning an error:
+### Find all blocks of a specific type
 
 ```php
-// Missing closer -- the parser treats it as implicitly closed.
-$blocks = ( new WP_Block_Parser() )->parse(
-    '<!-- wp:paragraph --><p>No closer here'
-);
-// $blocks[0]['blockName'] === 'core/paragraph'
-// $blocks[0]['innerHTML'] === '<p>No closer here'
-```
-
-## API Reference
+function find_blocks( array $blocks, string $name ): array {
+    $found = array();
+    foreach ( $blocks as $block ) {
+        if ( $block['blockName'] === $name ) {
+            $found[] = $block;
+        }
+        $found = array_merge( $found, find_blocks( $block['innerBlocks'], $name ) );
+    }
+    return $found;
+}
 
-### WP_Block_Parser
+$images = find_blocks( $parser->parse( $post_content ), 'core/image' );
+```
 
-| Method | Description |
-|--------|-------------|
-| `parse( $document )` | Parse block markup and return an array of block structures |
+## Block structure reference
 
-### Block Structure (array keys)
+Each parsed block is an associative array:
 
 | Key | Type | Description |
 |-----|------|-------------|
-| `blockName` | `string\|null` | Fully-qualified name (e.g. `core/paragraph`), or `null` for freeform HTML |
-| `attrs` | `array` | Block attributes decoded from the JSON in the comment delimiter |
-| `innerBlocks` | `array` | Nested blocks, same structure recursively |
-| `innerHTML` | `string` | HTML content with inner blocks stripped out |
-| `innerContent` | `array` | Interleaved HTML strings and `null` markers for inner block positions |
-
-### WP_Block_Parser_Block
-
-| Property | Type | Description |
-|----------|------|-------------|
-| `$blockName` | `string\|null` | Block name |
-| `$attrs` | `array\|null` | Block attributes |
-| `$innerBlocks` | `array` | Nested block instances |
-| `$innerHTML` | `string` | Inner HTML content |
-| `$innerContent` | `array` | Interleaved content with `null` placeholders |
-
-## Attribution
-
-This component is extracted from [WordPress core](https://github.com/WordPress/wordpress-develop). The `WP_Block_Parser`, `WP_Block_Parser_Block`, and `WP_Block_Parser_Frame` classes are maintained as part of the WordPress block editor infrastructure. Licensed under GPL v2.
-
-## Requirements
-
-- PHP 7.2+
-- No external dependencies
+| `blockName` | `string\|null` | Namespaced block name, e.g. `"core/paragraph"`. `null` for classic/freeform content between blocks. |
+| `attrs` | `array` | Decoded JSON attributes from the opening comment. Empty array if none. |
+| `innerBlocks` | `array` | Recursively parsed child blocks in order of appearance. |
+| `innerHTML` | `string` | The HTML between the opening and closing comments with any inner blocks removed; use `innerContent` to see where they sat. |
+| `innerContent` | `array` | Interleaved array: strings are raw HTML chunks, `null` values mark positions where a child block from `innerBlocks` should be inserted. |
diff --git a/components/Filesystem/README.md b/components/Filesystem/README.md
index 17a605415..153d0e525 100644
--- a/components/Filesystem/README.md
+++ b/components/Filesystem/README.md
@@ -1,240 +1,141 @@
 # Filesystem
 
-A unified filesystem abstraction that lets you work with local disks, in-memory trees, SQLite-backed storage, and other backends through a single interface. Every implementation uses forward slashes as path separators regardless of the host OS, so code that works on Linux works identically on Windows and macOS.
+## Why this exists
 
-## Installation
+PHP's built-in file functions (`file_get_contents`, `fopen`, `mkdir`, etc.) are tightly coupled to the local disk. That's fine for simple scripts, but it creates a real problem when you want to:
 
-```bash
-composer require wp-php-toolkit/filesystem
-```
-
-## Quick Start
-
-```php
-use WordPress\Filesystem\InMemoryFilesystem;
+- **Test code without touching the disk.** Unit tests that create real files are slow, fragile, and leave cleanup responsibilities behind.
+- **Work with non-disk storage.** WordPress Playground runs entirely in the browser using a virtual filesystem backed by a SQLite database. Your code needs to work the same way against both a real disk and an in-memory tree.
+- **Operate on ZIP archives as if they were directories.** Instead of extracting first and then reading, you want to walk a ZIP file the same way you'd walk a folder.
+- **Stay portable across operating systems.** Windows uses backslashes; everything else uses forward slashes. Code that hardcodes separators breaks on the other platform.
 
-$fs = InMemoryFilesystem::create();
-$fs->mkdir( '/docs' );
-$fs->put_contents( '/docs/readme.txt', 'Hello, world!' );
-echo $fs->get_contents( '/docs/readme.txt' ); // "Hello, world!"
-```
+This component defines a single `Filesystem` interface and several implementations behind it. Write your code against the interface once, and it works against any backend.
 
-## Usage
-
-### Local Filesystem
-
-`LocalFilesystem` wraps the real disk. Pass a root directory to `create()` and all paths are resolved relative to it.
-
-```php
-use WordPress\Filesystem\LocalFilesystem;
+## How it works
 
-$fs = LocalFilesystem::create( '/var/www/mysite' );
+The `Filesystem` interface defines the operations every backend must support: listing directories, reading and writing files, checking existence, copying, renaming, deleting. Implementations handle the translation to whatever storage mechanism is underneath.
 
-// Write and read files
-$fs->put_contents( '/config.json', '{"debug": true}' );
-echo $fs->get_contents( '/config.json' ); // '{"debug": true}'
+All paths use forward slashes (`/`) regardless of OS. On Windows, the `LocalFilesystem` translates them to backslashes internally, but your code never sees that.
 
-// Directory operations
-$fs->mkdir( '/uploads/2024', array( 'recursive' => true ) );
-$fs->put_contents( '/uploads/2024/photo.txt', 'image data here' );
+Reads and writes are stream-based under the hood. `open_read_stream()` returns a handle you can read in chunks; `open_write_stream()` gives you a handle to write to. `get_contents()` and `put_contents()` are convenience wrappers that read or write the entire file at once.
 
-// List directory contents
-$entries = $fs->ls( '/uploads/2024' ); // ['photo.txt']
+The `FilesystemVisitor` handles recursive tree traversal, emitting events for each directory and file it encounters.
 
-// Check paths
-$fs->is_dir( '/uploads' );   // true
-$fs->is_file( '/config.json' ); // true
-$fs->exists( '/missing' );     // false
-```
+### The implementations
 
-Without a root argument, `LocalFilesystem::create()` defaults to the system root (`/` on Unix, the system drive on Windows).
+**`LocalFilesystem`** — wraps PHP's built-in file functions. Works on the actual disk.
 
-### In-Memory Filesystem
+**`InMemoryFilesystem`** — stores everything in a PHP array. Fast, zero I/O, perfect for tests and ephemeral scratch space.
 
-`InMemoryFilesystem` stores everything in PHP arrays. It is useful for tests, temporary processing, and anywhere you need a fast, disposable filesystem.
+**`SQLiteFilesystem`** — stores files in a SQLite database. Used by WordPress Playground to persist a WordPress installation in a single database file that can be serialized, snapshotted, and restored.
 
-```php
-use WordPress\Filesystem\InMemoryFilesystem;
+**`ZipFilesystem`** (from the Zip component) — mounts a ZIP archive as a read-only directory tree.
 
-$fs = InMemoryFilesystem::create();
+**`UploadedFilesystem`** — wraps another filesystem and tracks which paths were written, for auditing what an operation produced.
 
-$fs->mkdir( '/src/components', array( 'recursive' => true ) );
-$fs->put_contents( '/src/components/button.php', '<?php // button' );
-$fs->put_contents( '/src/components/form.php', '<?php // form' );
+### ChrootLayer
 
-$files = $fs->ls( '/src/components' ); // ['button.php', 'form.php']
-```
+Many factory methods wrap a filesystem in a `ChrootLayer`, which jails all path operations to a specific root directory. This prevents code from accidentally escaping to `/` and makes it safe to hand a filesystem object to untrusted code.
 
-### SQLite Filesystem
+## Usage
 
-`SQLiteFilesystem` persists files and directories in a SQLite database. It requires the `sqlite3` PHP extension (dev-only dependency, not required by the library at runtime).
+### Read a file
 
 ```php
-use WordPress\Filesystem\SQLiteFilesystem;
-
-// In-memory SQLite database
-$fs = SQLiteFilesystem::create( ':memory:' );
+use WordPress\Filesystem\LocalFilesystem;
 
-// Or persist to a file
-$fs = SQLiteFilesystem::create( '/tmp/my-files.sqlite' );
+$fs = new LocalFilesystem( '/var/www/html' );
 
-$fs->mkdir( '/data' );
-$fs->put_contents( '/data/report.csv', 'id,name\n1,Alice' );
-echo $fs->get_contents( '/data/report.csv' );
+if ( $fs->is_file( '/wp-config.php' ) ) {
+    $contents = $fs->get_contents( '/wp-config.php' );
+}
 ```
 
-### File and Directory Operations
-
-All filesystem implementations share the same interface. These operations work identically across backends.
+### Write a file
 
 ```php
-// Rename (move) a file
-$fs->put_contents( '/old-name.txt', 'content' );
-$fs->rename( '/old-name.txt', '/new-name.txt' );
-
-// Copy a file
-$fs->put_contents( '/source.txt', 'content' );
-$fs->copy( '/source.txt', '/dest.txt' );
-
-// Copy a directory tree
-$fs->mkdir( '/src/lib', array( 'recursive' => true ) );
-$fs->put_contents( '/src/lib/utils.php', '<?php // utils' );
-$fs->copy( '/src', '/backup', array( 'recursive' => true ) );
-echo $fs->get_contents( '/backup/lib/utils.php' ); // '<?php // utils'
-
-// Remove files and directories
-$fs->rm( '/dest.txt' );
-$fs->rmdir( '/backup', array( 'recursive' => true ) );
+$fs->put_contents( '/uploads/hello.txt', 'Hello, world.' );
 ```
 
-### Streaming Reads and Writes
-
-Every filesystem can open byte streams for reading and writing. This integrates with the ByteStream component for chunk-based processing of large files.
+### List a directory
 
 ```php
-// Write via stream
-$writer = $fs->open_write_stream( '/output.bin' );
-$writer->append_bytes( 'chunk 1' );
-$writer->append_bytes( 'chunk 2' );
-$writer->close_writing();
-
-// Read via stream
-$reader = $fs->open_read_stream( '/output.bin' );
-$contents = $reader->consume_all();
-$reader->close_reading();
+foreach ( $fs->ls( '/wp-content/plugins' ) as $name ) {
+    echo $name . "\n";  // plugin directory names only, not full paths
+}
 ```
 
-### Copying Between Filesystems
+### Use an in-memory filesystem for tests
 
-The `copy_between_filesystems()` function streams data from one filesystem to another, even across different backends.
+Because your code accepts a `Filesystem` interface, you can swap in `InMemoryFilesystem` in tests without changing anything else:
 
 ```php
-use WordPress\Filesystem\LocalFilesystem;
 use WordPress\Filesystem\InMemoryFilesystem;
 
-use function WordPress\Filesystem\copy_between_filesystems;
-
-$local = LocalFilesystem::create( '/var/www/site' );
-$memory = InMemoryFilesystem::create();
+$fs = new InMemoryFilesystem();
+$fs->put_contents( '/config.json', json_encode( [ 'debug' => true ] ) );
 
-// Copy an entire directory tree from disk into memory
-copy_between_filesystems( array(
-    'source_filesystem' => $local,
-    'source_path'       => '/wp-content/themes/flavor',
-    'target_filesystem' => $memory,
-    'target_path'       => '/theme',
-) );
-
-echo $memory->get_contents( '/theme/style.css' );
+// Pass $fs to the code under test — it never touches the real disk.
+$result = my_config_loader( $fs );
 ```
 
-### Traversing a Filesystem
-
-`FilesystemVisitor` walks a filesystem tree depth-first, emitting enter and exit events for each directory along with its files.
+### Walk a directory tree
 
 ```php
 use WordPress\Filesystem\Visitor\FilesystemVisitor;
-use WordPress\Filesystem\Visitor\FileVisitorEvent;
 
-$visitor = new FilesystemVisitor( $fs );
+$visitor = new FilesystemVisitor( $fs, '/' );
 while ( $visitor->next() ) {
     $event = $visitor->get_event();
-    if ( $event->is_entering() ) {
-        echo "Entering: " . $event->dir . "\n";
-        foreach ( $event->files as $file ) {
-            echo "  File: " . $file . "\n";
-        }
-    }
+    echo $event->get_path() . ( $event->is_dir() ? '/' : '' ) . "\n";
 }
 ```
 
-### Path Helpers
+### Stream large files
 
-The Filesystem component provides Unix-style path utilities that behave consistently on every OS.
+For large files, streaming avoids loading everything into memory at once:
 
 ```php
-use function WordPress\Filesystem\wp_join_unix_paths;
-use function WordPress\Filesystem\wp_unix_dirname;
-use function WordPress\Filesystem\wp_unix_path_resolve_dots;
+$read_stream  = $fs->open_read_stream( '/large-export.sql' );
+$write_stream = $fs->open_write_stream( '/large-export-copy.sql' );
 
-// Join path segments, collapsing duplicate slashes
-echo wp_join_unix_paths( '/var/www', 'site', 'index.php' );
-// "/var/www/site/index.php"
+while ( ! $read_stream->is_finished() ) {
+    $chunk = $read_stream->read( 65536 );  // 64 KB at a time
+    $write_stream->write( $chunk );
+}
+
+$read_stream->close();
+$write_stream->close();
+```
 
-// Get the parent directory
-echo wp_unix_dirname( '/var/www/site/index.php' );
-// "/var/www/site"
+### Copy files between different backends
 
-// Resolve . and .. segments
-echo wp_unix_path_resolve_dots( '/var/www/site/../other/./page.php' );
-// "/var/www/other/page.php"
+Because every backend speaks the same interface, you can copy between them directly:
+
+```php
+use WordPress\Filesystem\LocalFilesystem;
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Filesystem\Visitor\FilesystemVisitor;
+
+$local  = new LocalFilesystem( '/var/www/html' );
+$memory = new InMemoryFilesystem();
+
+// Copy everything from disk to memory.
+$visitor = new FilesystemVisitor( $local, '/' );
+while ( $visitor->next() ) {
+    $event = $visitor->get_event();
+    $path  = $event->get_path();
+    if ( $event->is_file() ) {
+        $memory->put_contents( $path, $local->get_contents( $path ) );
+    } elseif ( $event->is_dir() ) {
+        $memory->mkdir( $path );
+    }
+}
 ```
 
-## API Reference
-
-### Filesystem Interface
-
-All implementations provide these methods:
-
-| Method | Description |
-|---|---|
-| `ls( $dir )` | List entries in a directory |
-| `is_dir( $path )` | Check if path is a directory |
-| `is_file( $path )` | Check if path is a file |
-| `exists( $path )` | Check if path exists |
-| `mkdir( $path, $options )` | Create a directory. Use `['recursive' => true]` for nested paths |
-| `rm( $path )` | Remove a file |
-| `rmdir( $path, $options )` | Remove a directory. Use `['recursive' => true]` for non-empty dirs |
-| `put_contents( $path, $data )` | Write a string to a file |
-| `get_contents( $path )` | Read a file into a string |
-| `open_read_stream( $path )` | Open a `ByteReadStream` for chunk-based reading |
-| `open_write_stream( $path )` | Open a `ByteWriteStream` for chunk-based writing |
-| `copy( $from, $to, $options )` | Copy a file or directory |
-| `rename( $from, $to )` | Move/rename a file or directory |
-
-### Implementations
-
-| Class | Description |
-|---|---|
-| `LocalFilesystem` | Wraps the real disk via `LocalFilesystem::create( $root )` |
-| `InMemoryFilesystem` | Array-backed filesystem via `InMemoryFilesystem::create()` |
-| `SQLiteFilesystem` | SQLite-backed filesystem via `SQLiteFilesystem::create( $path )` |
-| `UploadedFilesystem` | Read-only filesystem for handling REST API file uploads |
-
-Other packages extend this interface with additional backends: `GitFilesystem` (from the Git component) and `ZipFilesystem` (from the Zip component).
-
-### Helper Functions
-
-| Function | Description |
-|---|---|
-| `wp_join_unix_paths( ...$segments )` | Join path segments with forward slashes |
-| `wp_unix_dirname( $path )` | Get parent directory (Unix semantics on all OSes) |
-| `wp_unix_path_resolve_dots( $path )` | Resolve `.` and `..` segments |
-| `wp_unix_sys_get_temp_dir()` | Like `sys_get_temp_dir()` but always uses forward slashes |
-| `copy_between_filesystems( $args )` | Stream data between two filesystem instances |
-| `pipe_stream( $from, $to )` | Pipe a read stream into a write stream |
-
-## Requirements
-
-- PHP 7.2+
-- No external dependencies (SQLiteFilesystem requires the `sqlite3` extension, which is a dev-only dependency)
+## Path conventions
+
+- Always use forward slashes: `/wp-content/uploads/photo.jpg`.
+- Paths are absolute from the filesystem root. The root itself is `/`.
+- On Windows, `LocalFilesystem` converts slashes internally; you never need to use `DIRECTORY_SEPARATOR`.
+- `ChrootLayer` jails all paths to the configured root. A path of `/` inside a chrooted filesystem refers to the configured root directory on disk, not the actual system root.
diff --git a/components/Git/README.md b/components/Git/README.md
index ed61f56d2..0cd7213d1 100644
--- a/components/Git/README.md
+++ b/components/Git/README.md
@@ -1,229 +1,129 @@
 # Git
 
-A pure PHP implementation of a Git client and server. It can create repositories, read and write objects, commit files, manage branches, diff, merge, and communicate with remote servers over HTTP -- all without shelling out to the `git` binary or requiring any native extensions.
+## Why this exists
 
-## Installation
+Git is typically used through the `git` binary — a compiled C program that reads and writes the repository on disk. That's perfect for most development workflows, but it breaks down in a few important scenarios:
 
-```bash
-composer require wp-php-toolkit/git
-```
+- **Serverless and sandboxed environments.** WordPress Playground runs PHP entirely in the browser via WebAssembly. There is no OS, no filesystem, no ability to exec a subprocess. Yet Playground needs to clone, commit, and push WordPress installations as Git repositories.
+- **Programmatic repository manipulation.** Sometimes you want to create commits, rewrite history, or sync files between repositories entirely from PHP — without spawning a shell process or depending on the `git` binary being installed.
+- **Embedding Git into a PHP application.** Build tools, deployment systems, and migration scripts often need to produce or consume Git repositories without a dependency on libgit2 or similar native libraries.
 
-## Quick Start
+This component implements the Git object model, pack protocol, and HTTP smart transport in pure PHP. It can talk to any standard Git remote — GitHub, GitLab, Gitea, self-hosted — using only PHP's HTTP client.
 
-```php
-use WordPress\Filesystem\InMemoryFilesystem;
-use WordPress\Git\GitRepository;
-use WordPress\Git\Model\Commit;
-
-// Create a repository backed by an in-memory filesystem.
-// You can also use a local filesystem for on-disk storage.
-$repo = new GitRepository( InMemoryFilesystem::create() );
-
-// Commit files directly -- the repository builds the
-// blob, tree, and commit objects for you.
-$commit_oid = $repo->commit( array(
-    'updates' => array(
-        'README.md'          => '# My Project',
-        'src/hello-world.php' => '<?php echo "Hello!";',
-    ),
-) );
-
-// Read a file back from the latest commit.
-$contents = $repo->read_object_by_path( '/README.md' )->consume_all();
-// "# My Project"
-```
+## How it works
 
-## Usage
+Git's data model is simpler than it looks. Everything is content-addressed: the SHA-1 hash of an object's content is its name. There are four object types:
 
-### Creating and reading objects
+- **blob** — file content, nothing else.
+- **tree** — a directory listing: each entry maps a filename to either a blob hash (file) or another tree hash (subdirectory).
+- **commit** — a snapshot: it points to a tree (the root of the working directory), zero or more parent commit hashes, and metadata like the author and message.
+- **tag** — a named pointer to another object (usually a commit).
+
+When you commit a file, Git stores the file content as a blob, builds a tree structure from the directory layout, and creates a commit object that records which tree represents the project state at that moment. Branches are just named pointers to commit hashes stored in `refs/heads/`.
+
+`GitRepository` handles all of this. Give it a `Filesystem` object to use as backing storage, and it reads and writes Git objects directly into the `.git` directory structure. `GitRemote` handles the HTTP smart protocol — fetching a list of remote refs, downloading pack files, uploading missing objects.
+
+`GitFilesystem` wraps a `GitRepository` and exposes the contents of a specific commit through the standard `Filesystem` interface, so the rest of your code doesn't need to know it's reading from a Git object store.
+
+## Usage
 
-Every piece of data in Git is an object identified by its SHA-1 hash. You can create blobs, trees, and commits directly:
+### Create a new repository and make a commit
 
 ```php
-use WordPress\Filesystem\InMemoryFilesystem;
 use WordPress\Git\GitRepository;
+use WordPress\Filesystem\InMemoryFilesystem;
 
-$repo = new GitRepository( InMemoryFilesystem::create() );
+$fs   = new InMemoryFilesystem();
+$repo = new GitRepository( $fs );
+$repo->init();
 
-// Store a blob and get its SHA-1 hash.
-$blob_oid = $repo->add_object( 'blob', 'Hello, world!' );
-// "5dd01c177f5d7d1be5346a5bc18a569a7410c2ef"
+// Write a file to the working directory...
+$fs->put_contents( '/hello.txt', 'Hello, world.' );
 
-// Read it back.
-$reader = $repo->read_object( $blob_oid );
-$reader->pull( 8096 );
-$data = $reader->peek( 8096 );
-// "Hello, world!"
+// ...then stage and commit it.
+$repo->stage_files( array( 'hello.txt' ) );
+$repo->commit( 'Initial commit', 'Author Name', 'author@example.com' );
 ```
 
-### Committing files
-
-The `commit()` method handles building the tree hierarchy, creating blob objects, and wiring up parent commits automatically:
+### Read a file from a specific commit
 
 ```php
-use WordPress\Filesystem\InMemoryFilesystem;
-use WordPress\Git\GitRepository;
+use WordPress\Git\GitFilesystem;
+
+// Mount the HEAD commit as a filesystem.
+$git_fs = new GitFilesystem( $repo, 'HEAD' );
 
-$repo = new GitRepository( InMemoryFilesystem::create() );
-
-// First commit.
-$first_oid = $repo->commit( array(
-    'updates' => array(
-        'dir1/file1.txt' => 'Initial content of file1',
-        'dir2/file2.txt' => 'Initial content of file2',
-    ),
-) );
-
-// Second commit -- only the changed files are updated.
-$second_oid = $repo->commit( array(
-    'updates' => array(
-        'dir1/file1.txt' => 'Updated file1',
-    ),
-) );
-
-// Delete a file in a commit.
-$third_oid = $repo->commit( array(
-    'deletes' => array( 'dir2/file2.txt' ),
-) );
+$contents = $git_fs->get_contents( '/hello.txt' );
+// "Hello, world."
 ```
 
-### Branch management
+### Clone from a remote
 
 ```php
-use WordPress\Filesystem\InMemoryFilesystem;
 use WordPress\Git\GitRepository;
+use WordPress\Git\GitRemote;
+use WordPress\Filesystem\LocalFilesystem;
 
-$repo = new GitRepository( InMemoryFilesystem::create() );
-$initial_oid = $repo->commit( array(
-    'updates' => array( 'file.txt' => 'initial' ),
-) );
-
-// Create a new branch pointing at the current commit.
-$repo->create_branch( 'refs/heads/feature', $initial_oid );
-
-// Switch to it.
-$repo->checkout( 'refs/heads/feature' );
+$fs   = new LocalFilesystem( '/tmp/my-clone' );
+$repo = new GitRepository( $fs );
+$repo->init();
 
-// Commit on the new branch.
-$repo->commit( array(
-    'updates' => array( 'file.txt' => 'changed on feature' ),
-) );
-
-// Switch back to the default branch.
-$repo->checkout( 'refs/heads/trunk' );
+$repo->add_remote( 'origin', 'https://github.com/WordPress/wordpress-develop' );
+$remote = $repo->get_remote_client( 'origin' );
 
-// Read the current branch tip hash.
-$head_hash = $repo->get_branch_tip( 'HEAD' );
+// Fetch the default branch.
+$remote->fetch( 'refs/heads/trunk' );
 ```
 
-### Merging
+### Push to a remote
 
 ```php
-$repo->checkout( 'refs/heads/trunk' );
-$result = $repo->merge( 'refs/heads/feature' );
-
-// $result['new_head'] -- the hash of the merge commit
-// $result['conflicts'] -- array of conflicting paths (empty if none)
+$remote = $repo->get_remote_client( 'origin' );
+$remote->push( 'refs/heads/my-branch' );
 ```
 
-### Using GitFilesystem
-
-`GitFilesystem` wraps a `GitRepository` with the standard `Filesystem` interface, so you can read and write files as if working with a regular filesystem. Each write creates a new commit.
+### Read the commit log
 
 ```php
-use WordPress\Filesystem\InMemoryFilesystem;
-use WordPress\Git\GitFilesystem;
-use WordPress\Git\GitRepository;
-use WordPress\Git\Model\Commit;
-
-$repo = new GitRepository( InMemoryFilesystem::create() );
-$repo->commit( array(
-    'updates' => array(
-        'README.md'                    => 'Hello, world!',
-        'subdirectory/hello-world.txt' => 'Hello, world!',
-    ),
-) );
-
-$fs = GitFilesystem::create( $repo );
+$head   = $repo->get_head();
+$commit = $repo->read_commit( $head );
 
-$fs->ls( '/' );
-// ['README.md', 'subdirectory']
+while ( $commit !== null ) {
+    echo $commit->message . "\n";
+    echo '  by ' . $commit->author_name . ' <' . $commit->author_email . ">\n";
 
-$fs->is_file( '/README.md' );           // true
-$fs->is_dir( '/subdirectory' );          // true
-$fs->get_contents( '/README.md' );       // "Hello, world!"
-
-// Writing creates a new commit automatically.
-$fs->put_contents( '/new-file.txt', 'content' );
-
-// Rename a directory.
-$fs->rename( '/subdirectory', '/renamed' );
+    $parent_hash = $commit->parent_hash;
+    $commit      = $parent_hash ? $repo->read_commit( $parent_hash ) : null;
+}
 ```
 
-### Working with remotes
+### Diff two commits
 
 ```php
-use WordPress\Filesystem\InMemoryFilesystem;
-use WordPress\Git\GitRepository;
+$changes = $repo->diff( $commit_hash_a, $commit_hash_b );
 
-$repo = new GitRepository( InMemoryFilesystem::create() );
-$repo->add_remote( 'origin', 'https://github.com/user/repo' );
+foreach ( $changes as $path => $change ) {
+    echo $change['status'] . ' ' . $path . "\n";
+    // 'A' = added, 'M' = modified, 'D' = deleted
+}
+```
 
-$remote = $repo->get_remote_client( 'origin' );
+### Use GitFilesystem anywhere a Filesystem is expected
 
-// List remote refs.
-$refs = $remote->ls_refs( 'refs/heads/' );
+Because `GitFilesystem` implements the `Filesystem` interface, you can pass it to any code that operates on a filesystem — including `ZipEncoder` to package a commit as a ZIP file:
 
-// Pull a branch.
-$remote->pull( 'refs/heads/trunk' );
+```php
+use WordPress\Git\GitFilesystem;
+use WordPress\Zip\ZipEncoder;
 
-// Push local changes.
-$remote->push( 'trunk' );
+$git_fs  = new GitFilesystem( $repo, $commit_hash );
+$encoder = new ZipEncoder( $output_stream );
+$encoder->append_from_filesystem( $git_fs, '/' );
+$encoder->finish();
 ```
 
-## API Reference
-
-### GitRepository
-
-| Method | Description |
-|---|---|
-| `__construct( Filesystem $fs )` | Create a repository backed by a filesystem |
-| `add_object( $type, $content )` | Store a blob, tree, or commit; returns its SHA-1 hash |
-| `read_object( $oid )` | Read an object by hash; returns a stream with `consume_all()` and `as_commit()` / `as_tree()` |
-| `has_object( $oid )` | Check whether an object exists locally |
-| `find_hash_by_path( $path, $commit )` | Resolve a file path to its object hash |
-| `read_object_by_path( $path, $commit )` | Read a file's content by path |
-| `commit( $options )` | Create a commit with `'updates'`, `'deletes'`, and `'move_trees'` |
-| `create_branch( $name, $oid )` | Create a new branch |
-| `checkout( $branch_or_hash )` | Switch HEAD to a branch or commit |
-| `get_branch_tip( $name )` | Get the commit hash a branch points to |
-| `set_branch_tip( $name, $oid )` | Point a branch at a specific commit |
-| `merge( $branch_name, $options )` | Three-way merge; returns `['new_head' => ..., 'conflicts' => [...]]` |
-| `diff_commits( $hash1, $hash2 )` | Diff two commits |
-| `add_remote( $name, $url )` | Register a remote |
-| `get_remote_client( $name )` | Get a `GitRemote` for push/pull operations |
-
-### GitFilesystem
-
-| Method | Description |
-|---|---|
-| `GitFilesystem::create( $repo )` | Wrap a repository with the Filesystem interface |
-| `ls( $path )` | List directory entries |
-| `is_file( $path )` / `is_dir( $path )` | Check entry type |
-| `get_contents( $path )` | Read file contents |
-| `put_contents( $path, $data )` | Write a file (creates a commit) |
-| `rename( $from, $to )` | Rename a file or directory |
-| `rm( $path )` / `rmdir( $path )` | Delete a file or directory |
-
-### Model classes
-
-| Class | Key properties |
-|---|---|
-| `Commit` | `$hash`, `$tree`, `$parents`, `$author`, `$message` |
-| `Tree` | `$entries` (map of name to `TreeEntry`) |
-| `TreeEntry` | `$mode`, `$name`, `$hash`; constants `FILE_MODE_REGULAR_NON_EXECUTABLE`, `FILE_MODE_DIRECTORY` |
-
-## Requirements
-
-- PHP 7.2+
-- No external dependencies (no `git` binary required)
+## Architecture notes
+
+Git object storage uses a two-level directory scheme: objects live in `.git/objects/ab/cdef...` where `ab` is the first two hex characters of the SHA-1 hash and `cdef...` is the rest. Pack files (compressed bundles of many objects) live in `.git/objects/pack/`. `GitRepository` handles both loose objects and pack file reading transparently.
+
+The HTTP smart protocol works in two round trips for a fetch: first a discovery request that returns the list of refs the remote knows about, then a pack-file negotiation in which the remote sends back a pack containing only the objects you don't already have. `GitRemote` implements this protocol using PHP's HTTP client, with no native dependencies.
diff --git a/components/HTML/README.md b/components/HTML/README.md
index b034be17d..a736e7918 100644
--- a/components/HTML/README.md
+++ b/components/HTML/README.md
@@ -1,260 +1,142 @@
 # HTML
 
-A full HTML5 parser and tag processor implemented in pure PHP, mirroring WordPress core's HTML API. It provides two levels of access: `WP_HTML_Tag_Processor` for fast, linear scanning and modification of HTML attributes, and `WP_HTML_Processor` for structure-aware parsing that understands nested elements, implicit tag closers, and the HTML5 insertion algorithm. No libxml2, no DOM extension, no external dependencies.
+## Why this exists
 
-## Installation
+Modifying HTML in PHP usually means one of two things: string manipulation (fragile, breaks on any attribute ordering or whitespace variation) or loading the DOM extension (which requires libxml2, triggers errors on valid HTML5 that doesn't conform to XML rules, and mangles the document in the process).
 
-```
-composer require wp-php-toolkit/html
-```
+WordPress needed a third option: a parser that can safely scan and modify real-world HTML — including malformed markup — without any native extension, without building a DOM tree in memory, and without altering content it wasn't asked to change. The result is `WP_HTML_Tag_Processor` and `WP_HTML_Processor`, both mirrored here from WordPress core for use outside WordPress.
 
-## Quick Start
+The key design insight is that most HTML processing tasks don't need a full DOM tree. You want to find a tag and change one of its attributes. You want to add a class to every `<img>`. You don't need to understand the document structure for that — you just need to scan forward efficiently. `WP_HTML_Tag_Processor` handles that case. When you do need structure — "find the `<img>` inside a `<figure>` inside a `<div class='gallery'>`" — `WP_HTML_Processor` adds the HTML5 insertion algorithm on top.
 
-Find and modify HTML tags:
+## How it works
 
-```php
-$html = '<div class="entry"><img src="photo.jpg"><p>Hello</p></div>';
+### WP_HTML_Tag_Processor — fast linear scanning
 
-$tags = new WP_HTML_Tag_Processor( $html );
-if ( $tags->next_tag( 'img' ) ) {
-    $tags->set_attribute( 'loading', 'lazy' );
-    $tags->add_class( 'responsive' );
-}
+`WP_HTML_Tag_Processor` is a forward-only cursor over raw HTML bytes. You call `next_tag()` to advance to the next opening tag, optionally filtering by tag name or class name. When the cursor is on a tag, you can read and modify its attributes. Calling `get_updated_html()` at the end returns the original HTML with your modifications applied.
 
-echo $tags->get_updated_html();
-// <div class="entry"><img loading="lazy" class="responsive" src="photo.jpg"><p>Hello</p></div>
-```
+The important thing it does *not* do: it doesn't build a tree, it doesn't understand nesting, it doesn't run the HTML5 parsing algorithm. It's a fast string scanner that knows what a tag looks like. This makes it useful for a huge class of real-world tasks that don't need structure awareness, and it makes it very fast.
 
-## Usage
-
-### Tag Processor: Linear Scanning
+### WP_HTML_Processor — structure-aware parsing
 
-`WP_HTML_Tag_Processor` scans through HTML linearly, finding tags by name, class, or other criteria. It does not parse the DOM tree -- it operates on a flat stream of tags, which makes it fast and predictable.
-
-```php
-$html = '<ul><li class="active">First</li><li>Second</li><li>Third</li></ul>';
-$tags = new WP_HTML_Tag_Processor( $html );
+`WP_HTML_Processor` extends the tag processor with the HTML5 tree-construction algorithm. It understands that `<li>` implicitly closes a previous `<li>`, that `<p>` can't contain `<div>`, that `<table>` creates a distinct parsing context. This lets you query by breadcrumb — a sequence of ancestor tags — rather than just by tag name.
 
-// Find tags by name.
-while ( $tags->next_tag( 'li' ) ) {
-    $tags->set_attribute( 'role', 'listitem' );
-}
-echo $tags->get_updated_html();
-// Every <li> now has role="listitem".
-```
+When it encounters markup it can't safely handle (certain edge cases in the HTML5 spec), it returns `null` rather than producing incorrect output. The design principle is "correct output or no output" — it refuses to silently corrupt a document.
 
-#### Querying with Arrays
+## Usage
 
-Pass an array to `next_tag()` to match by tag name, class, or both:
+### Add a class to every image
 
 ```php
-$tags = new WP_HTML_Tag_Processor( $html );
+use WordPress\HTML\WP_HTML_Tag_Processor;
 
-// Find by tag name.
-$tags->next_tag( array( 'tag_name' => 'img' ) );
+$html = new WP_HTML_Tag_Processor( $content );
 
-// Find by CSS class.
-$tags->next_tag( array( 'class_name' => 'hero' ) );
-
-// Find by both.
-$tags->next_tag( array( 'tag_name' => 'div', 'class_name' => 'sidebar' ) );
-```
-
-#### Reading Attributes
-
-```php
-$html = '<a href="https://wordpress.org" title="WP" class="button primary">Visit</a>';
-$tags = new WP_HTML_Tag_Processor( $html );
-
-if ( $tags->next_tag( 'a' ) ) {
-    $tags->get_tag();                   // 'A'
-    $tags->get_attribute( 'href' );     // 'https://wordpress.org'
-    $tags->get_attribute( 'title' );    // 'WP'
-    $tags->get_attribute( 'missing' );  // null (attribute not present)
-    $tags->has_class( 'button' );       // true
-    $tags->has_class( 'danger' );       // false
+while ( $html->next_tag( 'img' ) ) {
+    $html->add_class( 'responsive' );
 }
-```
 
-#### Modifying Attributes and Classes
-
-```php
-$tags = new WP_HTML_Tag_Processor( '<div class="old" data-x="1">' );
-$tags->next_tag();
-
-$tags->set_attribute( 'id', 'main' );       // Add a new attribute.
-$tags->set_attribute( 'data-x', '2' );      // Update an existing attribute.
-$tags->remove_attribute( 'data-x' );        // Remove an attribute.
-$tags->add_class( 'new' );                  // Add a CSS class.
-$tags->remove_class( 'old' );               // Remove a CSS class.
-
-echo $tags->get_updated_html();
-// <div id="main" class=" new">
+echo $html->get_updated_html();
 ```
 
-#### Custom Filtering
-
-When the query syntax is not enough, loop through tags and inspect them directly:
+### Find a tag with a specific attribute
 
 ```php
-$tags = new WP_HTML_Tag_Processor( $html );
-while ( $tags->next_tag() ) {
-    if (
-        ( 'DIV' === $tags->get_tag() || 'SPAN' === $tags->get_tag() ) &&
-        'highlight' === $tags->get_attribute( 'data-style' )
-    ) {
-        $tags->add_class( 'theme-highlight' );
+$html = new WP_HTML_Tag_Processor( $content );
+
+// Find the first <a> with a rel="noopener" attribute.
+if ( $html->next_tag( array( 'tag_name' => 'a', 'tag_closers' => 'skip' ) ) ) {
+    while ( $html->get_attribute( 'rel' ) !== 'noopener' ) {
+        if ( ! $html->next_tag( array( 'tag_name' => 'a' ) ) ) {
+            break;
+        }
     }
+    $html->set_attribute( 'target', '_blank' );
 }
 ```
 
-#### Bookmarks
-
-Bookmarks let you save a position and return to it later. This is the one exception to the forward-only scanning rule:
+### Read and modify attributes
 
 ```php
-$tags = new WP_HTML_Tag_Processor( '<div><span>text</span></div>' );
-$tags->next_tag( 'div' );
-$tags->set_bookmark( 'the-div' );
+$html = new WP_HTML_Tag_Processor( '<img src="old.jpg" alt="A photo" class="hero">' );
+$html->next_tag( 'img' );
 
-$tags->next_tag( 'span' );
-$tags->set_attribute( 'class', 'inner' );
+echo $html->get_attribute( 'src' );   // "old.jpg"
+echo $html->get_attribute( 'alt' );   // "A photo"
 
-// Jump back to the bookmarked position.
-$tags->seek( 'the-div' );
-$tags->set_attribute( 'class', 'outer' );
+$html->set_attribute( 'src', 'new.jpg' );
+$html->remove_attribute( 'class' );
 
-$tags->release_bookmark( 'the-div' );
-echo $tags->get_updated_html();
-// <div class="outer"><span class="inner">text</span></div>
+echo $html->get_updated_html();
+// <img src="new.jpg" alt="A photo">
 ```
 
-### HTML Processor: Structure-Aware Parsing
+### Query by structure with WP_HTML_Processor
 
-`WP_HTML_Processor` extends the tag processor with HTML5-compliant structural parsing. It understands nested elements, implied closers, and can query by element nesting (breadcrumbs).
+When you need to find a tag based on where it sits in the document tree, use `WP_HTML_Processor`. Breadcrumbs work like a simplified CSS selector with only the child combinator:
 
 ```php
-$html = '<figure><img src="photo.jpg"><figcaption>A <em>lovely</em> day</figcaption></figure>';
+use WordPress\HTML\WP_HTML_Processor;
 
-$processor = WP_HTML_Processor::create_fragment( $html );
+$html = WP_HTML_Processor::create_fragment( $content );
 
-// Find an IMG that is a direct child of FIGURE.
-if ( $processor->next_tag( array( 'breadcrumbs' => array( 'FIGURE', 'IMG' ) ) ) ) {
-    $processor->set_attribute( 'loading', 'lazy' );
+// Find every <img> that is a direct child of a <figure>.
+while ( $html->next_tag( array( 'breadcrumbs' => array( 'figure', 'img' ) ) ) ) {
+    $html->set_attribute( 'loading', 'lazy' );
 }
-```
-
-#### Breadcrumbs
-
-Breadcrumbs represent the stack of open elements from the root down to the current tag. They work like a CSS child combinator (`FIGURE > IMG`):
 
-```php
-$html = '<div><p>One</p><p>Two <em>Three</em></p></div>';
-$processor = WP_HTML_Processor::create_fragment( $html );
-
-while ( $processor->next_tag() ) {
-    $crumbs = $processor->get_breadcrumbs();
-    // First match:  array( 'HTML', 'BODY', 'DIV' )
-    // Second match: array( 'HTML', 'BODY', 'DIV', 'P' )
-    // ... and so on for each tag encountered.
-}
+echo $html->get_updated_html();
 ```
 
-#### Token-Level Access
+### Use bookmarks to return to a position
 
-Both processors support token-level iteration via `next_token()`, which visits every token in the document including text nodes, comments, and tags:
+Sometimes you want to mark a position in the document and come back to it later:
 
 ```php
-$processor = WP_HTML_Processor::create_fragment( '<p>Hello <b>world</b></p>' );
-
-while ( $processor->next_token() ) {
-    $type = $processor->get_token_type();
-    // '#tag'  for HTML tags (openers and closers)
-    // '#text' for text content
-    // Other types for comments, doctypes, etc.
+$html = new WP_HTML_Tag_Processor( $content );
 
-    if ( '#text' === $type ) {
-        echo $processor->get_modifiable_text();
-        // "Hello ", then "world"
+while ( $html->next_tag( 'div' ) ) {
+    if ( $html->get_attribute( 'id' ) === 'header' ) {
+        $html->set_bookmark( 'header' );
     }
 }
+
+// ... do other work ...
+
+$html->seek( 'header' );
+$html->add_class( 'processed' );
 ```
 
-#### Serialization
+### Decode HTML entities
 
-The processor can serialize its parsed document back to a well-formed HTML string:
+`WP_HTML_Decoder` handles entity decoding, including numeric character references and all named HTML entities, without needing the DOM or `html_entity_decode()`:
 
 ```php
-$messy = '<p>one<p>two';  // Missing closer -- valid HTML5, parsed as two paragraphs.
-$processor = WP_HTML_Processor::create_fragment( $messy );
-echo $processor->serialize();
-// <html><head></head><body><p>one</p><p>two</p></body></html>
+use WordPress\HTML\WP_HTML_Decoder;
+
+echo WP_HTML_Decoder::decode( '&lt;em&gt;Hello&lt;/em&gt;' );
+// <em>Hello</em>
+
+echo WP_HTML_Decoder::decode( '&#128512;' );
+// 😀
 ```
 
-### HTML Decoder
+## Choosing between the two processors
 
-`WP_HTML_Decoder` decodes HTML character references in text nodes and attribute values, handling named entities, numeric references, and edge cases from the HTML5 spec:
+Use `WP_HTML_Tag_Processor` when:
+- You're modifying attributes on specific tags (add/remove classes, change `src`, set `data-*`).
+- You don't care about document structure — just "find tags matching this name/attribute."
+- You want maximum performance on large documents.
 
-```php
-$decoded = WP_HTML_Decoder::decode_text_node( 'AT&amp;T &mdash; 100&percnt;' );
-// 'AT&T — 100%'
+Use `WP_HTML_Processor` when:
+- You need to find tags based on their ancestors ("the `<img>` inside a `<figure>`").
+- You're working with content that relies on implicit tag behavior (e.g., HTML that omits `</p>` or `</li>` close tags).
+- You need to understand the document tree, not just scan its surface.
 
-$decoded = WP_HTML_Decoder::decode_attribute( 'path?a=1&amp;b=2' );
-// 'path?a=1&b=2'
+## Important limitations
 
-// Check if an encoded attribute value starts with a given string.
-$starts = WP_HTML_Decoder::attribute_starts_with( 'http&colon;//example.com', 'http:', 'ascii-case-insensitive' );
-// true
-```
+Neither processor supports:
+- Modifying text content (only attributes and class names can be changed).
+- Inserting or removing entire tags (you can modify existing ones only).
+- JavaScript or CSS inside the document (those are treated as opaque text).
 
-## API Reference
-
-### WP_HTML_Tag_Processor
-
-| Method | Description |
-|--------|-------------|
-| `__construct( $html )` | Create a processor for the given HTML string |
-| `next_tag( $query = null )` | Advance to the next matching tag; returns `bool` |
-| `next_token()` | Advance to the next token (tag, text, comment); returns `bool` |
-| `get_tag()` | Get the uppercase tag name of the current tag |
-| `get_token_type()` | Get the token type (`#tag`, `#text`, `#comment`, etc.) |
-| `get_attribute( $name )` | Get an attribute value, `null` if missing, `true` for boolean attributes |
-| `set_attribute( $name, $value )` | Set or update an attribute |
-| `remove_attribute( $name )` | Remove an attribute |
-| `add_class( $class_name )` | Add a CSS class |
-| `remove_class( $class_name )` | Remove a CSS class |
-| `has_class( $wanted_class )` | Check if a CSS class is present |
-| `get_updated_html()` | Get the modified HTML string |
-| `get_modifiable_text()` | Get the text content of the current text node |
-| `set_bookmark( $name )` | Save the current position |
-| `seek( $bookmark_name )` | Return to a bookmarked position |
-| `release_bookmark( $name )` | Free a bookmark |
-
-### WP_HTML_Processor
-
-| Method | Description |
-|--------|-------------|
-| `create_fragment( $html )` | Create a processor for an HTML fragment (static factory) |
-| `next_tag( $query = null )` | Find the next tag, supports `'breadcrumbs'` queries |
-| `next_token()` | Advance to the next token with structural awareness |
-| `get_breadcrumbs()` | Get the stack of open elements as an array of tag names |
-| `serialize()` | Serialize the parsed document to well-formed HTML |
-
-Inherits all attribute and class methods from `WP_HTML_Tag_Processor`.
-
-### WP_HTML_Decoder
-
-| Method | Description |
-|--------|-------------|
-| `decode_text_node( $text )` | Decode character references in an HTML text node |
-| `decode_attribute( $text )` | Decode character references in an attribute value |
-| `attribute_starts_with( $haystack, $search, $case )` | Check if an encoded attribute starts with a plain string |
-
-## Attribution
-
-This component is extracted from [WordPress core's HTML API](https://developer.wordpress.org/reference/classes/wp_html_processor/). The `WP_HTML_Tag_Processor` and `WP_HTML_Processor` were created by the WordPress core team to provide a safe, spec-compliant way to modify HTML without regular expressions. Licensed under GPL v2.
-
-## Requirements
-
-- PHP 7.2+
-- No external dependencies
+`WP_HTML_Processor` will abort with `null` on constructs it can't safely handle. Always check return values when using it on untrusted or complex HTML.
diff --git a/components/Markdown/README.md b/components/Markdown/README.md
index d4fe3a823..813ca09c3 100644
--- a/components/Markdown/README.md
+++ b/components/Markdown/README.md
@@ -1,6 +1,6 @@
 # Markdown
 
-Bidirectional converter between Markdown and WordPress block markup. Use `MarkdownConsumer` to parse Markdown (with optional YAML frontmatter) into WordPress blocks, and `MarkdownProducer` to serialize blocks back to Markdown. Designed for content synchronization workflows where round-trip fidelity and whitespace preservation matter, such as three-way merging of static Markdown files with a WordPress database.
+Bidirectional converter between Markdown and WordPress block markup. Use `MarkdownConsumer` to parse Markdown (with optional YAML frontmatter) into WordPress blocks, and `MarkdownProducer` to serialize supported blocks back to Markdown. Designed for content synchronization workflows where a practical, structured conversion matters, such as three-way merging of static Markdown files with a WordPress database. It is not a byte-perfect Markdown formatter, and block attributes with no Markdown representation may be lost.
 
 ## Installation
 
diff --git a/components/XML/README.md b/components/XML/README.md
index bc37ccb79..d0a215331 100644
--- a/components/XML/README.md
+++ b/components/XML/README.md
@@ -1,223 +1,140 @@
 # XML
 
-A pure PHP XML processor that parses and modifies XML documents without requiring the `libxml2` extension. It implements a subset of the XML 1.0 specification and operates as a streaming, forward-only scanner with namespace support, attribute manipulation, and bookmark-based seeking. Designed for environments where native XML extensions are unavailable, such as sandboxed WordPress installations.
+## Why this exists
 
-## Installation
+PHP ships with excellent XML support — `SimpleXML`, `DOMDocument`, `XMLReader` — but all of them rely on `libxml2`, a native C library. In most PHP environments that's fine. In WordPress Playground, which runs PHP compiled to WebAssembly in the browser, native extensions aren't available. You get the PHP standard library and nothing else.
 
-```
-composer require wp-php-toolkit/xml
-```
+WordPress Playground needs to parse and modify XML to handle OPML files, RSS feeds, WordPress export files (WXR), and configuration formats. This component provides a pure PHP XML processor — no extensions, no external libraries — that covers the practical subset of XML 1.0 that real-world documents use.
 
-## Quick Start
+The design mirrors `WP_HTML_Tag_Processor` from the HTML component: a streaming, forward-only cursor you advance tag by tag, reading and modifying attributes as you go. If you already know the HTML processor, you'll be immediately comfortable here.
 
-```php
-use WordPress\XML\XMLProcessor;
+## How it works
 
-$xml = '<catalog><book price="29.99"><title>PHP Internals</title></book></catalog>';
-$processor = XMLProcessor::create_from_string( $xml );
+`XMLProcessor` is a forward-only scanner over an XML document string. Under the hood it implements a hand-written lexer that recognizes the token types XML defines: opening tags, closing tags, self-closing tags, text content, CDATA sections, processing instructions, and comments. It doesn't build a DOM tree. It doesn't allocate node objects. It simply advances a cursor through the bytes and lets you inspect and modify the token it's currently pointing at.
 
-if ( $processor->next_tag( 'book' ) ) {
-    $price = $processor->get_attribute( '', 'price' ); // "29.99"
-    $processor->set_attribute( '', 'price', '24.99' );
-}
+**Namespaces** follow the Namespaces in XML 1.0 specification: a namespace declaration like `xmlns:wp="http://wordpress.org/export/1.2/"` maps a prefix to an expanded namespace name. Many namespace names look like URLs, but they are identifiers, not URLs the processor fetches. When querying for tags, you provide the expanded namespace name and the local name (not the prefix), making queries stable across documents that use different prefix conventions.
 
-echo $processor->get_updated_xml();
-// <catalog><book price="24.99"><title>PHP Internals</title></book></catalog>
-```
+**Bookmarks** let you mark positions in the document and seek back to them. This is useful for multi-pass processing: scan forward to collect information, then seek back to the marked positions to make changes.
 
-## Usage
+**Streaming mode** accepts input in chunks. The scanner can tell you when it needs more data, so you can process large documents without loading them entirely into memory.
 
-### Navigating Tags
+## Supported subset
 
-Use `next_tag()` to move the cursor forward through the document. It accepts a tag name string, a namespace-qualified array, or a query array.
+The processor handles:
+- Well-formed UTF-8 encoded XML documents
+- Namespace declarations and namespace-qualified tag queries
+- Processing instructions and comments (scannable but not modifiable)
+- CDATA sections (treated as opaque text)
+- All attribute operations: read, set, remove
 
-```php
-$xml = '<root><chapter><section id="intro">Hello</section></chapter></root>';
-$processor = XMLProcessor::create_from_string( $xml );
+It explicitly does not support:
+- DTDs, DOCTYPE declarations, ATTLIST, ENTITY, or conditional sections
+- XML schemas or validation
+- Encoding declarations other than UTF-8
 
-// Find any tag
-$processor->next_tag();
-echo $processor->get_tag_local_name(); // "root"
+For the XML that WordPress-ecosystem tools actually produce and consume, these constraints are rarely a limitation.
 
-// Find a specific tag by name
-$processor->next_tag( 'section' );
-echo $processor->get_attribute( '', 'id' ); // "intro"
-```
-
-### Working with Namespaces
+## Usage
 
-Namespaces are first-class citizens. Methods like `get_attribute()` and `set_attribute()` take the full namespace URI as the first argument, not a prefix.
+### Scan tags and read attributes
 
 ```php
-$xml = '<root xmlns:wp="http://wordpress.org/export/1.2/">'
-     . '<wp:post wp:status="draft">Content</wp:post>'
-     . '</root>';
-
-$processor = XMLProcessor::create_from_string( $xml );
-$ns = 'http://wordpress.org/export/1.2/';
+use WordPress\XML\XMLProcessor;
 
-// Find a namespaced tag by passing array( namespace_uri, local_name )
-if ( $processor->next_tag( array( $ns, 'post' ) ) ) {
-    echo $processor->get_tag_local_name();  // "post"
-    echo $processor->get_tag_namespace();   // "http://wordpress.org/export/1.2/"
+$xml = XMLProcessor::create_from_string( $document );
 
-    // Read and write namespaced attributes
-    echo $processor->get_attribute( $ns, 'status' ); // "draft"
-    $processor->set_attribute( $ns, 'status', 'published' );
+while ( $xml->next_tag() ) {
+    echo $xml->get_tag_local_name() . "\n";         // local tag name
+    echo $xml->get_attribute( '', 'id' ) . "\n";    // attribute value or null
 }
-
-echo $processor->get_updated_xml();
-// <root xmlns:wp="http://wordpress.org/export/1.2/"><wp:post wp:status="published">Content</wp:post></root>
 ```
 
-### Modifying Attributes
+### Query by tag name
 
 ```php
-$xml = '<config><setting name="timeout" value="30" deprecated="yes" /></config>';
-$processor = XMLProcessor::create_from_string( $xml );
-
-if ( $processor->next_tag( 'setting' ) ) {
-    // Update an attribute
-    $processor->set_attribute( '', 'value', '60' );
-
-    // Remove an attribute
-    $processor->remove_attribute( '', 'deprecated' );
-
-    // Add a new attribute
-    $processor->set_attribute( '', 'unit', 'seconds' );
+$xml = XMLProcessor::create_from_string( $document );
+
+while ( $xml->next_tag( 'item' ) ) {
+    // Only visits <item> opening tags.
+    $title = '';
+    if ( $xml->next_tag( 'title' ) ) {
+        $xml->next_token();
+        $title = $xml->get_modifiable_text();
+    }
+    echo $title . "\n";
 }
-
-echo $processor->get_updated_xml();
-// <config><setting unit="seconds" name="timeout" value="60"  /></config>
 ```
 
-### Token-Level Processing
+### Query by namespace
 
-Use `next_token()` to visit every lexical token in the document, including text nodes, comments, CDATA sections, and processing instructions.
+When working with namespaced XML, pass a `[namespace_name, local_name]` tuple to `next_tag()`:
 
 ```php
-$xml = '<article><title>Hello World</title><body>Some text</body></article>';
-$processor = XMLProcessor::create_from_string( $xml );
+// WordPress export files use the "wp" namespace.
+$ns  = 'http://wordpress.org/export/1.2/';
+$xml = XMLProcessor::create_from_string( $wxr_document );
 
-$text_content = '';
-while ( $processor->next_token() ) {
-    if ( '#text' === $processor->get_token_name() ) {
-        $text_content .= $processor->get_modifiable_text();
-    }
+while ( $xml->next_tag( array( $ns, 'post_id' ) ) ) {
+    $xml->next_token();
+    echo $xml->get_modifiable_text() . "\n";  // the post ID value
 }
-
-echo $text_content; // "Hello WorldSome text"
 ```
 
-### Modifying Text Content
+### Modify attributes
 
 ```php
-$xml = '<greeting>Hello</greeting>';
-$processor = XMLProcessor::create_from_string( $xml );
+$xml = XMLProcessor::create_from_string( '<items><item id="1" status="draft"/></items>' );
 
-$processor->next_tag( 'greeting' );
-$processor->next_token(); // Move to the text node
-$processor->set_modifiable_text( 'Goodbye' );
+while ( $xml->next_tag( 'item' ) ) {
+    $xml->set_attribute( '', 'status', 'published' );
+    $xml->remove_attribute( '', 'id' );
+}
 
-echo $processor->get_updated_xml();
-// <greeting>Goodbye</greeting>
+echo $xml->get_updated_xml();
+// <items><item status="published"/></items>
 ```
 
-### Self-Closing Elements
+### Use bookmarks for multi-pass processing
 
 ```php
-$xml = '<root><img src="photo.jpg" /><br /><p>Text</p></root>';
-$processor = XMLProcessor::create_from_string( $xml );
+$xml = XMLProcessor::create_from_string( $document );
+$ids = array();
 
-while ( $processor->next_tag( array( 'tag_closers' => 'visit' ) ) ) {
-    if ( $processor->is_empty_element() ) {
-        echo $processor->get_tag_local_name() . ' is self-closing' . "\n";
-    }
+// First pass: collect all IDs.
+while ( $xml->next_tag( 'item' ) ) {
+    $xml->set_bookmark( 'item_' . $xml->get_attribute( '', 'id' ) );
+    $ids[] = $xml->get_attribute( '', 'id' );
+}
+
+// Second pass: update specific items.
+foreach ( $ids as $id ) {
+    $xml->seek( 'item_' . $id );
+    $xml->set_attribute( '', 'processed', 'true' );
 }
-// img is self-closing
-// br is self-closing
 ```
 
-### Bookmarks
+### Process a document in streaming chunks
 
-Bookmarks let you save a position in the document and return to it later. This is useful when you need to inspect downstream content before deciding how to modify an earlier tag.
+For large documents, feed data in pieces:
 
 ```php
-$xml = '<list><item>A</item><item>B</item><item>C</item></list>';
-$processor = XMLProcessor::create_from_string( $xml );
+$xml = XMLProcessor::create_for_streaming();
 
-$processor->next_tag( 'list' );
-$processor->set_bookmark( 'list-start' );
+while ( $chunk = fread( $handle, 65536 ) ) {
+    $xml->append_bytes( $chunk );
 
-// Count items
-$count = 0;
-while ( $processor->next_tag( 'item' ) ) {
-    $count++;
+    while ( $xml->next_tag() ) {
+        // Process tokens as they arrive.
+    }
 }
-
-// Go back and annotate the list with the count
-$processor->seek( 'list-start' );
-$processor->set_attribute( '', 'data-count', (string) $count );
-
-echo $processor->get_updated_xml();
-// <list data-count="3"><item>A</item><item>B</item><item>C</item></list>
 ```
 
-### Streaming XML Processing
-
-For large documents, use `create_for_streaming()` to feed XML in chunks and process it incrementally.
+## Relationship to the HTML component
 
-```php
-$processor = XMLProcessor::create_for_streaming();
-
-// Feed chunks of XML data
-$processor->append_bytes( '<root><item id=' );
-$processor->append_bytes( '"1">First</item>' );
-$processor->append_bytes( '<item id="2">Second</item></root>' );
-$processor->input_finished();
+`XMLProcessor` and `WP_HTML_Tag_Processor` share the same API philosophy: forward-only cursor, `next_tag()` to advance, attribute getters and setters, bookmarks for seeking, `get_updated_*()` to retrieve the modified document. The main differences are:
 
-// Process all tags
-while ( $processor->next_tag( 'item' ) ) {
-    echo $processor->get_attribute( '', 'id' ) . "\n";
-}
-// 1
-// 2
-```
+- XML is strict and well-formed; HTML is lenient about malformed markup.
+- XML has namespaces as a first-class concept; HTML's namespace handling is implicit.
+- XML has no equivalent to HTML's implicit tag closing rules.
 
-## API Reference
-
-### XMLProcessor
-
-| Method | Description |
-|--------|-------------|
-| `create_from_string( $xml )` | Create a processor for a complete XML string |
-| `create_for_streaming( $xml )` | Create a processor that accepts incremental input |
-| `next_tag( $query )` | Advance to the next matching tag. Returns `true` if found |
-| `next_token()` | Advance to the next lexical token of any kind |
-| `get_tag_local_name()` | Get the local name of the current tag |
-| `get_tag_namespace()` | Get the namespace URI of the current tag |
-| `is_tag_opener()` | Whether the current tag is an opening tag |
-| `is_tag_closer()` | Whether the current tag is a closing tag |
-| `is_empty_element()` | Whether the current tag is self-closing |
-| `get_attribute( $ns, $name )` | Get the decoded value of an attribute |
-| `set_attribute( $ns, $name, $value )` | Set or add an attribute on the current tag |
-| `remove_attribute( $ns, $name )` | Remove an attribute from the current tag |
-| `get_modifiable_text()` | Get decoded text content of the current text/CDATA/comment node |
-| `set_modifiable_text( $value )` | Replace text content of the current node |
-| `get_token_name()` | Get the name of the current token (tag name, `#text`, `#comment`, etc.) |
-| `set_bookmark( $name )` | Save the current position with a name |
-| `seek( $name )` | Return to a previously saved bookmark |
-| `release_bookmark( $name )` | Free a bookmark |
-| `get_updated_xml()` | Get the full XML document with all modifications applied |
-| `append_bytes( $chunk )` | Feed more XML bytes (streaming mode) |
-| `input_finished()` | Signal that all XML bytes have been provided |
-| `is_paused_at_incomplete_input()` | Whether the parser stopped due to incomplete input |
-
-## Attribution
-
-The `XMLProcessor` follows the same architecture and API patterns as [WordPress core's HTML API](https://developer.wordpress.org/reference/classes/wp_html_processor/), extending the streaming tag-processor approach from HTML to XML. Licensed under GPL v2.
-
-## Requirements
-
-- PHP 7.2+
-- No external PHP extensions required (no libxml2)
+If you're already comfortable with one, the other will feel immediately familiar.
diff --git a/components/XML/class-xmlprocessor.php b/components/XML/class-xmlprocessor.php
index c2998a05f..ca6f4d5a6 100644
--- a/components/XML/class-xmlprocessor.php
+++ b/components/XML/class-xmlprocessor.php
@@ -85,19 +85,19 @@
  * | Find any tag.                                            | `$processor->next_tag();`                                |
  * | Find next image tag.                                     | `$processor->next_tag( array( 'tag_name' => 'image' ) );`|
  * | Find next image tag (shorthand).                         | `$processor->next_tag( 'image' );`                       |
- * | Find next image tag in the "wp.org" namespace.           | `$processor->next_tag( array( 'wp.org', 'image' ) );`    |
+ * | Find next image tag in the "wp.org" namespace name.      | `$processor->next_tag( array( 'wp.org', 'image' ) );`    |
  *
  * #### Namespace Examples
  *
- * To work with namespaces, you can use the `breadcrumbs` query format, where each breadcrumb is a tuple of (namespace prefix, local name):
+ * To work with namespaces, pass a tuple of (namespace name, local name):
  *
- *     $xml = '<root xmlns:wp="http://wordpress.org/export/1.2/"><wp:image src="cat.jpg" /></root>';
+ *     $xml = '<root xmlns:wp="http://wordpress.org/export/1.2/"><wp:image wp:src="cat.jpg" /></root>';
  *     $processor = XMLProcessor::create_from_string( $xml );
  *     // Find the <wp:image> tag
  *     if ( $processor->next_tag( array( 'http://wordpress.org/export/1.2/', 'image' ) ) ) {
- *         // Get the namespace URI of the matched tag
+ *         // Get the namespace name of the matched tag
  *         $ns = $processor->get_tag_namespace(); // 'http://wordpress.org/export/1.2/'
- *         // Get the value of the 'src' attribute
+ *         // Get the value of the wp:src attribute
  *         $src = $processor->get_attribute( $ns, 'src' );
  *         // Set a new attribute in the same namespace
  *         $processor->set_attribute( $ns, 'alt', 'A cat' );
@@ -315,9 +315,10 @@
  *
  * ### Namespaces
  *
- * Namespaces are first-class citizens in the XMLProcessor. Methods such as `set_attribute()` and `remove_attribute()`
- * require the full namespace URI, not just the local name. The XML specification treats the local
- * name as a mere syntax sugar. The actual matching is always done on the fully qualified namespace name.
+ * Namespaces are first-class citizens in the XMLProcessor. Namespace-aware methods such as
+ * `set_attribute()` and `remove_attribute()` require the expanded namespace name from the
+ * matching `xmlns` declaration, not the prefix written in the tag.
+ * The actual matching is done on the expanded namespace name plus the local name.
  *
  * Example:
  *
diff --git a/components/Zip/README.md b/components/Zip/README.md
index 29ba4df92..3b0c5232d 100644
--- a/components/Zip/README.md
+++ b/components/Zip/README.md
@@ -1,173 +1,139 @@
 # Zip
 
-A pure PHP library for reading and writing ZIP archives without the `libzip` extension or `ZipArchive` class. It provides a streaming `ZipFilesystem` reader that exposes ZIP contents through a standard filesystem interface, and a `ZipEncoder` that writes ZIP files incrementally. Handles both stored and deflate-compressed entries.
+## Why this exists
 
-## Installation
+PHP ships with `ZipArchive`, a convenient class for reading and writing ZIP files. The catch: it requires the `libzip` native extension, which isn't available everywhere. WordPress Playground compiles PHP to WebAssembly and runs it in the browser — no native extensions, no `libzip`, no `ZipArchive`.
 
-```
-composer require wp-php-toolkit/zip
-```
+WordPress Playground needs ZIP files constantly. Installing a plugin, importing a theme, exporting a site — all of these move data as ZIP archives. This component implements ZIP reading and writing entirely in pure PHP so that Playground (and any other extension-free PHP environment) can work with ZIP files without restriction.
 
-## Quick Start
+## How it works
 
-```php
-use WordPress\ByteStream\ReadStream\FileReadStream;
-use WordPress\Zip\ZipFilesystem;
+A ZIP file is structured with the actual file data at the front and a "central directory" at the end. The central directory is an index: it lists every file in the archive along with the offset where its data starts. This layout is what makes ZIP files streamable — you can start writing file data immediately without knowing the final offsets, then write the index at the end.
 
-// Open a ZIP file and read its contents
-$zip = ZipFilesystem::create( FileReadStream::from_path( 'archive.zip' ) );
+### Reading: ZipFilesystem
 
-// List top-level entries
-$entries = $zip->ls(); // ['readme.txt', 'src', 'images']
+`ZipFilesystem` reads the central directory first (from the end of the file) to build an in-memory index, then lazily reads individual file entries on demand. It implements the `Filesystem` interface from this toolkit, so reading a ZIP archive looks identical to reading a local directory. Code that accepts a `Filesystem` argument works against a ZIP file without any changes.
 
-// Read a file
-$content = $zip->get_contents( 'readme.txt' );
-```
+The central directory is capped at 2 MB to keep memory usage predictable even for large archives.
 
-## Usage
+### Writing: ZipEncoder
 
-### Reading ZIP Archives
+`ZipEncoder` writes a ZIP archive incrementally to a `ByteWriteStream`. You add files one at a time; it writes each local file header and data immediately. When you call `close()`, it writes the central directory and end-of-central-directory record, completing the archive.
 
-`ZipFilesystem` implements the `Filesystem` interface, so you can list directories, check paths, and read files just like a regular filesystem.
+Files can be stored uncompressed (`STORE`) or compressed with DEFLATE. The encoder handles CRC32 checksums and compressed/uncompressed size tracking automatically.
+
+## Usage
+
+### Read files from a ZIP archive
 
 ```php
-use WordPress\ByteStream\ReadStream\FileReadStream;
 use WordPress\Zip\ZipFilesystem;
 
-$zip = ZipFilesystem::create( FileReadStream::from_path( 'book.epub' ) );
+$fs = ZipFilesystem::create( \WordPress\ByteStream\ReadStream\FileReadStream::from_path( '/path/to/plugin.zip' ) );
 
-// List the root directory
-$entries = $zip->ls();
-// ['mimetype', 'EPUB', 'META-INF']
+// Works just like any other Filesystem.
+foreach ( $fs->ls( '/' ) as $name ) {
+    echo $name . "\n";
+}
 
-// List a subdirectory
-$epub_files = $zip->ls( '/EPUB' );
-// ['cover.xhtml', 'css', 'images', 'nav.xhtml', 'package.opf', ...]
+$contents = $fs->get_contents( '/readme.txt' );
+```
 
-// Check if a path exists
-$zip->exists( 'mimetype' );      // true
-$zip->is_file( 'mimetype' );     // true
-$zip->is_dir( 'EPUB' );          // true
-$zip->is_file( 'EPUB' );         // false
+### Check if a path exists
 
-// Read file contents
-$mimetype = $zip->get_contents( 'mimetype' );
-// "application/epub+zip"
+```php
+if ( $fs->is_file( '/plugin.php' ) ) {
+    $main_file = $fs->get_contents( '/plugin.php' );
+}
 
-$cover = $zip->get_contents( 'EPUB/cover.xhtml' );
-// "<?xml version="1.0" encoding="UTF-8"?>..."
+if ( $fs->is_dir( '/assets' ) ) {
+    foreach ( $fs->ls( '/assets' ) as $asset ) {
+        echo $asset . "\n";
+    }
+}
 ```
 
-### Streaming File Reads
+### Mount a ZIP archive alongside other filesystems
 
-For large files inside the archive, use `open_read_stream()` to read data incrementally instead of loading everything into memory.
+Because `ZipFilesystem` implements `Filesystem`, you can pass it anywhere a filesystem is expected — including to code that recursively copies files:
 
 ```php
-use WordPress\ByteStream\ReadStream\FileReadStream;
 use WordPress\Zip\ZipFilesystem;
-
-$zip = ZipFilesystem::create( FileReadStream::from_path( 'archive.zip' ) );
-
-$stream = $zip->open_read_stream( 'large-dataset.csv' );
-while ( $bytes = $stream->pull( 4096 ) ) {
-    $chunk = $stream->consume( $bytes );
-    // Process the chunk...
+use WordPress\Filesystem\LocalFilesystem;
+use WordPress\Filesystem\Visitor\FilesystemVisitor;
+
+$zip   = ZipFilesystem::create( \WordPress\ByteStream\ReadStream\FileReadStream::from_path( '/tmp/theme.zip' ) );
+$local = new LocalFilesystem( '/var/www/html/wp-content/themes' );
+
+// Extract the ZIP to the local filesystem.
+$visitor = new FilesystemVisitor( $zip, '/' );
+while ( $visitor->next() ) {
+    $event = $visitor->get_event();
+    $path  = $event->get_path();
+    if ( $event->is_dir() ) {
+        $local->mkdir( $path );
+    } elseif ( $event->is_file() ) {
+        $local->put_contents( $path, $zip->get_contents( $path ) );
+    }
 }
 ```
 
-### Creating ZIP Archives
-
-Use `ZipEncoder` to build ZIP files from scratch. Write individual files with `append_file()`, or copy an entire filesystem tree with `append_from_filesystem()`.
+### Create a ZIP archive
 
 ```php
-use WordPress\ByteStream\MemoryPipe;
-use WordPress\ByteStream\WriteStream\FileWriteStream;
-use WordPress\Zip\FileEntry;
-use WordPress\Zip\ZipDecoder;
 use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\FileEntry;
+
+// Write to a file on disk.
+$handle = fopen( '/tmp/output.zip', 'wb' );
+$stream = new FileWriteStream( $handle );
+
+$encoder = new ZipEncoder( $stream );
+
+// Add a simple text file (stored uncompressed).
+$entry = new FileEntry( 'hello.txt', 'Hello, world.' );
+$encoder->append_file( $entry );
 
-// Create a new ZIP file
-$output = FileWriteStream::from_path( 'output.zip', 'truncate' );
-$encoder = new ZipEncoder( $output );
-
-// Add a file with no compression
-$encoder->append_file(
-    new FileEntry( array(
-        'path'               => 'hello.txt',
-        'compression_method' => ZipDecoder::COMPRESSION_NONE,
-        'body_reader'        => new MemoryPipe( 'Hello, world!' ),
-    ) )
-);
-
-// Add a file with deflate compression
-$encoder->append_file(
-    new FileEntry( array(
-        'path'               => 'data/notes.txt',
-        'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
-        'body_reader'        => new MemoryPipe( 'This will be compressed.' ),
-    ) )
-);
-
-// Finalize and close
-$encoder->close();
-$output->close_writing();
+// Add a compressed file.
+$entry = new FileEntry( 'data.json', json_encode( $data ), ZipEncoder::COMPRESSION_DEFLATE );
+$encoder->append_file( $entry );
+
+$encoder->close();
+fclose( $handle );
 ```
 
-### Copying from One ZIP to Another
+### Package a filesystem as a ZIP
 
-Because `ZipFilesystem` implements the standard `Filesystem` interface, you can pass it directly to `ZipEncoder::append_from_filesystem()` to repackage a ZIP archive.
+`ZipEncoder` can recursively archive any `Filesystem` implementation — a local directory, an in-memory tree, or even another ZIP:
 
 ```php
-use WordPress\ByteStream\ReadStream\FileReadStream;
-use WordPress\ByteStream\WriteStream\FileWriteStream;
 use WordPress\Zip\ZipEncoder;
-use WordPress\Zip\ZipFilesystem;
+use WordPress\Filesystem\LocalFilesystem;
 
-// Open the source ZIP
-$source = ZipFilesystem::create( FileReadStream::from_path( 'original.zip' ) );
+$fs      = new LocalFilesystem( '/var/www/html' );
+$handle  = fopen( '/tmp/site-backup.zip', 'wb' );
+$encoder = new ZipEncoder( new FileWriteStream( $handle ) );
 
-// Create a new ZIP with the same contents
-$output = FileWriteStream::from_path( 'copy.zip', 'truncate' );
-$encoder = new ZipEncoder( $output );
-$encoder->append_from_filesystem( $source );
-$encoder->close();
-$output->close_writing();
+$encoder->append_from_filesystem( $fs, '/' );
+$encoder->close();
+fclose( $handle );
 ```
 
-## API Reference
-
-### ZipFilesystem
-
-| Method | Description |
-|--------|-------------|
-| `create( ByteReadStream $reader )` | Create a filesystem view of a ZIP archive |
-| `ls( $dir = '/' )` | List entries in a directory |
-| `is_file( $path )` | Check if a path is a file |
-| `is_dir( $path )` | Check if a path is a directory |
-| `exists( $path )` | Check if a path exists |
-| `get_contents( $path )` | Read an entire file as a string |
-| `open_read_stream( $path )` | Open a streaming reader for a file |
+### Stream a ZIP archive directly to the browser
 
-### ZipEncoder
+Because `ZipEncoder` writes to any `ByteWriteStream`, you can send a ZIP to the browser without creating a temporary file:
 
-| Method | Description |
-|--------|-------------|
-| `__construct( ByteWriteStream $output )` | Create an encoder that writes to the given stream |
-| `append_file( FileEntry $entry )` | Add a single file to the archive |
-| `append_from_filesystem( Filesystem $fs, $path )` | Recursively add files from a filesystem |
-| `close()` | Write the central directory and finalize the archive |
-
-### FileEntry
+```php
+header( 'Content-Type: application/zip' );
+header( 'Content-Disposition: attachment; filename="export.zip"' );
 
-Constructed with an associative array of header fields:
+$encoder = new ZipEncoder( new StdoutWriteStream() );
+$encoder->append_from_filesystem( $fs, '/' );
+$encoder->close();
+```
 
-| Field | Description |
-|-------|-------------|
-| `path` | File path inside the archive |
-| `body_reader` | A `ByteReadStream` with the file data |
-| `compression_method` | `ZipDecoder::COMPRESSION_NONE` or `ZipDecoder::COMPRESSION_DEFLATE` |
+## ZIP format notes
 
-## Requirements
+ZIP stores file data as individual local file records followed by a central directory at the end. Because the encoder writes data before it knows final sizes (for streamed or large files), it uses data descriptors — a technique allowed by the ZIP specification — to record CRC32 and size values after the file data rather than before it.
 
-- PHP 7.2+
-- No external PHP extensions required (no libzip)
+Compression uses PHP's built-in `deflate_init()` / `deflate_add()` functions from the `zlib` extension. If `zlib` is unavailable, files can still be stored uncompressed; only DEFLATE compression requires it.
diff --git a/docs/_legacy/README.md b/docs/_legacy/README.md
new file mode 100644
index 000000000..77f176a6b
--- /dev/null
+++ b/docs/_legacy/README.md
@@ -0,0 +1,61 @@
+# Runnable docs site
+
+Static HTML at `docs/` deployed to GitHub Pages by `.github/workflows/docs.yml`.
+
+## How a page works
+
+Every component page is generated by `bin/build-docs.py` from a single content
+catalog. Most executable examples render as runnable Playground snippets;
+examples that are illustrative rather than executable render as
+`<php-snippet runnable="false">`. The page imports two scripts:
+
+- `https://playground.wordpress.net/php-code-snippet.js` — the upstream
+  `<php-snippet>` web component (see WordPress/wordpress-playground#3528 and
+  #3536). It handles the Run button, the syntax-highlighted code rendering, and
+  shared-runtime reuse across all runnable snippets on a page.
+- `assets/page.js` — local enhancement script that fills the shared blueprint
+  with an absolute URL to `assets/php-toolkit.zip`, builds the sticky
+  table-of-contents from `<h2>` and `<h3>` headings, and patches each snippet's
+  shadow DOM to make runnable code editable and to hide run controls for
+  non-runnable snippets.
+
+The blueprint sits in a `<script id="toolkit-setup" type="application/json">`
+element, populated at runtime by `page.js`. It's a one-step blueprint that
+unzips the toolkit into `/wordpress/wp-content/php-toolkit/` inside the
+Playground runtime. Snippets then `require '/wordpress/wp-content/php-toolkit/vendor/autoload.php'`
+— exactly what real consumers of the library do.
+
+## Local preview
+
+```sh
+python3 bin/serve-docs.py     # http://localhost:8787
+```
+
+`serve-docs.py` adds `Access-Control-Allow-Origin: *` so the cross-origin
+Playground iframe can fetch the bundle. GitHub Pages serves that header
+automatically, so no separate runtime is needed in production.
+
+## Rebuilding
+
+After any change to `components/` or `bin/build-docs.py`:
+
+```sh
+bin/build-docs-bundle.sh
+```
+
+This runs `composer install --no-dev --optimize-autoloader`, bundles the result
+into `docs/assets/php-toolkit.zip`, and regenerates `docs/<component>/index.html`
+for every component.
+
+The CI workflow (`docs.yml`) does the same on every push to `trunk` and
+deploys to Pages.
+
+## Editable snippets
+
+Editing is currently a shadow-DOM patch in `page.js`: the rendered `<code>`
+gets `contenteditable="plaintext-only"` and edits are pushed back into the
+component's internal `_code` field on `input`. Highlighting re-runs on `blur`.
+
+Cleanest fix: an `editable` attribute on `<php-snippet>` itself in
+WordPress/wordpress-playground. Until that lands, the patch in `page.js` is
+the workaround.
diff --git a/docs/_legacy/blockparser/index.html b/docs/_legacy/blockparser/index.html
new file mode 100644
index 000000000..becbfd483
--- /dev/null
+++ b/docs/_legacy/blockparser/index.html
@@ -0,0 +1,300 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>BlockParser — PHP Toolkit</title>
+<meta name="description" content="WordPress core&#x27;s block parser, packaged as a standalone library. Turn block markup into a structured tree, lint posts for common authoring mistakes, and audit block usage — all without booting WordPress.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li class="current"><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>BlockParser</h1>
+		<p class="lede">WordPress core's block parser, packaged as a standalone library. Turn block markup into a structured tree, lint posts for common authoring mistakes, and audit block usage — all without booting WordPress.</p>
+		<code class="install">composer require wp-php-toolkit/blockparser</code>
+		<p>Block markup is not plain HTML. A post can contain HTML comments that identify blocks, JSON attributes inside those comments, freeform HTML between blocks, and nested blocks whose rendered HTML is interleaved with parent markup.</p><p>This component packages WordPress core's block parser so importers, linters, migration tools, and static analyzers can understand block content without loading WordPress. It deliberately mirrors core behavior, including <code>null</code> blocks for freeform HTML and core block names such as <code>core/paragraph</code>.</p><p>That fidelity to core is intentional. The project history includes removing toolkit-only behavior that was not present in WordPress core because even small mismatches can break importer and migration code that expects core parser semantics.</p><p>Reach for it when you need answers about the block tree: which blocks a post uses, which attributes they carry, where nested blocks appear, or whether content violates a rule your project cares about.</p>
+		<p>The parser turns serialized post content into the block array shape WordPress core returns. It does not render blocks, load <code>block.json</code>, or ask a registry whether a block exists.</p><p>Handle <code>blockName === null</code> first. A real post can contain a paragraph block, a custom block, and loose HTML before or after both.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Inspect the returned shape</li>
+			<li>Walk the tree</li>
+			<li>Ask editorial questions</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="what-you-get-back">What you get back</h2>
+		<p><code>WP_Block_Parser::parse()</code> returns an array of blocks. Each block is an associative array with five keys: <code>blockName</code>, <code>attrs</code>, <code>innerBlocks</code>, <code>innerHTML</code>, and <code>innerContent</code>.</p><p><code>innerHTML</code> is the HTML inside the block <em>with inner blocks stripped out</em>. <code>innerContent</code> is the interleaved version: an array of HTML strings with <code>null</code> placeholders marking where each inner block belongs.</p><p>Most code starts by checking <code>blockName</code>, then reading <code>attrs</code> or <code>innerHTML</code>. When a post has container blocks such as Group, Columns, or Navigation, look inside <code>innerBlocks</code> too.</p><p><strong>Footgun:</strong> freeform HTML between blocks shows up as a block with <code>blockName === null</code>. Always skip that case before comparing names.</p>
+		<h2 id="parse-a-document">Parse a document</h2>
+		<p>The simplest possible use. Pass a string, get back a tree.</p>
+<php-snippet blueprint="toolkit-setup" name="parse.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$document = "<!-- wp:heading {\"level\":2} -->\n<h2>Welcome</h2>\n<!-- /wp:heading -->\n\n"
+	. "<!-- wp:paragraph -->\n<p>Hello from the block editor.</p>\n<!-- /wp:paragraph -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+foreach ( $blocks as $block ) {
+	if ( null === $block['blockName'] ) {
+		continue;
+	}
+	echo $block['blockName'] . ': ' . trim( strip_tags( $block['innerHTML'] ) ) . "\n";
+}
+</script>
+<script type="text/expected-output">
+core/heading: Welcome
+core/paragraph: Hello from the block editor.
+</script>
+</php-snippet>
+		<h2 id="count-every-block-type-in-a-post">Count every block type in a post</h2>
+		<p>A common audit task: "How many Paragraph, Image, and Gallery blocks does this post use?" A small queue keeps the example readable while still visiting nested blocks.</p>
+<php-snippet blueprint="toolkit-setup" name="count-blocks.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$document = "<!-- wp:group --><div class=\"wp-block-group\">"
+	. "<!-- wp:heading --><h2>Title</h2><!-- /wp:heading -->"
+	. "<!-- wp:paragraph --><p>One.</p><!-- /wp:paragraph -->"
+	. "<!-- wp:paragraph --><p>Two.</p><!-- /wp:paragraph -->"
+	. "<!-- wp:image {\"id\":1} --><figure><img src=\"a.jpg\"/></figure><!-- /wp:image -->"
+	. "</div><!-- /wp:group -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+
+$counts = array();
+$queue  = $blocks;
+
+while ( ! empty( $queue ) ) {
+	$block = array_shift( $queue );
+
+	if ( null !== $block['blockName'] ) {
+		$name             = $block['blockName'];
+		$counts[ $name ] = isset( $counts[ $name ] ) ? $counts[ $name ] + 1 : 1;
+	}
+
+	foreach ( $block['innerBlocks'] as $inner_block ) {
+		$queue[] = $inner_block;
+	}
+}
+
+arsort( $counts );
+foreach ( $counts as $name => $n ) {
+	echo str_pad( (string) $n, 4, ' ', STR_PAD_LEFT ) . '  ' . $name . "\n";
+}
+</script>
+<script type="text/expected-output">
+   2  core/paragraph
+   1  core/group
+   1  core/heading
+   1  core/image
+</script>
+</php-snippet>
+		<h2 id="check-whether-a-post-uses-a-block">Check whether a post uses a block</h2>
+		<p>Useful for templates, audits, and migrations: answer one yes/no question without caring where the block appears in the tree.</p>
+<php-snippet blueprint="toolkit-setup" name="has-block.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$document = "<!-- wp:group --><div class=\"wp-block-group\">"
+	. "<!-- wp:buttons --><div class=\"wp-block-buttons\">"
+	. "<!-- wp:button --><div class=\"wp-block-button\"><a>Buy now</a></div><!-- /wp:button -->"
+	. "</div><!-- /wp:buttons -->"
+	. "</div><!-- /wp:group -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+
+// Breadth-first search: reports whether any block in the tree is named $name.
+function post_has_block( $blocks, $name ) {
+	$pending = $blocks;
+	while ( ! empty( $pending ) ) {
+		$current = array_shift( $pending );
+		if ( $name === $current['blockName'] ) {
+			return true;
+		}
+		// Queue the children so nested blocks are examined as well.
+		foreach ( $current['innerBlocks'] as $child ) {
+			$pending[] = $child;
+		}
+	}
+
+	return false;
+}
+
+echo post_has_block( $blocks, 'core/button' ) ? "has button\n" : "missing button\n";
+echo post_has_block( $blocks, 'core/gallery' ) ? "has gallery\n" : "missing gallery\n";
+</script>
+<script type="text/expected-output">
+has button
+missing gallery
+</script>
+</php-snippet>
+		<h2 id="lint-headings-for-hierarchy-mistakes">Lint headings for hierarchy mistakes</h2>
+		<p>"Don't skip from H2 to H4" is a real accessibility rule. The helper below keeps headings in document order, including headings nested inside Group, Column, and Cover blocks.</p>
+<php-snippet blueprint="toolkit-setup" name="lint-headings.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$document = "<!-- wp:heading -->\n<h2>Intro</h2>\n<!-- /wp:heading -->"
+	. "<!-- wp:heading {\"level\":4} -->\n<h4>Subsection</h4>\n<!-- /wp:heading -->"
+	. "<!-- wp:heading {\"level\":3} -->\n<h3>Body</h3>\n<!-- /wp:heading -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+
+// Depth-first walk: appends each heading's level and text to $headings in document order.
+function collect_headings( $blocks, &$headings ) {
+	foreach ( $blocks as $node ) {
+		if ( 'core/heading' === $node['blockName'] ) {
+			// A heading without a "level" attribute is treated as H2, like the first sample heading.
+			$level      = isset( $node['attrs']['level'] ) ? (int) $node['attrs']['level'] : 2;
+			$text       = trim( strip_tags( $node['innerHTML'] ) );
+			$headings[] = array( 'level' => $level, 'text' => $text );
+		}
+		collect_headings( $node['innerBlocks'], $headings );
+	}
+}
+
+$headings = array();
+collect_headings( $blocks, $headings );
+
+$last = 1;
+foreach ( $headings as $heading ) {
+	$level = $heading['level'];
+	$label = $heading['text'];
+
+	if ( $level > $last + 1 ) {
+		echo "WARN {$label}: jumped from H{$last} to H{$level}\n";
+	} else {
+		echo "ok   {$label}: H{$level}\n";
+	}
+	$last = $level;
+}
+</script>
+<script type="text/expected-output">
+ok   Intro: H2
+WARN Subsection: jumped from H2 to H4
+ok   Body: H3
+</script>
+</php-snippet>
+		<h2 id="find-all-instances-of-a-custom-block">Find all instances of a custom block</h2>
+		<p>When auditing an export for a block your plugin owns, collect every match and print the fields a human cares about.</p>
+<php-snippet blueprint="toolkit-setup" name="find-custom-block.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$document = "<!-- wp:paragraph --><p>Reviews</p><!-- /wp:paragraph -->"
+	. "<!-- wp:my-plugin/testimonial {\"author\":\"Jane\",\"rating\":5} -->"
+	. "<blockquote>Loved it.</blockquote>"
+	. "<!-- /wp:my-plugin/testimonial -->"
+	. "<!-- wp:my-plugin/testimonial {\"author\":\"Joe\",\"rating\":4} -->"
+	. "<blockquote>Pretty good.</blockquote>"
+	. "<!-- /wp:my-plugin/testimonial -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+
+// Depth-first search: appends every block named $name to $matches, parents before children.
+function find_blocks_by_name( $blocks, $name, &$matches ) {
+	foreach ( $blocks as $candidate ) {
+		if ( $name === $candidate['blockName'] ) {
+			$matches[] = $candidate;
+		}
+		find_blocks_by_name( $candidate['innerBlocks'], $name, $matches );
+	}
+}
+
+$testimonials = array();
+find_blocks_by_name( $blocks, 'my-plugin/testimonial', $testimonials );
+
+foreach ( $testimonials as $i => $b ) {
+	echo ( $i + 1 ) . '. ' . $b['attrs']['author'] . ' (' . $b['attrs']['rating'] . '/5): '
+		. trim( strip_tags( $b['innerHTML'] ) ) . "\n";
+}
+</script>
+<script type="text/expected-output">
+1. Jane (5/5): Loved it.
+2. Joe (4/5): Pretty good.
+</script>
+</php-snippet>
+		<h2 id="detect-blocks-with-stale-embed-urls">Detect blocks with stale embed URLs</h2>
+		<p>A real-world content audit: find every <code>core/embed</code> whose URL points at a domain you have retired.</p>
+<php-snippet blueprint="toolkit-setup" name="audit-embeds.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$document = '<!-- wp:embed {"url":"https://twitter.com/wordpress/status/1","providerNameSlug":"twitter"} /-->'
+	. '<!-- wp:embed {"url":"https://youtube.com/watch?v=abc","providerNameSlug":"youtube"} /-->'
+	. '<!-- wp:embed {"url":"https://vine.co/v/xyz","providerNameSlug":"vine"} /-->';
+
+$retired = array( 'vine.co', 'plus.google.com' );
+
+foreach ( ( new WP_Block_Parser() )->parse( $document ) as $b ) {
+	if ( 'core/embed' !== $b['blockName'] ) {
+		continue;
+	}
+	$url  = isset( $b['attrs']['url'] ) ? $b['attrs']['url'] : '';
+	$host = parse_url( $url, PHP_URL_HOST );
+	$bad  = $host && in_array( $host, $retired, true );
+	echo ( $bad ? 'STALE  ' : 'ok     ' ) . $url . "\n";
+}
+</script>
+<script type="text/expected-output">
+ok     https://twitter.com/wordpress/status/1
+ok     https://youtube.com/watch?v=abc
+STALE  https://vine.co/v/xyz
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../html/">HTML</a><span>Inspect or rewrite the HTML carried by parsed blocks.</span></li>
+			<li><a href="../markdown/">Markdown</a><span>Move between author-friendly Markdown and serialized block markup.</span></li>
+			<li><a href="../dataliberation/">DataLiberation</a><span>Audit and transform blocks while migrating content.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/blueprints/index.html b/docs/_legacy/blueprints/index.html
new file mode 100644
index 000000000..7f20475ec
--- /dev/null
+++ b/docs/_legacy/blueprints/index.html
@@ -0,0 +1,228 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Blueprints — PHP Toolkit</title>
+<meta name="description" content="Declarative WordPress site provisioning. Write a JSON description of plugins, options, and content; let the runner execute it.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li class="current"><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>Blueprints</h1>
+		<p class="lede">Declarative WordPress site provisioning. Write a JSON description of plugins, options, and content; let the runner execute it.</p>
+		<code class="install">composer require wp-php-toolkit/blueprints</code>
+		<p>A WordPress environment is more than a database dump. It can require a specific core version, plugins, themes, site options, uploaded files, content, and setup steps. Rebuilding that by hand makes demos, tests, bug reports, workshops, and CI fixtures drift over time.</p><p>The Blueprints component treats site setup as data. A blueprint JSON document describes the desired steps, and the runner applies them to either a new WordPress install or an existing one. The validator exists because user-authored JSON needs clear, path-specific errors rather than generic schema failures.</p><p>Recent design work also reflects real hosting layouts: the web root and WordPress core directory can live in separate directories, so runner configuration makes those paths explicit instead of assuming one common directory shape.</p><p>Blueprints can <em>create</em> a new WordPress install (download core, set up the database, apply steps) or <em>apply to an existing</em> site. Creating a fresh site needs filesystem access this in-browser runtime doesn't have, so the snippets focus on <code>APPLY_TO_EXISTING_SITE</code>.</p>
+		<p>A Blueprint is a versioned recipe for a WordPress site. It can install Gutenberg, set permalink structure, import content, copy files, and run WP-CLI steps in a predictable order.</p><p>The runner supplies the environment: site root, site URL, execution mode, and filesystem access. The validator checks user-authored JSON before the runner mutates the target site.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Configure the target</li>
+			<li>Generate repeatable recipes</li>
+			<li>Validate before running</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="configure-a-runner-for-an-existing-site">Configure a runner for an existing site</h2>
+		<p><code>RunnerConfiguration</code> is a fluent builder. The minimum: target site root, target site URL, execution mode.</p>
+<php-snippet blueprint="toolkit-setup" name="configure.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Blueprints\Runner;
+use WordPress\Blueprints\RunnerConfiguration;
+
+$config = ( new RunnerConfiguration() )
+	->set_execution_mode( Runner::EXECUTION_MODE_APPLY_TO_EXISTING_SITE )
+	->set_target_site_root( '/wordpress' )
+	->set_target_site_url( 'http://playground.test/' );
+
+echo "mode: " . $config->get_execution_mode() . "\n";
+echo "root: " . $config->get_target_site_root() . "\n";
+echo "url:  " . $config->get_target_site_url() . "\n";
+</script>
+<script type="text/expected-output">
+mode: apply-to-existing-site
+root: /wordpress
+url:  http://playground.test/
+</script>
+</php-snippet>
+		<h2 id="generate-blueprint-json-from-php">Generate blueprint JSON from PHP</h2>
+		<p>CI jobs and tests stay clearer when PHP builds the blueprint from data instead of hand-writing JSON. Keep the structure plain: <code>version</code>, then a list of step arrays.</p>
+<php-snippet blueprint="toolkit-setup" name="build-json.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$site_name = 'Demo Site';
+$plugins   = array( 'gutenberg', 'classic-editor' );
+
+$blueprint = array(
+	'version' => 2,
+	'steps'   => array(
+		array(
+			'step'    => 'setSiteOptions',
+			'options' => array(
+				'blogname'              => $site_name,
+				'permalink_structure'   => '/%postname%/',
+				'show_on_front'         => 'page',
+			),
+		),
+	),
+);
+
+foreach ( $plugins as $slug ) {
+	$blueprint['steps'][] = array(
+		'step'       => 'installPlugin',
+		'pluginData' => "https://downloads.wordpress.org/plugin/{$slug}.zip",
+	);
+	$blueprint['steps'][] = array(
+		'step'   => 'activatePlugin',
+		'plugin' => "{$slug}/{$slug}.php",
+	);
+}
+
+echo json_encode( $blueprint, JSON_PRETTY_PRINT | JSON_UNESCAPED_SLASHES ) . "\n";
+</script>
+<script type="text/expected-output">
+{
+    "version": 2,
+    "steps": [
+        {
+            "step": "setSiteOptions",
+            "options": {
+                "blogname": "Demo Site",
+                "permalink_structure": "/%postname%/",
+                "show_on_front": "page"
+            }
+        },
+        {
+            "step": "installPlugin",
+            "pluginData": "https://downloads.wordpress.org/plugin/gutenberg.zip"
+        },
+        {
+            "step": "activatePlugin",
+            "plugin": "gutenberg/gutenberg.php"
+        },
+        {
+            "step": "installPlugin",
+            "pluginData": "https://downloads.wordpress.org/plugin/classic-editor.zip"
+        },
+        {
+            "step": "activatePlugin",
+            "plugin": "classic-editor/classic-editor.php"
+        }
+    ]
+}
+</script>
+</php-snippet>
+		<h2 id="validate-before-running">Validate before running</h2>
+		<p>The schema validator returns a human-readable <code>ValidationError</code> instead of a generic "does not match schema" failure. Use it before handing user-authored JSON to a runner.</p>
+<php-snippet blueprint="toolkit-setup" name="validate.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Blueprints\Validator\HumanFriendlySchemaValidator;
+
+$schema = array(
+	'type'       => 'object',
+	'required'   => array( 'version', 'steps' ),
+	'properties' => array(
+		'version' => array( 'type' => 'integer' ),
+		'steps'   => array(
+			'type'  => 'array',
+			'items' => array(
+				'type'       => 'object',
+				'required'   => array( 'step' ),
+				'properties' => array(
+					'step' => array( 'type' => 'string' ),
+				),
+			),
+		),
+	),
+);
+
+$blueprint = array(
+	'version' => 2,
+	'steps'   => array(
+		array( 'pluginData' => 'https://downloads.wordpress.org/plugin/gutenberg.zip' ),
+	),
+);
+
+$error = ( new HumanFriendlySchemaValidator( $schema ) )->validate( $blueprint );
+if ( null === $error ) {
+	echo "valid\n";
+} else {
+	echo $error->get_pretty_path() . ": " . $error->message . "\n";
+}
+</script>
+<script type="text/expected-output">
+Blueprint root["steps"][0]: Missing required field: step.
+</script>
+</php-snippet>
+		<h2 id="the-blueprint-json-shape">The Blueprint JSON shape</h2>
+		<p>A blueprint is a JSON document with a <code>version</code> field and a <code>steps</code> array. Each step has a <code>"step"</code> discriminator and step-specific fields. This is the same shape used by <a href="https://playground.wordpress.net/">WordPress Playground</a>.</p><pre><code>{
+  "version": 2,
+  "steps": [
+    { "step": "setSiteOptions",
+      "options": {
+        "blogname": "Demo Site",
+        "permalink_structure": "/%postname%/"
+      } },
+    { "step": "installPlugin",
+      "pluginData": "https://downloads.wordpress.org/plugin/gutenberg.zip" },
+    { "step": "activatePlugin",
+      "plugin": "gutenberg/gutenberg.php" }
+  ]
+}</code></pre>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../filesystem/">Filesystem</a><span>Prepare files and fixtures before applying site setup steps.</span></li>
+			<li><a href="../httpclient/">HttpClient</a><span>Download packages or source data as part of provisioning workflows.</span></li>
+			<li><a href="../cli/">CLI</a><span>Wrap repeatable blueprint operations in a small command.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/bytestream/index.html b/docs/_legacy/bytestream/index.html
new file mode 100644
index 000000000..ae5166238
--- /dev/null
+++ b/docs/_legacy/bytestream/index.html
@@ -0,0 +1,223 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>ByteStream — PHP Toolkit</title>
+<meta name="description" content="Composable streaming primitives for reading, writing, transforming, hashing, and compressing byte data. Pull/peek/consume semantics let parsers backtrack without copying, and deflate, inflate, and checksum filters snap together like Lego.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li class="current"><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>ByteStream</h1>
+		<p class="lede">Composable streaming primitives for reading, writing, transforming, hashing, and compressing byte data. Pull/peek/consume semantics let parsers backtrack without copying, and deflate, inflate, and checksum filters snap together like Lego.</p>
+		<code class="install">composer require wp-php-toolkit/bytestream</code>
+		<p>PHP's native streams are powerful but inconsistent. <code>fread</code> on a socket may return short reads with no warning; <code>stream_filter_append</code> is awkward to compose; gzip helpers and file handles expose different APIs. The ByteStream component normalizes these behind one small interface — <code>pull / peek / consume</code> — so a parser, a hash function, and a deflate filter all see the same shape.</p><p>The split between <em>pull</em> (buffer up to N bytes) and <em>consume</em> (advance past N bytes) is the secret. Parsers can <code>peek</code> ahead to detect a record boundary and decide whether to <code>consume</code>, without copying or allocating.</p>
+		<p>A read stream separates three actions: pull bytes, inspect the buffer, then consume the bytes you accepted. That pattern lets a parser wait for a full line, a ZIP decoder wait for a complete header, or an HTTP client report progress without losing data.</p><p>Write streams make the destination boring. The caller writes chunks; the sink decides whether those bytes go to memory, a file, a compressor, or another component.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Read in chunks</li>
+			<li>Handle awkward boundaries</li>
+			<li>Add behavior around bytes</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="read-a-file-in-chunks">Read a file in chunks</h2>
+		<p>The canonical loop. <code>pull()</code> tells you how many bytes are buffered; <code>consume()</code> reads them and advances. The buffer never grows beyond the chunk size you ask for.</p>
+<php-snippet blueprint="toolkit-setup" name="teaser-read.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\ReadStream\FileReadStream;
+
+$path = tempnam( sys_get_temp_dir(), 'demo' ); // Throwaway fixture file, removed again below.
+file_put_contents( $path, str_repeat( "log line\n", 200 ) ); // 200 lines x 9 bytes = 1800 bytes.
+$reader = FileReadStream::from_path( $path );
+$total = 0;
+while ( ! $reader->reached_end_of_data() ) {
+	$n = $reader->pull( 256 );
+	if ( 0 === $n ) break;
+	$total += strlen( $reader->consume( $n ) );
+}
+$reader->close_reading();
+unlink( $path ); // tempnam() creates a real file; delete it so repeated runs do not leave fixtures behind.
+echo "Read {$total} bytes in 256-byte chunks.\n";
+</script>
+<script type="text/expected-output">
+Read 1800 bytes in 256-byte chunks.
+</script>
+</php-snippet>
+		<h2 id="memorypipe-as-write-then-read-buffer">MemoryPipe as write-then-read buffer</h2>
+		<p><code>MemoryPipe</code> is bidirectional: you <code>append_bytes()</code> as a writer and <code>pull/consume</code> as a reader. Easiest way to wire one component's output into another's input.</p><p>Gotcha: a producer must call <code>close_writing()</code> when done — otherwise the consumer eventually throws <code>NotEnoughDataException</code> instead of seeing EOF.</p>
+<php-snippet blueprint="toolkit-setup" name="memory-pipe.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+
+$pipe = new MemoryPipe();
+$pipe->append_bytes( "first chunk\n" );
+$pipe->append_bytes( "second chunk\n" );
+$pipe->append_bytes( "third chunk\n" );
+$pipe->close_writing();
+
+while ( ! $pipe->reached_end_of_data() ) {
+	$n = $pipe->pull( 1024 );
+	if ( 0 === $n ) break;
+	echo "got: " . $pipe->consume( $n );
+}
+</script>
+<script type="text/expected-output">
+got: first chunk
+second chunk
+third chunk
+</script>
+</php-snippet>
+		<h2 id="compress-on-the-way-in-decompress-on-the-way-out">Compress on the way in, decompress on the way out</h2>
+		<p>Wrap a stream in <code>DeflateReadStream</code> to get compressed bytes out; wrap it in <code>InflateReadStream</code> to get decompressed bytes out. Both are full <code>ByteReadStream</code> implementations, so they nest into anything else that takes a stream.</p>
+<php-snippet blueprint="toolkit-setup" name="deflate-roundtrip.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\DeflateReadStream;
+use WordPress\ByteStream\ReadStream\InflateReadStream;
+
+$original = str_repeat( "the quick brown fox. ", 50 );
+
+$src        = new MemoryPipe( $original );
+$src->close_writing();
+$deflated   = new DeflateReadStream( $src, ZLIB_ENCODING_DEFLATE );
+$compressed = $deflated->consume_all();
+
+$src2     = new MemoryPipe( $compressed );
+$src2->close_writing();
+$inflated = new InflateReadStream( $src2, ZLIB_ENCODING_DEFLATE );
+$round    = $inflated->consume_all();
+
+printf( "original  : %d bytes\n", strlen( $original ) );
+printf( "deflated  : %d bytes (%.1f%%)\n", strlen( $compressed ), 100 * strlen( $compressed ) / strlen( $original ) );
+printf( "round-trip: %s\n", $round === $original ? 'OK' : 'BROKEN' );
+</script>
+<script type="text/expected-output">
+original  : 1050 bytes
+deflated  : 45 bytes (4.3%)
+round-trip: OK
+</script>
+</php-snippet>
+		<h2 id="line-by-line-reads-from-a-chunked-source">Line-by-line reads from a chunked source</h2>
+		<p>Reading text by line means handling chunk boundaries that fall mid-line. Keep the trailing partial line and prepend it to the next pull. The rest of the loop pretends the data was always whole.</p>
+<php-snippet blueprint="toolkit-setup" name="lines.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+
+$pipe = new MemoryPipe();
+$pipe->append_bytes( "alpha\nbravo\ncharl" );
+$pipe->append_bytes( "ie\ndelta\necho\n" );
+$pipe->close_writing();
+
+$tail = '';
+$count = 0;
+while ( ! $pipe->reached_end_of_data() ) {
+	$n = $pipe->pull( 8 );
+	if ( 0 === $n ) break;
+	$buf   = $tail . $pipe->consume( $n );
+	$lines = explode( "\n", $buf );
+	$tail  = array_pop( $lines );
+	foreach ( $lines as $line ) {
+		printf( "[%d] %s\n", ++$count, $line );
+	}
+}
+if ( '' !== $tail ) {
+	printf( "[%d] %s\n", ++$count, $tail );
+}
+</script>
+<script type="text/expected-output">
+[1] alpha
+[2] bravo
+[3] charlie
+[4] delta
+[5] echo
+</script>
+</php-snippet>
+		<h2 id="limit-a-stream-to-a-fixed-window">Limit a stream to a fixed window</h2>
+		<p><code>LimitedByteReadStream</code> exposes only the next N bytes of an underlying stream as if those were the entire stream. This is how the ZIP decoder hands you the body of one entry without letting you read into the next.</p>
+<php-snippet blueprint="toolkit-setup" name="limited.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\LimitedByteReadStream;
+
+$source = new MemoryPipe( "HEADER:42|BODY:hello there|FOOTER:done" );
+$source->close_writing();
+
+$source->pull( 10 );
+$source->consume( 10 );
+
+$body = new LimitedByteReadStream( $source, 16 );
+echo "body sees: " . $body->consume_all() . "\n";
+echo "remaining in source: " . $source->consume_all() . "\n";
+</script>
+<script type="text/expected-output">
+body sees: BODY:hello there
+remaining in source: |FOOTER:done
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../filesystem/">Filesystem</a><span>Back file reads and writes with the same stream primitives.</span></li>
+			<li><a href="../zip/">Zip</a><span>Read and write archive entries one stream at a time.</span></li>
+			<li><a href="../httpclient/">HttpClient</a><span>Process request and response bodies incrementally.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/cli/index.html b/docs/_legacy/cli/index.html
new file mode 100644
index 000000000..5d02e9fc3
--- /dev/null
+++ b/docs/_legacy/cli/index.html
@@ -0,0 +1,256 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>CLI — PHP Toolkit</title>
+<meta name="description" content="POSIX-style argument parser. Long options, short bundles, inline values, positional args — one static call.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li class="current"><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>CLI</h1>
+		<p class="lede">POSIX-style argument parser. Long options, short bundles, inline values, positional args — one static call.</p>
+		<code class="install">composer require wp-php-toolkit/cli</code>
+		<p>Real CLI tools in PHP usually mean either pulling in <code>symfony/console</code> (and 30+ transitive packages) or hand-rolling argv parsing that breaks the first time someone writes <code>-vvv</code> or <code>--port=8080</code>. The toolkit's <code>CLI</code> class is one static method, no dependencies, and handles the POSIX shapes you actually see.</p>
+		<p>Define the command-line contract once, then parse <code>argv</code> against it. The parser returns positional arguments and named options; your application validates them and runs the command.</p><p>A command such as <code>toolkit import posts/launch.md --site=demo --dry-run -vv</code> should not need a console framework just to understand flags, values, and positionals.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Parse the smallest command</li>
+			<li>Accept normal shell shapes</li>
+			<li>Build command behavior</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="parse-a-single-flag">Parse a single flag</h2>
+		<p>The smallest useful invocation: one boolean flag, one positional. Each option is a four-tuple of <code>[ short, has_value, default, description ]</code>.</p>
+<php-snippet blueprint="toolkit-setup" name="parse-flag.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\CLI\CLI;
+
+$option_defs = array(
+	'verbose' => array( 'v', false, false, 'Enable verbose output' ),
+);
+
+list( $positionals, $options ) = CLI::parse_command_args_and_options(
+	array( '-v', 'input.txt' ),
+	$option_defs
+);
+
+echo "verbose: " . ( $options['verbose'] ? 'yes' : 'no' ) . "\n";
+echo "input:   " . $positionals[0] . "\n";
+</script>
+<script type="text/expected-output">
+verbose: yes
+input:   input.txt
+</script>
+</php-snippet>
+		<h2 id="mix-values-flags-and-bundles">Mix values, flags, and bundles</h2>
+		<p>The parser accepts <code>--port 8080</code>, <code>--port=8080</code>, <code>-p 8080</code>, and <code>-p=8080</code>. It also expands bundled boolean shorts such as <code>-afv</code>.</p>
+<php-snippet blueprint="toolkit-setup" name="mix-shapes.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\CLI\CLI;
+
+$option_defs = array(
+	'all'     => array( 'a', false, false, 'Process everything' ),
+	'force'   => array( 'f', false, false, 'Overwrite existing files' ),
+	'verbose' => array( 'v', false, false, 'Verbose output' ),
+	'output'  => array( 'o', true,  null,  'Output path' ),
+	'port'    => array( 'p', true,  '3000', 'Server port' ),
+);
+
+$argv = array( '-afv', '--port=8080', '-o', '/tmp/result.txt', 'input.json' );
+list( $positionals, $options ) = CLI::parse_command_args_and_options( $argv, $option_defs );
+
+echo "input:   " . $positionals[0] . "\n";
+echo "flags:   " . implode( ', ', array_keys( array_filter( array(
+	'all'     => $options['all'],
+	'force'   => $options['force'],
+	'verbose' => $options['verbose'],
+) ) ) ) . "\n";
+echo "output:  " . $options['output'] . "\n";
+echo "port:    " . $options['port'] . "\n";
+</script>
+<script type="text/expected-output">
+input:   input.json
+flags:   all, force, verbose
+output:  /tmp/result.txt
+port:    8080
+</script>
+</php-snippet>
+		<h2 id="validate-required-options">Validate required options</h2>
+		<p>The parser fills in defaults but never enforces "required". Check for <code>null</code> after parsing; that leaves you in full control of the error message.</p>
+<php-snippet blueprint="toolkit-setup" name="require-options.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\CLI\CLI;
+
+$option_defs = array(
+	'site-url'  => array( 'u', true, null, 'Public site URL (required)' ),
+	'site-path' => array( null, true, null, 'Target directory (required)' ),
+);
+
+$argv = array( '--site-url', 'https://mysite.test' );
+
+try {
+	list( , $options ) = CLI::parse_command_args_and_options( $argv, $option_defs );
+	foreach ( array( 'site-url', 'site-path' ) as $name ) {
+		if ( null === $options[ $name ] ) {
+			throw new RuntimeException( "Missing required option --{$name}" );
+		}
+	}
+	echo "All good.\n";
+} catch ( Exception $e ) {
+	echo "error: " . $e->getMessage() . "\n";
+}
+</script>
+<script type="text/expected-output">
+error: Missing required option --site-path
+</script>
+</php-snippet>
+		<h2 id="generate---help-from-definitions">Generate --help from definitions</h2>
+		<p>Because each option carries its own description, you can render help text by walking the same definitions you parse with. No second source of truth.</p>
+<php-snippet blueprint="toolkit-setup" name="help-text.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\CLI\CLI;
+
+$option_defs = array(
+	'output'  => array( 'o', true,  null,  'Write result to FILE' ),
+	'force'   => array( 'f', false, false, 'Overwrite existing files' ),
+	'verbose' => array( 'v', false, false, 'Verbose output' ),
+	'help'    => array( 'h', false, false, 'Show this help and exit' ),
+);
+
+/**
+ * Prints a usage banner followed by one aligned line per option definition.
+ *
+ * @param array $defs Map of long option name => array( short, has_value, default, description ).
+ */
+function render_help( array $defs ) {
+	echo "Usage: mytool [options] <input>\n\nOptions:\n";
+	foreach ( $defs as $long => $def ) {
+		$short     = $def[0];
+		$has_value = $def[1];
+		$desc      = $def[3];
+
+		// Options without a short alias get four spaces so the long names still line up.
+		$prefix = $short ? "-{$short}, " : '    ';
+		// Value-taking options advertise the =VALUE form.
+		$suffix = $has_value ? '=VALUE' : '';
+
+		printf( "  %-28s %s\n", $prefix . "--{$long}" . $suffix, $desc );
+	}
+}
+
+list( , $options ) = CLI::parse_command_args_and_options( array( '-h' ), $option_defs );
+if ( $options['help'] ) render_help( $option_defs );
+</script>
+<script type="text/expected-output">
+Usage: mytool [options] <input>
+
+Options:
+  -o, --output=VALUE           Write result to FILE
+  -f, --force                  Overwrite existing files
+  -v, --verbose                Verbose output
+  -h, --help                   Show this help and exit
+</script>
+</php-snippet>
+		<h2 id="git-style-subcommands">Git-style subcommands</h2>
+		<p>To build a tool with subcommands like <code>mytool deploy</code>, peel the first positional off <code>argv</code>, dispatch, and parse the rest with a per-command option set.</p>
+<php-snippet blueprint="toolkit-setup" name="subcommands.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\CLI\CLI;
+
+$commands = array(
+	'deploy' => array(
+		'env'     => array( 'e', true, 'staging', 'Target environment' ),
+		'dry-run' => array( 'n', false, false, 'Preview without applying' ),
+	),
+	'rollback' => array(
+		'to' => array( 't', true, null, 'Revision to roll back to' ),
+	),
+);
+
+/**
+ * Dispatches a subcommand: the first argv entry picks the option set, the rest is parsed with it.
+ *
+ * @param array $argv     Arguments, starting with the subcommand name.
+ * @param array $commands Map of subcommand name => option definitions for that subcommand.
+ */
+function run( array $argv, array $commands ) {
+	// Nothing to dispatch: list the known subcommands instead.
+	if ( 0 === count( $argv ) ) {
+		$known = implode( ', ', array_keys( $commands ) );
+		echo "Usage: mytool <command> [options]\nCommands: " . $known . "\n";
+		return;
+	}
+
+	// Peel the subcommand off the front; whatever remains belongs to that subcommand.
+	$command = array_shift( $argv );
+	if ( ! isset( $commands[ $command ] ) ) {
+		echo "Unknown command: {$command}\n";
+		return;
+	}
+
+	$parsed      = CLI::parse_command_args_and_options( $argv, $commands[ $command ] );
+	$positionals = $parsed[0];
+	$options     = $parsed[1];
+
+	echo "command={$command}\n";
+	echo "options: " . json_encode( $options ) . "\n";
+	echo "positionals: " . json_encode( $positionals ) . "\n";
+}
+
+run( array( 'deploy', '--env=production', '-n', 'web-01', 'web-02' ), $commands );
+echo "---\n";
+run( array( 'rollback', '-t', 'abc123' ), $commands );
+</script>
+<script type="text/expected-output">
+command=deploy
+options: {"env":"production","dry-run":true}
+positionals: ["web-01","web-02"]
+---
+command=rollback
+options: {"to":"abc123"}
+positionals: []
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../filesystem/">Filesystem</a><span>Keep command behavior testable with in-memory storage.</span></li>
+			<li><a href="../blueprints/">Blueprints</a><span>Build repeatable site setup commands around parsed options.</span></li>
+			<li><a href="../httpserver/">HttpServer</a><span>Add a local web UI to a CLI workflow.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/coding-standards/index.html b/docs/_legacy/coding-standards/index.html
new file mode 100644
index 000000000..6fdae2c26
--- /dev/null
+++ b/docs/_legacy/coding-standards/index.html
@@ -0,0 +1,103 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>ToolkitCodingStandards — PHP Toolkit</title>
+<meta name="description" content="PHP_CodeSniffer sniffs used by this project: enforce Yoda comparisons and ban the short ternary where it hides falsy-value bugs.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li class="current"><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>ToolkitCodingStandards</h1>
+		<p class="lede">PHP_CodeSniffer sniffs used by this project: enforce Yoda comparisons and ban the short ternary where it hides falsy-value bugs.</p>
+		<code class="install">composer require wp-php-toolkit/toolkit-coding-standards</code>
+		<p>This package is not a general-purpose style guide. It holds project-specific PHP_CodeSniffer rules for review comments the toolkit wants automated: comparisons should follow the WordPress Yoda style, and short ternaries should not hide whether a fallback is meant for <code>null</code> only or for all falsy values.</p><p>Use it in this monorepo, or in a project that intentionally wants the same review tradeoffs. If your project does not follow WordPress-style comparisons, the Yoda sniff is probably the wrong rule for you.</p>
+		<p>Turn repeated review comments into PHPCS sniffs. If the project always rejects short ternaries or comparisons that are not written Yoda-style, the tool should report them before a reviewer does.</p><p>Keep each sniff narrow. A useful sniff names the risky pattern and shows the replacement code shape contributors should write.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Enable the ruleset</li>
+			<li>Read the rule as review guidance</li>
+			<li>Write the explicit form</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="reference-the-standard-from-your-phpcsxml">Reference the standard from your phpcs.xml</h2>
+		<p>The component is a PHPCS ruleset, so the useful examples are configuration and before/after code rather than runtime snippets. Activate both sniffs at once by referencing <code>WordPressToolkitCodingStandards</code>:</p><pre><code>&lt;?xml version="1.0"?&gt;
+&lt;ruleset name="My Project"&gt;
+  &lt;file&gt;src/&lt;/file&gt;
+
+  &lt;!-- Activate both toolkit sniffs --&gt;
+  &lt;rule ref="WordPressToolkitCodingStandards"/&gt;
+
+  &lt;!-- Or pick them individually --&gt;
+  &lt;!-- &lt;rule ref="WordPressToolkitCodingStandards.PHP.EnforceYodaComparison"/&gt; --&gt;
+  &lt;!-- &lt;rule ref="WordPressToolkitCodingStandards.PHP.DisallowShortTernary"/&gt; --&gt;
+&lt;/ruleset&gt;</code></pre><p>Then run phpcs and phpcbf the usual way:</p><pre><code>vendor/bin/phpcs --standard=phpcs.xml .
+vendor/bin/phpcbf --standard=phpcs.xml .</code></pre>
+		<h2 id="enforceyodacomparison-catches-accidental-assignment">EnforceYodaComparison: catches accidental assignment</h2>
+		<p>Yoda comparisons (<code>true === $x</code>) make typo-induced assignments easier to catch and match the WordPress style used throughout the toolkit:</p><pre><code>// Bug: single = inside a condition. Always truthy, mutates $status.
+if ( $status = 'published' ) {
+    publish_post( $post );
+}
+
+// Yoda style: writing this typo would be a parse error.
+if ( 'published' === $status ) {
+    publish_post( $post );
+}</code></pre><p>The sniff covers <code>===</code>, <code>!==</code>, <code>==</code>, and <code>!=</code>, and stays quiet when both sides are dynamic.</p>
+		<h2 id="why-ban-the-short-ternary">Why ban the short ternary</h2>
+		<p>Developers confuse the short ternary (<code>$a ?: $b</code>) with the null-coalescing operator (<code>$a ?? $b</code>). They differ on falsy-but-not-null values: <code>0 ?: 'fallback'</code> returns <code>'fallback'</code>, but <code>0 ?? 'fallback'</code> returns <code>0</code>. The sniff bans <code>?:</code> entirely so reviewers don't have to relitigate this on every PR.</p>
+		<h2 id="review-friendly-replacements">Review-friendly replacements</h2>
+		<p>When the fallback should apply only to <code>null</code>, use <code>??</code>. When the fallback should apply to every falsy value, write the full ternary so the intent is visible in review.</p><pre><code>// Only missing values fall back. 0 and "" are preserved.
+$limit = $request_limit ?? 20;
+
+// Any falsy value falls back. The duplicated condition is intentional.
+$title = $raw_title ? $raw_title : 'Untitled';</code></pre>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../polyfill/">Polyfill</a><span>Share WordPress-style compatibility expectations across standalone packages.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/corsproxy/index.html b/docs/_legacy/corsproxy/index.html
new file mode 100644
index 000000000..33f03658c
--- /dev/null
+++ b/docs/_legacy/corsproxy/index.html
@@ -0,0 +1,182 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>CORSProxy — PHP Toolkit</title>
+<meta name="description" content="A small PHP CORS proxy intended for browser-side code that needs to reach servers without CORS headers.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li class="current"><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>CORSProxy</h1>
+		<p class="lede">A small PHP CORS proxy intended for browser-side code that needs to reach servers without CORS headers.</p>
+		<code class="install">composer require wp-php-toolkit/corsproxy</code>
+		<p>A Playground-style browser tool reads <code>https://api.github.com/repos/WordPress/php-toolkit</code>, a plugin ZIP from <code>downloads.wordpress.org</code>, or a raw fixture from GitHub. The browser blocks the response when the upstream server does not send the required CORS headers, even though PHP can fetch the same public URL server-side.</p><p>The CORSProxy component is that server-side bridge. It accepts a target URL, fetches it from PHP, and returns a browser-readable response. Because an open proxy is a security and abuse risk, real deployments should add host allowlists, rate limits, header controls, and private-network protections appropriate to their environment.</p>
+		<p>A browser app cannot read <code>https://api.github.com/repos/WordPress/php-toolkit</code> unless GitHub sends CORS headers the app can use. A PHP proxy can fetch that URL server-side and return a controlled browser-readable response.</p><p>Deploy the proxy as a gate, not as an open tunnel. Allow <code>api.github.com</code> and <code>raw.githubusercontent.com</code> for a docs tool; reject private IP ranges, unknown hosts, oversized responses, and credential-bearing request headers.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>See the proxy URL shape</li>
+			<li>Lock down deployment</li>
+			<li>Use it from the browser</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="run-the-proxy-locally">Run the proxy locally</h2>
+		<p class="callout"><strong>Run on your machine:</strong> the proxy needs to listen on a port. Start PHP's built-in server and request any HTTPS URL through it.</p><pre><code>PLAYGROUND_CORS_PROXY_DISABLE_RATE_LIMIT=1 \
+  php -S 127.0.0.1:5263 vendor/wp-php-toolkit/corsproxy/cors-proxy.php
+
+# In another terminal:
+curl -s "http://127.0.0.1:5263/cors-proxy.php/https://api.github.com/repos/WordPress/php-toolkit" | head
+</code></pre>
+		<h2 id="production-rate-limiting">Production rate limiting</h2>
+		<p>Drop a <code>cors-proxy-config.php</code> next to <code>cors-proxy.php</code>. The proxy refuses to boot without one — that is the point.</p><p>This example uses a per-IP sliding-window request log stored on disk: it keeps the timestamps of the last 60 seconds and allows 30 requests per window. Replace with Redis / memcached for multi-host deployments.</p>
+<php-snippet blueprint="toolkit-setup" name="cors-proxy-config.php" runnable="false">
+<script type="application/x-php">
+<?php
+// cors-proxy-config.php — placed next to cors-proxy.php.
+
+/**
+ * Rate-limits proxy requests per client IP with a sliding window kept on disk.
+ *
+ * Each client gets a JSON file in the system temp directory holding the Unix
+ * timestamps of its recent requests. Once $max_req timestamps fall inside the
+ * last $window seconds, the request is answered with HTTP 429 and the script
+ * exits. The log is read and rewritten under an exclusive lock so concurrent
+ * requests from the same IP cannot drop each other's entries or observe a
+ * half-written file.
+ */
+function playground_cors_proxy_maybe_rate_limit() {
+	$ip      = isset( $_SERVER['REMOTE_ADDR'] ) ? $_SERVER['REMOTE_ADDR'] : '0.0.0.0';
+	$bucket  = sys_get_temp_dir() . '/cors-rl-' . md5( $ip );
+	$now     = time();
+	$window  = 60; // Seconds covered by the sliding window.
+	$max_req = 30; // Requests allowed per IP inside one window.
+
+	// 'c+' opens for reading and writing, creates the file when missing, and
+	// never truncates, so the existing log is intact when the lock is acquired.
+	$handle = fopen( $bucket, 'c+' );
+	if ( false === $handle ) {
+		// Best effort: an unusable temp directory lets the request through
+		// instead of taking the proxy down.
+		return;
+	}
+	if ( ! flock( $handle, LOCK_EX ) ) {
+		fclose( $handle );
+		return;
+	}
+
+	// An empty or corrupt log decodes to a non-array and is treated as "no hits".
+	$hits = json_decode( (string) stream_get_contents( $handle ), true );
+	if ( ! is_array( $hits ) ) {
+		$hits = array();
+	}
+
+	// Keep only the timestamps that are still inside the window.
+	$hits = array_values(
+		array_filter(
+			$hits,
+			function ( $t ) use ( $now, $window ) {
+				return $t > $now - $window;
+			}
+		)
+	);
+
+	$limited = count( $hits ) >= $max_req;
+	if ( ! $limited ) {
+		// Record this request and replace the file contents in place.
+		$hits[] = $now;
+		rewind( $handle );
+		ftruncate( $handle, 0 );
+		fwrite( $handle, json_encode( $hits ) );
+		fflush( $handle );
+	}
+
+	// Release the lock before sending any response.
+	flock( $handle, LOCK_UN );
+	fclose( $handle );
+
+	if ( $limited ) {
+		header( 'Retry-After: ' . $window );
+		http_response_code( 429 );
+		echo 'Rate limit exceeded';
+		exit;
+	}
+}
+
+echo "Config loaded — rate limiter armed.\n";
+</script>
+</php-snippet>
+		<h2 id="allowlist-upstream-hosts">Allowlist upstream hosts</h2>
+		<p>Out of the box the proxy will fetch any public URL. Most real deployments want a fixed list of upstreams — GitHub, Packagist, wp.org.</p>
+<php-snippet blueprint="toolkit-setup" name="allowlist-config.php" runnable="false">
+<script type="application/x-php">
+<?php
+/**
+ * Rejects the request with HTTP 403 unless the target URL's host is on a fixed allowlist.
+ *
+ * The target is read from PATH_INFO, falling back to the query string, with
+ * leading slashes removed before the host is extracted.
+ */
+function playground_cors_proxy_maybe_rate_limit() {
+	$allowed_hosts = array(
+		'api.github.com',
+		'raw.githubusercontent.com',
+		'codeload.github.com',
+		'repo.packagist.org',
+		'downloads.wordpress.org',
+		'api.wordpress.org',
+	);
+
+	if ( isset( $_SERVER['PATH_INFO'] ) ) {
+		$raw_target = $_SERVER['PATH_INFO'];
+	} else {
+		$query      = isset( $_SERVER['QUERY_STRING'] ) ? $_SERVER['QUERY_STRING'] : '';
+		$raw_target = '/' . $query;
+	}
+
+	$upstream_host = parse_url( ltrim( $raw_target, '/' ), PHP_URL_HOST );
+
+	// Host comparison is case-insensitive; a missing or unparsable host never passes.
+	if ( $upstream_host && in_array( strtolower( $upstream_host ), $allowed_hosts, true ) ) {
+		return;
+	}
+
+	http_response_code( 403 );
+	header( 'Content-Type: text/plain' );
+	echo "Upstream not allowed: " . ( $upstream_host ? $upstream_host : '(none)' );
+	exit;
+}
+
+echo "Allowlist config active.\n";
+</script>
+</php-snippet>
+		<h2 id="browser-side-fetch-through-the-proxy">Browser-side fetch through the proxy</h2>
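+		<p>Once deployed, the client side is just <code>fetch()</code> with the proxy URL. Drop this into a <code>&lt;script type="module"&gt;</code> block on any HTML page; the top-level <code>await</code> at the end only works in module scripts.</p><pre><code>const PROXY = "https://cors.example.com/cors-proxy.php";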
+
+async function viaProxy(url, init = {}) {
+  const res = await fetch(`${PROXY}/${url}`, {
+    ...init,
+    headers: {
+      ...(init.headers || {}),
+      "X-Cors-Proxy-Allowed-Request-Headers": "Authorization",
+    },
+  });
+  if (!res.ok) throw new Error(`Proxy returned ${res.status}`);
+  return res;
+}
+
+const repo = await viaProxy("https://api.github.com/repos/WordPress/php-toolkit").then(r =&gt; r.json());
+console.log(repo.full_name, repo.stargazers_count);
+</code></pre>
+		<h2 id="deploy-behind-nginx">Deploy behind nginx</h2>
+		<p>The proxy is a single PHP script — any SAPI works. nginx + php-fpm is a common production setup. <code>PATH_INFO</code> is what the proxy reads to learn the target URL.</p><pre><code>server {
+  listen 443 ssl http2;
+  server_name cors.example.com;
+
+  root /var/www/cors-proxy;
+  index cors-proxy.php;
+
+  location ~ ^/cors-proxy\.php(/.*)?$ {
+    fastcgi_pass unix:/run/php/php8.1-fpm.sock;
+    fastcgi_split_path_info ^(.+\.php)(/.*)$;
+    fastcgi_param SCRIPT_FILENAME $document_root/cors-proxy.php;
+    fastcgi_param PATH_INFO $fastcgi_path_info;
+    include fastcgi_params;
+  }
+}
+</code></pre>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../httpclient/">HttpClient</a><span>Fetch upstream responses from PHP when browser CORS blocks direct access.</span></li>
+			<li><a href="../httpserver/">HttpServer</a><span>Understand the local-server shape before deploying a proxy endpoint.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/dataliberation/index.html b/docs/_legacy/dataliberation/index.html
new file mode 100644
index 000000000..328e56f12
--- /dev/null
+++ b/docs/_legacy/dataliberation/index.html
@@ -0,0 +1,299 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>DataLiberation — PHP Toolkit</title>
+<meta name="description" content="Streaming WordPress import/export. WXR, SQL, block markup — without loading whole datasets into memory.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li class="current"><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>DataLiberation</h1>
+		<p class="lede">Streaming WordPress import/export. WXR, SQL, block markup — without loading whole datasets into memory.</p>
+		<code class="install">composer require wp-php-toolkit/data-liberation</code>
+		<p>WordPress content should be portable, but real migrations cross several formats. A site export might arrive as WXR, a Markdown folder, or entities from another CMS. URLs can hide in block attributes, HTML, CSS, feeds, GUIDs, and post meta. Importers must also resume after a failed media download or upload.</p><p>The DataLiberation component streams WordPress-shaped data through readers, transformers, and writers. It models posts, terms, comments, attachments, and metadata as <code>ImportEntity</code> objects, then lets a pipeline rewrite each entity without loading the full export into memory.</p><p>The API reflects specific migration bugs: relative URLs in known block attributes, URLs inside inline CSS, self-closing block comments that must keep their shape, and origin-only URLs whose trailing slash style should not change during a rewrite.</p><p>Reach for it when the job combines formats: build WXR from another CMS, rewrite a staging export for production, frontload remote assets, or compose Markdown, XML, HTML, CSS, and URL rewriting into one pipeline.</p>
+		<p>Model a migration as a stream of WordPress-shaped entities. Read a post, rewrite its content and metadata, write it out, then move to the next entity.</p><p>The useful work happens between readers and writers: rewrite <code>https://staging.example.test</code> inside HTML, block attributes, CSS, GUIDs, and media URLs; download attachments; and keep enough state to resume after a failed request.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Write one entity</li>
+			<li>Transform as you stream</li>
+			<li>Compose a migration</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="write-a-wxr-file-in-five-lines">Write a WXR file in five lines</h2>
+		<p>Stream a single post into a WXR document via <code>WXRWriter</code>. The writer holds no buffer beyond what is needed to close currently-open tags, so memory stays flat regardless of input size.</p>
+<php-snippet blueprint="toolkit-setup" name="wxr-quickstart.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\DataLiberation\EntityWriter\WXRWriter;
+use WordPress\DataLiberation\ImportEntity;
+
+$post = new ImportEntity( 'post', array(
+	'post_title' => 'Hello',
+	'content'    => 'World.',
+	'post_id'    => '1',
+	'status'     => 'publish',
+) );
+$sink     = new MemoryPipe();
+$exporter = new WXRWriter( $sink ); // everything the writer emits lands in $sink
+$exporter->append_entity( $post );
+$exporter->finalize();
+$exporter->close_writing();
+$sink->close_writing();
+$document = $sink->consume_all();
+echo "bytes: " . strlen( $document ) . "\n";
+echo false === strpos( $document, '<title>Hello</title>' ) ? "title missing\n" : "title exported\n";
+echo false === strpos( $document, '<wp:status>publish</wp:status>' ) ? "status missing\n" : "status exported\n";
+</script>
+<script type="text/expected-output">
+bytes: 475
+title exported
+status exported
+</script>
+</php-snippet>
+		<h2 id="build-a-wxr-programmatically-from-any-source">Build a WXR programmatically from any source</h2>
+		<p>The writer doesn't care where entities come from. Loop over rows from a CMS, a CSV, or a Notion API dump and emit posts plus their meta and comments.</p>
+<php-snippet blueprint="toolkit-setup" name="build-wxr.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\DataLiberation\EntityWriter\WXRWriter;
+use WordPress\DataLiberation\ImportEntity;
+
+$records = array( // stand-in for rows fetched from any external source
+	array( 'id' => 10, 'title' => 'About', 'body' => '<p>About us.</p>', 'tags' => array( 'company' ) ),
+	array( 'id' => 11, 'title' => 'Blog',  'body' => '<p>Hello world.</p>', 'tags' => array( 'news', 'launch' ) ),
+);
+
+$sink     = new MemoryPipe();
+$exporter = new WXRWriter( $sink );
+
+foreach ( $records as $record ) {
+	$exporter->append_entity( new ImportEntity( 'post', array(
+		'post_id'    => (string) $record['id'],
+		'post_title' => $record['title'],
+		'content'    => $record['body'],
+		'status'     => 'publish',
+		'post_type'  => 'post',
+	) ) );
+	foreach ( $record['tags'] as $position => $slug ) {
+		$term = array(
+			'term_id'  => (string) ( $record['id'] * 100 + $position ), // derived from the post ID and tag position
+			'taxonomy' => 'post_tag',
+			'slug'     => $slug,
+			'parent'   => '0',
+		);
+		$exporter->append_entity( new ImportEntity( 'term', $term ) );
+	}
+}
+
+$exporter->finalize();
+$exporter->close_writing();
+$sink->close_writing();
+$document = $sink->consume_all();
+echo "items: " . substr_count( $document, '<item>' ) . "\n";
+echo "terms: " . substr_count( $document, '<wp:term>' ) . "\n";
+echo false === strpos( $document, '<title>Blog</title>' ) ? "Blog post missing\n" : "Blog post exported\n";
+</script>
+<script type="text/expected-output">
+items: 2
+terms: 3
+Blog post exported
+</script>
+</php-snippet>
+		<h2 id="read-entities-from-a-wxr-file-with-constant-memory">Read entities from a WXR file with constant memory</h2>
+		<p><code>WXREntityReader</code> emits one entity at a time. A 10 GB WXR uses the same memory as a 10 KB one.</p>
+<php-snippet blueprint="toolkit-setup" name="wxr-read.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\DataLiberation\EntityReader\WXREntityReader;
+
+$export_xml = <<<XML
+<?xml version="1.0" encoding="UTF-8" ?>
+<rss version="2.0" xmlns:wp="http://wordpress.org/export/1.2/" xmlns:content="http://purl.org/rss/1.0/modules/content/">
+<channel>
+<title>Demo</title>
+<item><title>First</title><wp:post_id>1</wp:post_id><wp:post_type>post</wp:post_type><content:encoded>Body 1</content:encoded></item>
+<item><title>Second</title><wp:post_id>2</wp:post_id><wp:post_type>post</wp:post_type><content:encoded>Body 2</content:encoded></item>
+</channel>
+</rss>
+XML;
+// Hand the reader the whole document, then mark the input as finished.
+$entities = WXREntityReader::create();
+$entities->append_bytes( $export_xml );
+$entities->input_finished();
+
+while ( $entities->next_entity() ) {
+	$current = $entities->get_entity();
+	echo $current->get_type(), ': ', json_encode( $current->get_data() ), "\n";
+}
+</script>
+<script type="text/expected-output">
+site_option: {"option_name":"blogname","option_value":"Demo"}
+post: {"post_title":"First","post_id":"1","post_type":"post","post_content":"Body 1"}
+post: {"post_title":"Second","post_id":"2","post_type":"post","post_content":"Body 2"}
+</script>
+</php-snippet>
+		<h2 id="streaming-transform-rewrite-urls-while-copying-wxr">Streaming transform: rewrite URLs while copying WXR</h2>
+		<p>Wire reader to writer to rewrite a WXR file on the fly. This pattern is how you migrate a staging export to production: swap <code>staging.example.com</code> for <code>example.com</code> without ever loading the file into memory.</p>
+<php-snippet blueprint="toolkit-setup" name="rewrite-urls.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\DataLiberation\EntityReader\WXREntityReader;
+use WordPress\DataLiberation\EntityWriter\WXRWriter;
+use WordPress\DataLiberation\ImportEntity;
+
+$staging_export = <<<XML
+<?xml version="1.0" encoding="UTF-8" ?>
+<rss version="2.0" xmlns:wp="http://wordpress.org/export/1.2/" xmlns:content="http://purl.org/rss/1.0/modules/content/">
+<channel>
+<item><title>Hello</title><wp:post_id>1</wp:post_id><wp:post_type>post</wp:post_type>
+<content:encoded>Visit https://staging.example.com/about for more.</content:encoded></item>
+</channel>
+</rss>
+XML;
+
+$source = WXREntityReader::create();
+$source->append_bytes( $staging_export );
+$source->input_finished();
+
+$sink     = new MemoryPipe();
+$exporter = new WXRWriter( $sink );
+
+while ( $source->next_entity() ) {
+	$current = $source->get_entity();
+	$fields  = $current->get_data();
+	$kind    = $current->get_type();
+	foreach ( array( 'post_content', 'content', 'description' ) as $key ) {
+		if ( isset( $fields[ $key ] ) ) {
+			$fields[ $key ] = str_replace( 'staging.example.com', 'example.com', $fields[ $key ] );
+		}
+	}
+	if ( 'post' === $kind ) {
+		$fields['content'] = $fields['post_content'] ?? $fields['content'] ?? ''; // the reader yields post_content; the writer is given content
+	}
+	$exporter->append_entity( new ImportEntity( $kind, $fields ) );
+}
+
+$exporter->finalize();
+$exporter->close_writing();
+$sink->close_writing();
+$document = $sink->consume_all();
+echo false === strpos( $document, 'https://example.com/about' ) ? "new URL missing\n" : "new URL present\n";
+echo false !== strpos( $document, 'staging.example.com' ) ? "old URL still present\n" : "old URL removed\n";
+</script>
+<script type="text/expected-output">
+new URL present
+old URL removed
+</script>
+</php-snippet>
+		<h2 id="render-markdown-into-a-wxr-import-in-one-pipeline">Render Markdown into a WXR import in one pipeline</h2>
+		<p>Compose <code>MarkdownConsumer</code> with <code>WXRWriter</code> to publish a folder of Markdown directly as a WordPress import file.</p>
+<php-snippet blueprint="toolkit-setup" name="md-to-wxr.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\DataLiberation\EntityWriter\WXRWriter;
+use WordPress\DataLiberation\ImportEntity;
+use WordPress\Markdown\MarkdownConsumer;
+
+@mkdir( '/tmp/md-src', 0777, true );
+file_put_contents( '/tmp/md-src/hello.md',  "---\ntitle: Hello\n---\n\n# Hello\n\nFirst post." );
+file_put_contents( '/tmp/md-src/second.md', "---\ntitle: Second\n---\n\nMore text **here**." );
+
+$sink     = new MemoryPipe();
+$exporter = new WXRWriter( $sink );
+
+foreach ( glob( '/tmp/md-src/*.md' ) as $index => $file ) {
+	$slug     = basename( $file, '.md' );
+	$markdown = new MarkdownConsumer( file_get_contents( $file ) );
+	$markdown->consume();
+	$exporter->append_entity( new ImportEntity( 'post', array(
+		'post_id'    => (string) ( $index + 1 ), // glob() keys are 0-based; IDs start at 1
+		'post_title' => $markdown->get_meta_value( 'title' ) ?: $slug,
+		'content'    => $markdown->get_block_markup(),
+		'status'     => 'publish',
+		'post_type'  => 'post',
+		'post_name'  => $slug,
+	) ) );
+}
+
+$exporter->finalize();
+$exporter->close_writing();
+$sink->close_writing();
+
+$document = $sink->consume_all();
+echo "posts: " . substr_count( $document, '<item>' ) . "\n";
+echo false === strpos( $document, '&lt;!-- wp:heading' ) ? "block markup missing\n" : "block markup exported\n";
+echo false === strpos( $document, '<title>Second</title>' ) ? "frontmatter title missing\n" : "frontmatter title exported\n";
+</script>
+<script type="text/expected-output">
+posts: 2
+block markup exported
+frontmatter title exported
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../markdown/">Markdown</a><span>Use Markdown as a source or destination format.</span></li>
+			<li><a href="../blockparser/">BlockParser</a><span>Analyze serialized blocks inside post content.</span></li>
+			<li><a href="../httpclient/">HttpClient</a><span>Download media and remote source data while importing.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/encoding/index.html b/docs/_legacy/encoding/index.html
new file mode 100644
index 000000000..1967292af
--- /dev/null
+++ b/docs/_legacy/encoding/index.html
@@ -0,0 +1,216 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Encoding — PHP Toolkit</title>
+<meta name="description" content="UTF-8 validation and scrubbing with a pure-PHP fallback when mbstring is unavailable. Detects malformed bytes and replaces them per the Unicode maximal-subpart algorithm.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li class="current"><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>Encoding</h1>
+		<p class="lede">UTF-8 validation and scrubbing with a pure-PHP fallback when <code>mbstring</code> is unavailable. Detects malformed bytes and replaces them per the Unicode maximal-subpart algorithm.</p>
+		<code class="install">composer require wp-php-toolkit/encoding</code>
+		<p>Every parser in this toolkit eventually has to decide what to do with text bytes. XML rejects malformed UTF-8. JSON and databases can fail late. CSS, HTML, WXR, and Blueprint validation all need consistent answers about whether a string is well-formed Unicode.</p><p>The Encoding component provides the small UTF-8 primitives the rest of the toolkit can share: validate bytes, scrub invalid sequences, scan code points, and detect Unicode noncharacters. When <code>mbstring</code> is available it can delegate to it; when it is not, the component uses its own byte scanner so behavior stays available in restricted PHP environments.</p><p>Historically, this became the common foundation for Blueprint validation and CSS/XML processing, replacing ad hoc Unicode helpers with the WordPress core UTF-8 routines used here.</p>
+		<p>Run Encoding before a strict parser sees unknown bytes. A Latin-1 title from an old export, an overlong UTF-8 sequence in an upload, or a Unicode noncharacter can break XML, JSON, or a database write later in the pipeline.</p><p>The component gives the same answer whether PHP has <code>mbstring</code> available or falls back to the pure-PHP scanner.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Reject invalid bytes</li>
+			<li>Repair when content matters</li>
+			<li>Check downstream limits</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="validating-utf-8-before-storing-it">Validating UTF-8 before storing it</h2>
+		<p><code>wp_is_valid_utf8()</code> rejects overlong sequences, surrogate halves, and stray ISO-8859-1 bytes. Use it as a guard in front of any code path that assumes UTF-8 (database, JSON, XML).</p>
+<php-snippet blueprint="toolkit-setup" name="validate.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Encoding\wp_is_valid_utf8;
+
+$samples = array(
+	'ASCII'          => 'just a test',
+	'UTF-8 pencil'   => "\xE2\x9C\x8F", // U+270F, well-formed three-byte sequence
+	'latin-1 byte'   => "B\xFCch",      // "ü" in ISO-8859-1; 0xFC never appears in UTF-8
+	'overlong slash' => "\xC0\xAF",     // "/" (U+002F) padded out to two bytes
+	'surrogate half' => "\xED\xB0\x80", // U+DC00 encoded directly
+);
+
+foreach ( $samples as $label => $bytes ) {
+	echo sprintf( "%-14s %s\n", $label . ':', wp_is_valid_utf8( $bytes ) ? 'valid' : 'invalid' );
+}
+</script>
+<script type="text/expected-output">
+ASCII:         valid
+UTF-8 pencil:  valid
+latin-1 byte:  invalid
+overlong slash: invalid
+surrogate half: invalid
+</script>
+</php-snippet>
+		<h2 id="scrubbing-invalid-bytes-with-ufffd">Scrubbing invalid bytes with U+FFFD</h2>
+		<p>Replace each ill-formed sequence with the Unicode replacement character. Useful right before serializing to XML, JSON, or sending to an LLM that will choke on broken bytes.</p>
+<php-snippet blueprint="toolkit-setup" name="scrub.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Encoding\wp_scrub_utf8;
+
+$inputs = array( "the byte \xC0 should not be here.", ".\xE2\x8C\xE2\x8C." );
+foreach ( $inputs as $bytes ) { // print each input after scrubbing
+	echo wp_scrub_utf8( $bytes ), "\n";
+}
+</script>
+<script type="text/expected-output">
+the byte � should not be here.
+.��.
+</script>
+</php-snippet>
+		<h2 id="detecting-noncharacters-mysqlutf8mb4-will-reject">Detecting noncharacters MySQL/utf8mb4 will reject</h2>
+		<p>Code points like U+FFFE, U+FFFF, and the U+FDD0–U+FDEF block are valid Unicode but forbidden in XML and rejected by some databases. Check before inserting user-submitted content into a strict <code>utf8mb4</code> column.</p>
+<php-snippet blueprint="toolkit-setup" name="noncharacters.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Encoding\wp_has_noncharacters;
+
+$candidates = array(
+	'normal text' => 'normal text',
+	'U+FFFE'      => "oops \u{FFFE}",
+	'U+FDD0'      => "hi \u{FDD0} bye",
+);
+// Print one aligned verdict per candidate.
+foreach ( $candidates as $name => $candidate ) {
+	printf( "%-12s %s\n", $name . ':', ! wp_has_noncharacters( $candidate ) ? 'ok' : 'reject' );
+}
+</script>
+<script type="text/expected-output">
+normal text: ok
+U+FFFE:      reject
+U+FDD0:      reject
+</script>
+</php-snippet>
+		<h2 id="three-way-pipeline-validate-scrub-then-check-noncharacters">Three-way pipeline: validate, scrub, then check noncharacters</h2>
+		<p>Real-world inputs are messy: an old WXR export, a CSV with mixed encodings, a paste from Word. Combining validation, scrubbing, and a noncharacter check covers the three classes of breakage that bite later.</p>
+<php-snippet blueprint="toolkit-setup" name="pipeline.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Encoding\wp_is_valid_utf8;
+use function WordPress\Encoding\wp_scrub_utf8;
+use function WordPress\Encoding\wp_has_noncharacters;
+
+$inputs = array(
+	'good'      => 'Café',
+	'latin1'    => "caf\xE9",
+	'overlong'  => "x\xC1\xBFy",
+	'noncharac' => "hi \u{FFFE} there",
+);
+
+foreach ( $inputs as $name => $raw ) {
+	$is_valid = wp_is_valid_utf8( $raw ) ? 'Y' : 'N';               // verdict on the raw bytes
+	$scrubbed = wp_scrub_utf8( $raw );
+	$has_nonc = wp_has_noncharacters( $scrubbed ) ? 'Y' : 'N';      // checked after scrubbing
+	printf( "%-10s valid=%s noncharacter=%s -> %s\n", $name, $is_valid, $has_nonc, $scrubbed );
+}
+</script>
+<script type="text/expected-output">
+good       valid=Y noncharacter=N -> Café
+latin1     valid=N noncharacter=N -> caf�
+overlong   valid=N noncharacter=N -> x��y
+noncharac  valid=Y noncharacter=Y -> hi ￾ there
+</script>
+</php-snippet>
+		<h2 id="salvaging-a-legacy-iso-8859-1-column-inside-a-utf-8-corpus">Salvaging a legacy ISO-8859-1 column inside a UTF-8 corpus</h2>
+		<p>Old WordPress databases sometimes mix encodings: most rows are UTF-8 but a few were stored as latin-1. Detect the bad rows with <code>wp_is_valid_utf8()</code> and only re-encode those.</p>
+<php-snippet blueprint="toolkit-setup" name="mixed-encoding.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Encoding\wp_is_valid_utf8;
+use function WordPress\Encoding\wp_scrub_utf8;
+
+$rows = array(
+	1 => 'Plain ASCII',
+	2 => 'Café',
+	3 => "caf\xE9",
+	4 => "weird \xC0 byte",
+);
+
+foreach ( $rows as $id => $value ) {
+	if ( wp_is_valid_utf8( $value ) ) {
+		echo "#$id ok: $value\n";
+		continue;
+	}
+	$converted = @iconv( 'ISO-8859-1', 'UTF-8', $value ); // reinterpret the stored bytes as latin-1
+	if ( false === $converted || ! wp_is_valid_utf8( $converted ) ) {
+		echo "#$id unrecoverable, scrubbing: " . wp_scrub_utf8( $value ) . "\n";
+		continue;
+	}
+	echo "#$id recovered as latin1: $converted\n";
+}
+</script>
+<script type="text/expected-output">
+#1 ok: Plain ASCII
+#2 ok: Café
+#3 recovered as latin1: café
+#4 recovered as latin1: weird À byte
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../html/">HTML</a><span>Normalize incoming text before HTML tokenization.</span></li>
+			<li><a href="../xml/">XML</a><span>Keep invalid bytes out of XML streams.</span></li>
+			<li><a href="../dataliberation/">DataLiberation</a><span>Clean content before importing it into WordPress.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/filesystem/index.html b/docs/_legacy/filesystem/index.html
new file mode 100644
index 000000000..f2fc64ea5
--- /dev/null
+++ b/docs/_legacy/filesystem/index.html
@@ -0,0 +1,268 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Filesystem — PHP Toolkit</title>
+<meta name="description" content="One Filesystem interface across local disk, in-memory trees, SQLite databases, and ZIP archives. Forward-slash paths everywhere — even on Windows — so the same code runs in tests, in production, and inside read-only ZIPs.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li class="current"><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>Filesystem</h1>
+		<p class="lede">One <code>Filesystem</code> interface across local disk, in-memory trees, SQLite databases, and ZIP archives. Forward-slash paths everywhere — even on Windows — so the same code runs in tests, in production, and inside read-only ZIPs.</p>
+		<code class="install">composer require wp-php-toolkit/filesystem</code>
+		<p>Code that touches the filesystem is hard to test, hard to port to Windows, and impossible to point at non-disk storage without rewriting it. Swap <code>LocalFilesystem</code> for <code>InMemoryFilesystem</code> in tests and your suite stops touching <code>/tmp</code>; swap it for <code>SQLiteFilesystem</code> and your "files" become rows in a portable database; swap it for <code>ZipFilesystem</code> and you can read inside an archive with the same calls.</p><p>Every backend uses forward slashes regardless of host OS. No <code>DIRECTORY_SEPARATOR</code> juggling, no Windows-only test failures, no surprises when a path moves between backends.</p>
+		<p>Write your tool against a filesystem object, not against the host machine. Tests can pass an in-memory tree, a CLI command can pass a local directory, and an importer can pass a ZIP-backed filesystem.</p><p>Every toolkit path uses forward slashes. A path such as <code>wp-content/uploads/2026/logo.png</code> means the same thing on macOS, Windows, Playground, and inside an archive.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Start in memory</li>
+			<li>Move to a real backend</li>
+			<li>Copy between backends</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="in-memory-tree">In-memory tree</h2>
+		<p>The fastest backend. No disk I/O, no cleanup, no test-isolation problems.</p>
+<php-snippet blueprint="toolkit-setup" name="teaser-memory.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+
+$memory_fs = InMemoryFilesystem::create(); // Fresh tree; the surrounding text notes there is no disk I/O or cleanup.
+$memory_fs->put_contents( '/hello.txt', 'Hello, world!' ); // Write one file at the root.
+echo $memory_fs->get_contents( '/hello.txt' ); // Read the same bytes back.
+</script>
+<script type="text/expected-output">
+Hello, world!
+</script>
+</php-snippet>
+		<h2 id="test-code-without-touching-disk">Test code without touching disk</h2>
+		<p>Pass production code a <code>Filesystem</code> instead of using <code>file_get_contents</code> directly, and your tests run against an in-memory tree with no setup or teardown.</p>
+<php-snippet blueprint="toolkit-setup" name="test-without-disk.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\Filesystem;
+use WordPress\Filesystem\InMemoryFilesystem;
+
+function bump_version( Filesystem $fs, $path ) { // Increments the patch part of the "version" field in the JSON file at $path.
+	$manifest = json_decode( $fs->get_contents( $path ), true ); // true => decode JSON objects as associative arrays.
+	list( $major, $minor, $patch ) = explode( '.', $manifest['version'] );
+	$manifest['version'] = sprintf( '%s.%s.%d', $major, $minor, (int) $patch + 1 );
+	$fs->put_contents( $path, json_encode( $manifest ) ); // Write the updated document back to the same path.
+}
+
+$memory = InMemoryFilesystem::create();
+$memory->put_contents( '/package.json', '{"version":"1.2.3"}' ); // Seed the fixture in the in-memory tree.
+bump_version( $memory, '/package.json' ); // The code under test only sees the Filesystem interface.
+
+echo $memory->get_contents( '/package.json' ), "\n";
+</script>
+<script type="text/expected-output">
+{"version":"1.2.4"}
+</script>
+</php-snippet>
+		<h2 id="local-disk-with-a-chrooted-root">Local disk with a chrooted root</h2>
+		<p><code>LocalFilesystem::create($root)</code> is implicitly chrooted: every path resolves relative to <code>$root</code> and a <code>../</code> cannot escape. Reach for it when a request path or CLI argument names a file inside one project directory.</p>
+<php-snippet blueprint="toolkit-setup" name="local-chroot.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\LocalFilesystem;
+
+$sandbox_dir = sys_get_temp_dir() . '/toolkit-' . uniqid(); // Fresh scratch path for this run.
+$disk        = LocalFilesystem::create( $sandbox_dir ); // Paths passed below are resolved against this root.
+
+$disk->mkdir( '/uploads', array( 'recursive' => true ) );
+$disk->put_contents( '/uploads/note.txt', 'Hi from local disk.' );
+
+echo $disk->get_contents( '/uploads/../uploads/note.txt' ), "\n"; // The "../" segment still lands on the same file.
+
+$disk->rmdir( '/', array( 'recursive' => true ) ); // Removing "/" takes the scratch directory with it (see expected output).
+echo "exists after cleanup? ", is_dir( $sandbox_dir ) ? 'yes' : 'no', "\n";
+</script>
+<script type="text/expected-output">
+Hi from local disk.
+exists after cleanup? no
+</script>
+</php-snippet>
+		<h2 id="sqlite-as-a-portable-file-store">SQLite as a portable file store</h2>
+		<p>The whole tree lives in one SQLite database file. Use it for self-contained scratch storage that survives process boundaries without leaving loose files behind.</p>
+<php-snippet blueprint="toolkit-setup" name="sqlite.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\SQLiteFilesystem;
+
+$store = SQLiteFilesystem::create( ':memory:' ); // ":memory:" is SQLite's in-memory database name (assuming create() passes it through).
+$store->mkdir( '/posts', array( 'recursive' => true ) );
+foreach ( range( 1, 3 ) as $n ) {
+	$store->put_contents( "/posts/post-{$n}.md", "# Post {$n}\n\nBody {$n}." );
+}
+
+foreach ( $store->ls( '/posts' ) as $entry ) {
+	$heading = strtok( $store->get_contents( "/posts/{$entry}" ), "\n" ); // Keep only the first line of each file.
+	echo "{$entry}: {$heading}\n";
+}
+</script>
+<script type="text/expected-output">
+post-1.md: # Post 1
+post-2.md: # Post 2
+post-3.md: # Post 3
+</script>
+</php-snippet>
+		<h2 id="copy-a-tree-across-backends">Copy a tree across backends</h2>
+		<p>The killer composability move: <code>copy_between_filesystems()</code> streams files chunk-by-chunk from any source to any target. Pull a ZIP into SQLite, snapshot SQLite to disk, mirror disk into RAM — all the same call.</p>
+<php-snippet blueprint="toolkit-setup" name="cross-backend-copy.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Filesystem\LocalFilesystem;
+use WordPress\Filesystem\SQLiteFilesystem;
+use function WordPress\Filesystem\copy_between_filesystems;
+
+$scratch_dir = sys_get_temp_dir() . '/copytree-' . uniqid();
+$disk        = LocalFilesystem::create( $scratch_dir );
+$disk->mkdir( '/site/posts', array( 'recursive' => true ) );
+$disk->put_contents( '/site/posts/2024-01.md', '# Hello 2024' );
+$disk->put_contents( '/site/index.html', '<h1>Home</h1>' );
+
+$database = SQLiteFilesystem::create( ':memory:' );
+copy_between_filesystems( array( // First hop: local disk => SQLite.
+	'source_filesystem' => $disk,
+	'source_path'       => '/site',
+	'target_filesystem' => $database,
+	'target_path'       => '/snapshot',
+) );
+
+$memory = InMemoryFilesystem::create();
+copy_between_filesystems( array( // Second hop: SQLite => memory, with the same option keys.
+	'source_filesystem' => $database,
+	'source_path'       => '/snapshot',
+	'target_filesystem' => $memory,
+	'target_path'       => '/copy',
+) );
+
+echo "in memory after two copies:\n";
+echo "  posts: ", implode( ', ', $memory->ls( '/copy/posts' ) ), "\n";
+echo "  index: ", $memory->get_contents( '/copy/index.html' ), "\n";
+
+$disk->rmdir( '/', array( 'recursive' => true ) ); // Clean up the scratch tree written at the top.
+</script>
+<script type="text/expected-output">
+in memory after two copies:
+  posts: 2024-01.md
+  index: <h1>Home</h1>
+</script>
+</php-snippet>
+		<h2 id="atomic-write-via-tempfile-rename">Atomic write via tempfile rename</h2>
+		<p>Write to a sibling tempfile, then rename — that's how you avoid leaving a half-written file on crash. <code>rename()</code> is atomic within a single filesystem.</p>
+<php-snippet blueprint="toolkit-setup" name="atomic-write.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\Filesystem;
+use WordPress\Filesystem\LocalFilesystem;
+
+function atomic_put_contents( Filesystem $fs, $path, $bytes ) { // Writes $bytes to a sibling temp name, then renames it onto $path.
+	$staging = sprintf( '%s.tmp.%s', $path, bin2hex( random_bytes( 4 ) ) ); // Sibling name ending in 8 random hex characters.
+	$fs->put_contents( $staging, $bytes ); // The full payload lands in the staging file first.
+	$fs->rename( $staging, $path ); // A single rename then moves it over the destination.
+}
+
+$scratch_dir = sys_get_temp_dir() . '/atomic-' . uniqid();
+$disk        = LocalFilesystem::create( $scratch_dir );
+
+$disk->put_contents( '/config.json', '{"v":1}' ); // Existing version of the file.
+atomic_put_contents( $disk, '/config.json', '{"v":2}' ); // Replace it through the staging-file helper.
+
+echo "config: ", $disk->get_contents( '/config.json' ), "\n";
+echo "no .tmp leftovers: ", count( $disk->ls( '/' ) ), " entries in root\n";
+
+$disk->rmdir( '/', array( 'recursive' => true ) );
+</script>
+<script type="text/expected-output">
+config: {"v":2}
+no .tmp leftovers: 1 entries in root
+</script>
+</php-snippet>
+		<h2 id="path-helpers-that-behave-the-same-on-windows">Path helpers that behave the same on Windows</h2>
+		<p>Unix path semantics apply on every host OS. This matters for abstract paths such as a SQLite key or a ZIP entry name because those paths do not live on a real drive.</p>
+<php-snippet blueprint="toolkit-setup" name="path-helpers.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Filesystem\wp_join_unix_paths;
+use function WordPress\Filesystem\wp_unix_dirname;
+use function WordPress\Filesystem\wp_unix_path_resolve_dots;
+
+echo wp_join_unix_paths( '/var/www', '/site/', '/index.php' ), "\n"; // Doubled slashes at the joins collapse to one.
+echo wp_unix_dirname( '/a/b/c/d.txt', 2 ), "\n"; // The second argument climbs two levels instead of one.
+echo wp_unix_path_resolve_dots( '/a/b/../c/./d/../e' ), "\n"; // "." and ".." segments are resolved away.
+</script>
+<script type="text/expected-output">
+/var/www/site/index.php
+/a/b
+a/c/e
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../bytestream/">ByteStream</a><span>Open files as readers and writers instead of loading full strings.</span></li>
+			<li><a href="../zip/">Zip</a><span>Mount archives and copy data between archive-backed and normal filesystems.</span></li>
+			<li><a href="../git/">Git</a><span>Expose repository trees through a filesystem-shaped API.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/git/index.html b/docs/_legacy/git/index.html
new file mode 100644
index 000000000..6b87b9a8d
--- /dev/null
+++ b/docs/_legacy/git/index.html
@@ -0,0 +1,284 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Git — PHP Toolkit</title>
+<meta name="description" content="A pure-PHP Git client and server. Commits, branches, diffs, HTTP push/pull — all without shelling out to git.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li class="current"><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>Git</h1>
+		<p class="lede">A pure-PHP Git client and server. Commits, branches, diffs, HTTP push/pull — all without shelling out to <code>git</code>.</p>
+		<code class="install">composer require wp-php-toolkit/git</code>
+		<p>Git is a useful storage model even when a server cannot run the <code>git</code> binary: snapshots, branches, object-addressed files, diffs, merges, and sync over HTTP. That matters for WordPress tools that want revision history for generated files, content snapshots, site state, or collaborative edits in constrained runtimes.</p><p>The Git component implements the core repository operations in PHP and stores objects through the toolkit <code>Filesystem</code> interface. That means the same repository can live on disk, in memory, or in another backend, and higher-level code can commit files without knowing where objects are stored.</p><p>The docs start with simple commits because that mental model scales: a repository is just objects plus refs. From there, branches, history walking, root commits, and merges become details you can reason about instead of magic shell behavior.</p><p>Choose it for tests, browser-like sandboxes, hosted WordPress environments, and applications that need Git behavior through PHP APIs instead of shell commands.</p>
+		<p>Git stores snapshots as objects: blobs hold file bytes, trees hold directory listings, commits point at trees, and refs name commits.</p><p>This component keeps those objects visible. A browser-based editor can commit generated files, move <code>refs/heads/main</code>, expose a commit tree as a filesystem, and merge another branch without running the <code>git</code> binary.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Create a snapshot</li>
+			<li>Read history by name</li>
+			<li>Coordinate edits</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="commit-files-into-an-in-memory-repo">Commit files into an in-memory repo</h2>
+		<p>The simplest possible repository: an <code>InMemoryFilesystem</code> as object storage and one <code>commit()</code> call. Reach for this in tests, in WP-CLI snapshots, or any place you want versioning without touching disk.</p>
+<php-snippet blueprint="toolkit-setup" name="commit-in-memory.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitRepository;
+
+$repository = new GitRepository( InMemoryFilesystem::create() ); // The in-memory filesystem is the repository's storage.
+
+// Each key is a path inside the repository; each value is that file's contents.
+$files = array(
+	'README.md'           => "# My Project\n",
+	'src/hello-world.php' => '<?php echo "Hello!";',
+);
+$commit_hash = $repository->commit( array( 'updates' => $files ) );
+
+echo "commit: {$commit_hash}\n";
+echo "HEAD:   ", $repository->get_branch_tip( 'HEAD' ), "\n";
+echo "README: ", $repository->read_object_by_path( '/README.md' )->consume_all();
+</script>
+<script type="text/expected-output">
+commit: <oid>
+HEAD:   <oid>
+README: # My Project
+</script>
+</php-snippet>
+		<h2 id="walk-the-commit-history">Walk the commit history</h2>
+		<p>Follow the parent chain from <code>HEAD</code> backwards. Building block for a WP-CLI "post revisions" log or a "what changed since release X" report.</p>
+<php-snippet blueprint="toolkit-setup" name="walk-history.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitRepository;
+use WordPress\Git\Model\Commit;
+
+$repository = new GitRepository( InMemoryFilesystem::create() );
+foreach ( array( 'add intro', 'fix typo', 'expand examples' ) as $draft_no => $message ) {
+	$updates = array( 'post.md' => "# Draft {$draft_no}" );
+	$repository->commit( array( 'updates' => $updates, 'commit' => array( 'message' => $message ) ) );
+}
+
+$cursor = $repository->get_branch_tip( 'HEAD' ); // Start from the commit HEAD points at.
+while ( ! Commit::is_null_hash( $cursor ) ) {
+	$commit = $repository->read_object( $cursor )->as_commit();
+	echo substr( $commit->hash, 0, 7 ), '  ', trim( $commit->message ), "\n";
+	$cursor = $commit->get_first_parent_hash();
+	if ( ! $cursor || ! $repository->has_object( $cursor ) ) {
+		break; // No parent recorded, or the parent object is not stored in this repository.
+	}
+}
+</script>
+<script type="text/expected-output">
+<hash>  expand examples
+<hash>  fix typo
+<hash>  add intro
+</script>
+</php-snippet>
+		<h2 id="treat-a-repository-like-a-filesystem">Treat a repository like a filesystem</h2>
+		<p><code>GitFilesystem</code> wraps a repository in this toolkit's <code>Filesystem</code> interface. With the default options, each <code>put_contents()</code> records a new commit.</p>
+<php-snippet blueprint="toolkit-setup" name="git-filesystem.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitFilesystem;
+use WordPress\Git\GitRepository;
+
+$repository = new GitRepository( InMemoryFilesystem::create() );
+$tracked    = GitFilesystem::create( $repository ); // Filesystem-shaped wrapper around the repository.
+
+$tracked->put_contents( '/posts/hello.md', "# Hello\nFirst draft." );
+$tracked->put_contents( '/posts/about.md', "# About\nWho we are." );
+$tracked->put_contents( '/posts/hello.md', "# Hello\nSecond draft." ); // Same path again: the later write is what gets read back.
+
+echo "tree:\n";
+foreach ( $tracked->ls( '/posts' ) as $entry ) {
+	echo "  /posts/{$entry}\n";
+}
+echo "\nhello.md now:\n", $tracked->get_contents( '/posts/hello.md' ), "\n";
+</script>
+<script type="text/expected-output">
+tree:
+  /posts/about.md
+  /posts/hello.md
+
+hello.md now:
+# Hello
+Second draft.
+</script>
+</php-snippet>
+		<h2 id="branch-edit-and-switch-back">Branch, edit, and switch back</h2>
+		<p>Create a feature branch off the current commit, change files, flip <code>HEAD</code> back. Useful for experimental edits in collaborative tools.</p>
+<php-snippet blueprint="toolkit-setup" name="branches.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitRepository;
+
+$repository = new GitRepository( InMemoryFilesystem::create() );
+$baseline   = $repository->commit( array(
+	'updates' => array( 'config.json' => '{"flag":false}' ),
+	'commit'  => array( 'message' => 'baseline' ),
+) );
+
+$repository->create_branch( 'refs/heads/experiment', $baseline ); // New branch starts at the baseline commit.
+$repository->checkout( 'refs/heads/experiment' );
+$repository->commit( array(
+	'updates' => array( 'config.json' => '{"flag":true}' ),
+	'commit'  => array( 'message' => 'flip the flag' ),
+) );
+
+echo "on experiment: ", $repository->read_object_by_path( '/config.json' )->consume_all(), "\n";
+
+$repository->checkout( 'refs/heads/trunk' ); // Presumably the default branch that received the baseline commit.
+echo "on trunk:      ", $repository->read_object_by_path( '/config.json' )->consume_all(), "\n";
+</script>
+<script type="text/expected-output">
+on experiment: {"flag":true}
+on trunk:      {"flag":false}
+</script>
+</php-snippet>
+		<h2 id="three-way-merge-two-branches">Three-way merge two branches</h2>
+		<p>The classic Git workflow: branch off, edit on each side, merge. <code>$repo-&gt;merge()</code> finds the common ancestor, three-way-merges every file, and creates a merge commit.</p>
+<php-snippet blueprint="toolkit-setup" name="merge-branches.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitRepository;
+
+$repository = new GitRepository( InMemoryFilesystem::create() );
+$fork_point = $repository->commit( array( 'updates' => array( // Common ancestor of both sides.
+	'todo.txt' => "buy milk\nwalk dog\nread book\n",
+) ) );
+
+$repository->commit( array( 'updates' => array( // Change the first line on the current branch.
+	'todo.txt' => "buy oat milk\nwalk dog\nread book\n",
+) ) );
+
+$repository->create_branch( 'refs/heads/feature', $fork_point );
+$repository->checkout( 'refs/heads/feature' );
+$repository->commit( array( 'updates' => array( // Append a line on the feature branch.
+	'todo.txt' => "buy milk\nwalk dog\nread book\nwrite blog post\n",
+) ) );
+
+$repository->checkout( 'refs/heads/trunk' );
+$outcome = $repository->merge( 'refs/heads/feature' );
+
+echo "merge head: {$outcome['new_head']}\n";
+echo "conflicts:  ", $outcome['conflicts'] ? implode( ',', $outcome['conflicts'] ) : 'none', "\n";
+echo "result:\n", $repository->read_object_by_path( '/todo.txt' )->consume_all();
+</script>
+<script type="text/expected-output">
+merge head: <oid>
+conflicts:  none
+result:
+buy oat milk
+walk dog
+read book
+write blog post
+</script>
+</php-snippet>
+		<h2 id="snapshot-wordpress-options-into-a-repo">Snapshot WordPress options into a repo</h2>
+		<p>Serialize a chunk of WP state (options, post meta, a theme config) on every save and commit it. You get free history, diffs between snapshots, and a "rollback to last week" button.</p>
+<php-snippet blueprint="toolkit-setup" name="options-snapshot.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitRepository;
+
+$repository = new GitRepository( InMemoryFilesystem::create() );
+
+$option_history = array( // Three successive states of the same option set.
+	array( 'blogname' => 'My Site',  'posts_per_page' => 10, 'timezone_string' => 'UTC' ),
+	array( 'blogname' => 'My Site',  'posts_per_page' => 20, 'timezone_string' => 'UTC' ),
+	array( 'blogname' => 'New Name', 'posts_per_page' => 20, 'timezone_string' => 'Europe/Warsaw' ),
+);
+
+foreach ( $option_history as $index => $option_values ) {
+	$repository->commit( array(
+		'updates' => array( 'options.json' => json_encode( $option_values, JSON_PRETTY_PRINT ) ),
+		'commit'  => array( 'message' => "snapshot #{$index}" ),
+	) );
+}
+
+$tip      = $repository->get_branch_tip( 'HEAD' );
+$previous = $repository->read_object( $tip )->as_commit()->get_first_parent_hash();
+$changes  = $repository->diff_commits( $tip, $previous ); // Compare the newest snapshot with the one before it.
+
+echo "Files changed in last snapshot:\n";
+foreach ( $changes as $changed_path => $unused_entry ) {
+	echo "  {$changed_path}\n";
+}
+</script>
+<script type="text/expected-output">
+Files changed in last snapshot:
+  options.json
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../filesystem/">Filesystem</a><span>Work with repository trees through a storage abstraction.</span></li>
+			<li><a href="../merge/">Merge</a><span>Resolve divergent histories with explicit three-way merge logic.</span></li>
+			<li><a href="../bytestream/">ByteStream</a><span>Read and write object data without accidental buffering.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/html/index.html b/docs/_legacy/html/index.html
new file mode 100644
index 000000000..70c3bc34b
--- /dev/null
+++ b/docs/_legacy/html/index.html
@@ -0,0 +1,354 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>HTML — PHP Toolkit</title>
+<meta name="description" content="A pure-PHP HTML5 parser and tag rewriter mirroring WordPress core&#x27;s HTML API. Treat HTML the way browsers do — without libxml2, DOMDocument, or regex hacks — and rewrite attributes in a single linear pass.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li class="current"><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>HTML</h1>
+		<p class="lede">A pure-PHP HTML5 parser and tag rewriter mirroring WordPress core's HTML API. Treat HTML the way browsers do — without <code>libxml2</code>, <code>DOMDocument</code>, or regex hacks — and rewrite attributes in a single linear pass.</p>
+		<code class="install">composer require wp-php-toolkit/html</code>
+		<p>WordPress filters HTML fragments from post content, block markup, comments, excerpts, widgets, feeds, and imported documents. Those fragments can omit <code>&lt;html&gt;</code> and <code>&lt;body&gt;</code>, close tags implicitly, or mix browser-correct markup with author mistakes that <code>DOMDocument</code> and regular expressions do not model well.</p><p>The HTML component gives WordPress-style code the same parsing model WordPress core uses: a browser-compatible tokenizer and tree-aware processor that run in pure PHP. Choose it for exact-byte rewrites, imperfect fragments, and post-content filters where a full DOM would do too much work.</p><p>The component gives you two processors. <code>WP_HTML_Tag_Processor</code> is a forward-only cursor over tags and tokens — useful for attribute rewriting at scale. <code>WP_HTML_Processor</code> layers HTML5 tree construction on top so you can query by ancestry (breadcrumbs), serialize the parsed document, and trust that <code>&lt;p&gt;one&lt;p&gt;two</code> parses as two paragraphs the way a browser sees it.</p><p><strong>Footgun:</strong> mutations are buffered. Nothing changes in the source string until you call <code>get_updated_html()</code>. If you read <code>get_attribute()</code> after a <code>set_attribute()</code> on the same tag, you see the new value — but downstream tooling reading the original string sees stale HTML until you serialize.</p>
+		<p>Start with the tag processor when you need to change markup that WordPress already stored: add <code>loading="lazy"</code> to post images, make feed links absolute, or remove inline event handlers from pasted HTML. It scans forward and preserves every byte it does not touch.</p><p>Switch to the full processor when the browser tree matters. Use it to find images inside figures, walk heading depth, or return to a saved parent after inspecting child tags.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Rewrite one tag safely</li>
+			<li>Protect real content</li>
+			<li>Use structure when you need it</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="add-loadinglazy-to-every-image">Add loading=&quot;lazy&quot; to every image</h2>
+		<p>The "hello world" of tag rewriting. One linear pass, no DOM, no reserialization cost beyond the bytes you actually changed.</p><p><strong>Try this:</strong> click <em>Run</em>, then change <code>'lazy'</code> to <code>'eager'</code> on the first image only by guarding it with <code>$tags-&gt;get_attribute( 'src' ) === 'hero.jpg'</code>. Run again and notice that <code>get_updated_html()</code> only rewrites the bytes for that one tag.</p>
+<php-snippet blueprint="toolkit-setup" name="lazy-load-images.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+// Sample post content: two images, neither carrying a loading hint yet.
+$markup = '<article>
+	<img src="hero.jpg" alt="Hero">
+	<p>Intro copy.</p>
+	<img src="inline.jpg" alt="Inline">
+</article>';
+
+// Visit each IMG tag once, in document order.
+$tags = new WP_HTML_Tag_Processor( $markup );
+while ( $tags->next_tag( 'img' ) ) {
+	// A loading attribute the author already wrote (for example an explicit
+	// eager hint) is left untouched.
+	$has_loading_hint = null !== $tags->get_attribute( 'loading' );
+	if ( ! $has_loading_hint ) {
+		$tags->set_attribute( 'loading', 'lazy' );
+	}
+	$tags->set_attribute( 'decoding', 'async' );
+}
+
+// Serialize the document with the queued attribute changes applied.
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<article>
+	<img decoding="async" loading="lazy" src="hero.jpg" alt="Hero">
+	<p>Intro copy.</p>
+	<img decoding="async" loading="lazy" src="inline.jpg" alt="Inline">
+</article>
+</script>
+</php-snippet>
+		<h2 id="rewrite-relative-links-to-absolute-urls">Rewrite relative links to absolute URLs</h2>
+		<p>Use this before sending post content to an RSS feed, an email template, or a CDN-backed copy of a site. The processor rewrites only the changed bytes, so untouched markup stays byte-identical.</p>
+<php-snippet blueprint="toolkit-setup" name="absolute-links.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$html = '<p>See <a href="/about">about</a>, <a href="https://example.com/x">x</a>, '
+	. 'and <a href="contact.html">contact</a>.</p>';
+
+$base = 'https://my-site.test/';
+
+// Normalize the base once so every rewritten link joins with exactly one slash.
+$prefix = rtrim( $base, '/' ) . '/';
+
+$links = new WP_HTML_Tag_Processor( $html );
+while ( $links->next_tag( 'a' ) ) {
+	$href = $links->get_attribute( 'href' );
+
+	// Nothing to rewrite when the attribute is missing or empty.
+	if ( null === $href || '' === $href ) {
+		continue;
+	}
+
+	// Leave alone anything that already names a scheme, is protocol-relative,
+	// or only points at a fragment.
+	$has_scheme           = (bool) preg_match( '#^[a-z][a-z0-9+.-]*:#i', $href );
+	$is_protocol_relative = 0 === strpos( $href, '//' );
+	$is_fragment          = 0 === strpos( $href, '#' );
+	if ( $has_scheme || $is_protocol_relative || $is_fragment ) {
+		continue;
+	}
+
+	$links->set_attribute( 'href', $prefix . ltrim( $href, '/' ) );
+}
+
+echo $links->get_updated_html();
+</script>
+<script type="text/expected-output">
+<p>See <a href="https://my-site.test/about">about</a>, <a href="https://example.com/x">x</a>, and <a href="https://my-site.test/contact.html">contact</a>.</p>
+</script>
+</php-snippet>
+		<h2 id="strip-every-script-and-inline-event-handler">Strip every script and inline event handler</h2>
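+		<p>One common step when cleaning up untrusted HTML before display: blank a script's body with <code>set_modifiable_text()</code> and strip every <code>on*</code> attribute via <code>get_attribute_names_with_prefix()</code>. This example removes script bodies and inline event handlers only; it is not a complete sanitizer — <code>javascript:</code> URLs, for example, pass through untouched.</p>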
+<php-snippet blueprint="toolkit-setup" name="sanitize-html.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$untrusted = '<p>Hi <b onclick="steal()">friend</b>!</p>'
+	. '<script>alert("xss")<\/script>'
+	. '<img src=x onerror="boom()">';
+
+$tags = new WP_HTML_Tag_Processor( $untrusted );
+while ( $tags->next_tag() ) {
+	// Empty the body of each opening SCRIPT tag; the tag itself stays in place.
+	$is_script_opener = 'SCRIPT' === $tags->get_tag() && ! $tags->is_tag_closer();
+	if ( $is_script_opener ) {
+		$tags->set_modifiable_text( '' );
+	}
+
+	// Collect every attribute whose name starts with "on" (onclick, onerror, ...).
+	$handler_names = $tags->get_attribute_names_with_prefix( 'on' );
+	if ( empty( $handler_names ) ) {
+		continue;
+	}
+	foreach ( $handler_names as $handler_name ) {
+		$tags->remove_attribute( $handler_name );
+	}
+}
+
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<p>Hi <b >friend</b>!</p><script><\/script><img src=x >
+</script>
+</php-snippet>
+		<h2 id="stamp-a-csp-nonce-on-inline-scripts-and-styles">Stamp a CSP nonce on inline scripts and styles</h2>
+		<p>Content Security Policy in <code>nonce-</code> mode requires every inline <code>&lt;script&gt;</code> and <code>&lt;style&gt;</code> to carry a matching nonce attribute. Tag-by-tag is exactly the right granularity.</p>
+<php-snippet blueprint="toolkit-setup" name="csp-nonce.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+// A fresh random value per run: 8 random bytes, hex-encoded.
+$nonce = bin2hex( random_bytes( 8 ) );
+
+$html = '<head><style>body{font:16px sans-serif}</style></head>'
+	. '<body><script>console.log("hi")<\/script><script src="vendor.js"><\/script></body>';
+
+// Tag names that receive the nonce attribute.
+$nonce_tags = array( 'SCRIPT', 'STYLE' );
+
+$tags = new WP_HTML_Tag_Processor( $html );
+while ( $tags->next_tag() ) {
+	// Only opening tags carry attributes.
+	if ( $tags->is_tag_closer() ) {
+		continue;
+	}
+	if ( in_array( $tags->get_tag(), $nonce_tags, true ) ) {
+		$tags->set_attribute( 'nonce', $nonce );
+	}
+}
+
+// Print the nonce first so it can be compared with the stamped markup below.
+echo 'nonce: ' . $nonce . "\n\n";
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+nonce: <random>
+
+<head><style nonce="<random>">body{font:16px sans-serif}</style></head><body><script nonce="<random>">console.log("hi")<\/script><script nonce="<random>" src="vendor.js"><\/script></body>
+</script>
+</php-snippet>
+		<h2 id="build-a-srcset-from-a-single-src">Build a srcset from a single src</h2>
+		<p>Generate responsive image markup at render time without touching the editor data model. Read the existing <code>src</code>, derive a <code>srcset</code> with width descriptors, add a <code>sizes</code> hint.</p>
+<php-snippet blueprint="toolkit-setup" name="srcset-rewrite.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$html = '<figure><img src="https://cdn.test/uploads/photo.jpg" alt="Sunset"></figure>';
+$widths = array( 480, 768, 1200 );
+
+$tags = new WP_HTML_Tag_Processor( $html );
+while ( $tags->next_tag( 'img' ) ) {
+	$src = $tags->get_attribute( 'src' );
+	// get_attribute() yields null for a missing attribute and true for one
+	// written without a value; only a non-empty string can seed a srcset.
+	if ( ! is_string( $src ) || '' === $src ) {
+		continue;
+	}
+	// Respect a srcset the author already provided.
+	if ( null !== $tags->get_attribute( 'srcset' ) ) {
+		continue;
+	}
+
+	// Extend an existing query string rather than starting a second one.
+	$separator = false === strpos( $src, '?' ) ? '?' : '&';
+
+	// One candidate per width, each followed by its width descriptor.
+	$variants = array();
+	foreach ( $widths as $w ) {
+		$variants[] = $src . $separator . 'w=' . $w . ' ' . $w . 'w';
+	}
+	$tags->set_attribute( 'srcset', implode( ', ', $variants ) );
+	$tags->set_attribute( 'sizes', '(max-width: 768px) 100vw, 768px' );
+}
+
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<figure><img sizes="(max-width: 768px) 100vw, 768px" srcset="https://cdn.test/uploads/photo.jpg?w=480 480w, https://cdn.test/uploads/photo.jpg?w=768 768w, https://cdn.test/uploads/photo.jpg?w=1200 1200w" src="https://cdn.test/uploads/photo.jpg" alt="Sunset"></figure>
+</script>
+</php-snippet>
+		<h2 id="decode-html-entities-the-way-the-spec-demands">Decode HTML entities the way the spec demands</h2>
+		<p>The HTML5 entity table has roughly 2,200 named references and a long list of edge cases. <code>WP_HTML_Decoder</code> implements the algorithm — don't roll your own.</p>
+<php-snippet blueprint="toolkit-setup" name="decode-entities.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+// Decode character references in an attribute value and in a text node.
+printf( "attribute: %s\n", WP_HTML_Decoder::decode_attribute( 'path?a=1&amp;b=2&amp;copy' ) );
+printf( "text:      %s\n", WP_HTML_Decoder::decode_text_node( 'AT&amp;T &mdash; 100&percnt; &#x1F600;' ) );
+
+// Prefix check on an attribute value that still contains character references.
+// Here &#x09; sits between "java" and "script:", and the check reports false.
+$starts_with_javascript = WP_HTML_Decoder::attribute_starts_with(
+	'java&#x09;script:alert(1)',
+	'javascript:',
+	'ascii-case-insensitive'
+);
+var_dump( $starts_with_javascript );
+</script>
+<script type="text/expected-output">
+attribute: path?a=1&b=2&copy
+text:      AT&T — 100% 😀
+bool(false)
+</script>
+</php-snippet>
+		<h2 id="find-images-by-ancestry-with-breadcrumbs">Find images by ancestry with breadcrumbs</h2>
+		<p>The full <code>WP_HTML_Processor</code> understands HTML5 tree construction, so you can ask "find every <code>&lt;img&gt;</code> directly inside a <code>&lt;figure&gt;</code>" without writing your own DOM walker.</p>
+<php-snippet blueprint="toolkit-setup" name="breadcrumbs.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+// Two images sit directly inside a FIGURE; one sits inside a paragraph.
+$html = implode(
+	'',
+	array(
+		'<article>',
+		'<figure><img src="hero.jpg" alt="Hero"><figcaption>Hero shot</figcaption></figure>',
+		'<p>Body copy <img src="emoji.png" alt=""> mid-paragraph.</p>',
+		'<figure><img src="diagram.png" alt="Diagram"></figure>',
+		'</article>',
+	)
+);
+
+$processor = WP_HTML_Processor::create_fragment( $html );
+
+// Match IMG tags whose parent is a FIGURE.
+$query   = array( 'breadcrumbs' => array( 'FIGURE', 'IMG' ) );
+$matches = 0;
+while ( $processor->next_tag( $query ) ) {
+	$processor->add_class( 'figure-image' );
+	$matches += 1;
+}
+
+printf( "found %d figure images\n", $matches );
+echo $processor->get_updated_html();
+</script>
+<script type="text/expected-output">
+found 2 figure images
+<article><figure><img class="figure-image" src="hero.jpg" alt="Hero"><figcaption>Hero shot</figcaption></figure><p>Body copy <img src="emoji.png" alt=""> mid-paragraph.</p><figure><img class="figure-image" src="diagram.png" alt="Diagram"></figure></article>
+</script>
+</php-snippet>
+		<h2 id="outline-a-document-by-walking-tokens-with-depth">Outline a document by walking tokens with depth</h2>
+		<p>The full processor exposes <code>get_current_depth()</code> and <code>get_breadcrumbs()</code>. Combine with <code>next_token()</code> to print a structural outline.</p>
+<php-snippet blueprint="toolkit-setup" name="outline.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$html = '<section><h1>Title</h1>'
+	. '<section><h2>Chapter 1</h2><p>Body</p></section>'
+	. '<section><h2>Chapter 2</h2><p>More body</p></section>'
+	. '</section>';
+
+$p = WP_HTML_Processor::create_fragment( $html );
+while ( $p->next_token() ) {
+	// Only opening tags can start a heading.
+	$is_opener = '#tag' === $p->get_token_type() && ! $p->is_tag_closer();
+	if ( ! $is_opener ) {
+		continue;
+	}
+
+	// Keep H1 through H6; skip every other element.
+	$heading = $p->get_tag();
+	if ( 1 !== preg_match( '/^H[1-6]$/', $heading ) ) {
+		continue;
+	}
+
+	// Indent by nesting depth, two spaces per level beyond the second.
+	$levels = max( 0, $p->get_current_depth() - 2 );
+	$indent = str_repeat( '  ', $levels );
+
+	// Gather the heading's text until its matching closing tag arrives.
+	$label = '';
+	while ( $p->next_token() ) {
+		$type = $p->get_token_type();
+		if ( '#text' === $type ) {
+			$label .= $p->get_modifiable_text();
+		} elseif ( '#tag' === $type && $heading === $p->get_tag() && $p->is_tag_closer() ) {
+			break;
+		}
+	}
+
+	echo $indent . $heading . '  ' . $label . "\n";
+}
+</script>
+<script type="text/expected-output">
+    H1  Title
+      H2  Chapter 1
+      H2  Chapter 2
+</script>
+</php-snippet>
+		<h2 id="bookmarks-annotate-a-parent-based-on-its-children">Bookmarks: annotate a parent based on its children</h2>
+		<p>Bookmarks are the one escape from forward-only scanning. Save a position, scan ahead, decide what to do, then <code>seek()</code> back and rewrite the earlier tag.</p>
+<php-snippet blueprint="toolkit-setup" name="bookmarks.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$html = '<ul>'
+	. '<li><input type="checkbox" checked> Buy milk</li>'
+	. '<li><input type="checkbox"> Walk the dog</li>'
+	. '<li><input type="checkbox" checked> Read book</li>'
+	. '</ul>';
+
+$tags = new WP_HTML_Tag_Processor( $html );
+
+// Remember where the list opens so it can be revisited after the scan.
+$tags->next_tag( 'ul' );
+$tags->set_bookmark( 'list' );
+
+// Tally the checkboxes that follow, and how many of them are checked.
+$checked = 0;
+$seen    = 0;
+while ( $tags->next_tag( 'input' ) ) {
+	++$seen;
+	$checked += ( null === $tags->get_attribute( 'checked' ) ) ? 0 : 1;
+}
+
+// Jump back to the bookmarked UL and record the tally on it.
+$tags->seek( 'list' );
+$tags->set_attribute( 'data-progress', sprintf( '%d/%d', $checked, $seen ) );
+$tags->release_bookmark( 'list' );
+
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<ul data-progress="2/3"><li><input type="checkbox" checked> Buy milk</li><li><input type="checkbox"> Walk the dog</li><li><input type="checkbox" checked> Read book</li></ul>
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../blockparser/">BlockParser</a><span>Parse block comments first, then rewrite the HTML inside each block.</span></li>
+			<li><a href="../markdown/">Markdown</a><span>Convert Markdown to blocks before polishing generated HTML.</span></li>
+			<li><a href="../dataliberation/">DataLiberation</a><span>Rewrite URLs and media references during import/export pipelines.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/httpclient/index.html b/docs/_legacy/httpclient/index.html
new file mode 100644
index 000000000..b7bdebcbe
--- /dev/null
+++ b/docs/_legacy/httpclient/index.html
@@ -0,0 +1,576 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>HttpClient — PHP Toolkit</title>
+<meta name="description" content="Async HTTP client without curl required. Uses sockets when curl is missing, supports concurrent requests and streaming responses.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li class="current"><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>HttpClient</h1>
+		<p class="lede">Async HTTP client without <code>curl</code> required. Uses sockets when curl is missing, supports concurrent requests and streaming responses.</p>
+		<code class="install">composer require wp-php-toolkit/http-client</code>
+		<p>A plugin installer starts with one request to download <code>plugin.zip</code>. A migration then adds progress reporting, a ten-request media window, resumable downloads, and a remote ZIP reader that feeds ZipFilesystem directly. Those workflows need the same request API from the first GET to the final streamed archive.</p><p>The HttpClient component gives the toolkit a small request/response model, middleware for redirects and caching, concurrent fetches, and response bodies exposed as byte streams. It runs through curl when PHP provides curl and through pure PHP sockets when it does not. Callers keep the same code path.</p><p>Use it to fetch plugin metadata, submit import callbacks, mirror a media library, read a WXR export, or pipe a remote archive into Zip and Filesystem code.</p>
+		<p>Make the first request boring: <code>GET https://api.wordpress.org/plugins/info/1.2/</code>, then read the response status and body. From there, add the details the workflow actually needs: a POST body, JSON headers, redirects, cache policy, or a chosen transport.</p><p>When the response becomes a file, keep it as a stream. A plugin installer can show progress while downloading a ZIP, resume a partial archive with <code>Range</code>, and hand the remote body to ZipFilesystem without first building a giant string.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Start with GET and POST</li>
+			<li>Configure the request path</li>
+			<li>Scale the transfer</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="get-a-url">GET a URL</h2>
+		<p class="callout"><strong>Network access in the demo runtime.</strong> Live request examples show the real API, but outbound HTTP in browser sandboxes may require a CORS proxy.</p><p>The smallest flow has three steps: create a request, wait until headers arrive, then consume the body stream. This is intentionally close to the Fetch API shape, but the body is a toolkit byte stream instead of a buffered string.</p>
+<php-snippet blueprint="toolkit-setup" name="get.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+// Step 1: create the request and hand it to a client.
+$client = new Client();
+$stream = $client->fetch( new Request( 'https://example.com/' ) );
+
+// Step 2: wait until the response headers have arrived.
+$response = $stream->await_response();
+echo "status: {$response->status_code}\n";
+
+// Step 3: consume the body stream and show its beginning.
+$body = $stream->consume_all();
+echo 'first 80 bytes: ' . substr( $body, 0, 80 ) . "\n";
+</script>
+</php-snippet>
+		<h2 id="post-to-a-url">POST to a URL</h2>
+		<p>Uploads use the same shape. The only difference is that the request declares a method, request headers, and an upload body stream. Here the body is form-encoded text wrapped in <code>MemoryPipe</code>; a file upload could provide a file-backed read stream instead.</p>
+<php-snippet blueprint="toolkit-setup" name="post.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+use WordPress\ByteStream\MemoryPipe;
+
+// Form-encode the fields, using a plain "&" as the separator.
+$payload = http_build_query(
+	array(
+		'title' => 'Hello',
+		'tags'  => 'http,php',
+	),
+	'',
+	'&'
+);
+
+// Wrap the payload in an upload stream and mark it complete: the whole body
+// is already in the pipe, so no more bytes will be written.
+$body = new MemoryPipe( $payload );
+$body->close_writing();
+
+$client  = new Client();
+$request = new Request( 'https://httpbin.org/post', array(
+	'method'      => 'POST',
+	'headers'     => array(
+		'content-type'   => 'application/x-www-form-urlencoded',
+		'content-length' => (string) strlen( $payload ),
+	),
+	'body_stream' => $body,
+) );
+
+// Read the response as JSON and show the form field the server received.
+$response = $client->fetch( $request )->json();
+echo "Server saw form title: " . $response['form']['title'] . "\n";
+</script>
+</php-snippet>
+		<h2 id="build-a-json-request-object">Build a JSON request object</h2>
+		<p>A <code>Request</code> is just data until a client enqueues it. That makes it easy to test request construction without network access. The constructor normalizes headers, calculates <code>content-length</code> when the body stream has a known length, and moves URL credentials into an Authorization header.</p>
+<php-snippet blueprint="toolkit-setup" name="request-object.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\HttpClient\Request;
+
+// Encode the JSON document that becomes the request body.
+$json = json_encode( array(
+	'title' => 'Hello',
+	'tags'  => array( 'docs', 'php' ),
+) );
+
+// Put it in a pipe and close the writing side: the body is complete.
+$body = new MemoryPipe( $json );
+$body->close_writing();
+
+// The URL carries credentials; no content-length header is supplied here.
+$options = array(
+	'method'      => 'POST',
+	'headers'     => array( 'content-type' => 'application/json' ),
+	'body_stream' => $body,
+);
+$request = new Request( 'https://user:secret@api.example.test/posts', $options );
+
+// Inspect what the constructor produced. Only the first ten characters of
+// the authorization header are printed.
+echo "{$request->method} {$request->url}\n";
+printf( "content-type: %s\n", $request->get_header( 'content-type' ) );
+printf( "content-length: %s\n", $request->get_header( 'content-length' ) );
+printf( "authorization: %s...\n", substr( $request->get_header( 'authorization' ), 0, 10 ) );
+</script>
+<script type="text/expected-output">
+POST https://api.example.test/posts
+content-type: application/json
+content-length: 39
+authorization: Basic dXNl...
+</script>
+</php-snippet>
+		<h2 id="parse-response-headers">Parse response headers</h2>
+		<p>Most applications receive <code>Response</code> objects from <code>await_response()</code>. Transports, middleware, and tests sometimes need the lower-level parser: <code>Response::from_http_headers()</code> turns raw HTTP header bytes into normalized status and case-insensitive headers.</p>
+<php-snippet blueprint="toolkit-setup" name="parse-response.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Request;
+use WordPress\HttpClient\Response;
+
+$request = new Request( 'https://api.example.test/posts/42' );
+
+// Raw header block: status line, three headers, then the blank line that
+// ends the headers. Every line ends with CRLF.
+$raw = implode(
+	"\r\n",
+	array(
+		'HTTP/1.1 201 Created',
+		'Content-Type: application/json',
+		'Location: /posts/42',
+		'Content-Length: 27',
+		'',
+		'',
+	)
+);
+
+$response = Response::from_http_headers( $raw, $request );
+
+// The header is looked up in upper case although it was sent in mixed case.
+printf( "status: %s %s\n", $response->status_code, $response->get_reason_phrase() );
+printf( "ok:     %s\n", $response->ok() ? 'yes' : 'no' );
+printf( "type:   %s\n", $response->get_header( 'CONTENT-TYPE' ) );
+printf( "size:   %s bytes\n", $response->total_bytes );
+</script>
+<script type="text/expected-output">
+status: 201 Created
+ok:     yes
+type:   application/json
+size:   27 bytes
+</script>
+</php-snippet>
+		<h2 id="pick-the-right-reading-style">Pick the right reading style</h2>
+		<p>There are three common ways to consume a response. Start simple, then move down the table only when the workflow demands it.</p><table><thead><tr><th>Style</th><th>Use when</th><th>Tradeoff</th></tr></thead><tbody><tr><td><code>consume_all()</code> or <code>json()</code></td><td>Small HTML, JSON, or API responses.</td><td>Buffers the full body.</td></tr><tr><td><code>Client::await_next_event()</code></td><td>Progress bars, streaming to disk, queues, failure handling.</td><td>You own the event loop.</td></tr><tr><td>Filesystem and parser composition</td><td>Remote ZIPs, WXR files, import pipelines.</td><td>Requires a stream-aware consumer.</td></tr></tbody></table>
+		<h2 id="choose-a-transport">Choose a transport</h2>
+		<p>The transport is the I/O backend. It should not change your request, response, redirect, cache, or stream code; it only changes how bytes move across the network.</p><table><thead><tr><th>Transport</th><th>What it does</th><th>When to choose it</th></tr></thead><tbody><tr><td><code>auto</code></td><td>Uses curl when loaded, otherwise sockets.</td><td>Application default. Best when you want portability and the fastest available backend.</td></tr><tr><td><code>sockets</code></td><td>Uses PHP stream sockets, no curl extension.</td><td>Tests, Playground-style runtimes, hosts where curl is unavailable, or proving the dependency-free path works.</td></tr><tr><td><code>curl</code></td><td>Uses the curl extension.</td><td>Hosts where curl is available and you want to compare behavior or performance explicitly.</td></tr></tbody></table><p><code>concurrency</code>, <code>timeout_ms</code>, <code>cache_dir</code>, redirects, and response streaming sit above the transport, so the examples later on work with either backend.</p>
+<php-snippet blueprint="toolkit-setup" name="transports.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+
+// No options: equivalent to passing array( 'transport' => 'auto' ).
+$default = new Client();
+
+// Explicitly select the sockets transport.
+$portable = new Client( array( 'transport' => 'sockets' ) );
+
+// Select the curl transport only when the curl extension is loaded.
+if ( extension_loaded( 'curl' ) ) {
+	$curl = new Client( array( 'transport' => 'curl' ) );
+}
+</script>
+</php-snippet>
+		<h2 id="follow-redirects-and-inspect-the-final-request">Follow redirects and inspect the final request</h2>
+		<p>Redirects are middleware, not transport behavior. The client follows up to five redirects by default. The original <code>Request</code> keeps a chain to the final request, so importers can log where a source URL actually landed.</p>
+<php-snippet blueprint="toolkit-setup" name="redirects.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+// Keep a handle on the original request so it can be inspected afterwards.
+$request = new Request( 'https://httpbin.org/redirect-to?url=https://example.com/' );
+$client  = new Client();
+
+// Fetch, wait for the headers, and read the body through to the end.
+$stream   = $client->fetch( $request );
+$response = $stream->await_response();
+$stream->consume_all();
+
+// Compare the URL that was asked for with the latest redirect's URL.
+$final = $request->latest_redirect();
+echo "original: {$request->url}\n";
+echo "final:    {$final->url}\n";
+echo "status:   {$response->status_code}\n";
+</script>
+</php-snippet>
+		<h2 id="cache-repeatable-get-responses">Cache repeatable GET responses</h2>
+		<p>Pass <code>cache_dir</code> to add disk caching for cacheable GET and HEAD responses. Fresh cached responses replay the same header/body events as a network response, so crawlers and importers do not need a separate cache code path. Non-GET requests invalidate matching cache entries instead of being cached.</p>
+<php-snippet blueprint="toolkit-setup" name="cache.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+// A fresh, uniquely named cache directory under the system temp directory.
+$cache_dir = sys_get_temp_dir() . '/http-cache-' . uniqid();
+mkdir( $cache_dir );
+
+$url    = 'https://httpbin.org/cache/60';
+$client = new Client( array( 'cache_dir' => $cache_dir ) );
+
+// Request the same URL twice through the same client.
+foreach ( range( 1, 2 ) as $attempt ) {
+	$stream   = $client->fetch( new Request( $url ) );
+	$response = $stream->await_response();
+	$body     = $stream->consume_all();
+	printf( "request %d: HTTP %s, body=%d bytes\n", $attempt, $response->status_code, strlen( $body ) );
+}
+
+// Count the entries now present in the cache directory.
+$cache_entries = glob( $cache_dir . '/*' );
+echo 'cache files: ' . count( $cache_entries ) . "\n";
+</script>
+</php-snippet>
+		<h2 id="handle-failures-without-losing-the-queue">Handle failures without losing the queue</h2>
+		<p>Failures arrive as events. That lets a crawler, importer, package installer, or media frontloader log one bad URL and keep processing the rest of the queue. Treat failure handling as part of the event loop, not as one global try/catch around the whole batch.</p>
+<php-snippet blueprint="toolkit-setup" name="failures.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$client = new Client( array( 'timeout_ms' => 5000 ) );
+$client->enqueue( array(
+	new Request( 'https://example.com/', array( 'method' => 'HEAD' ) ),
+	new Request( 'https://example.invalid/missing' ), // The reserved .invalid TLD never resolves, so this request exercises the failure path.
+) );
+
+while ( $client->await_next_event() ) { // One event for one request per iteration; a failure does not end the loop.
+	$request = $client->get_request();
+	$event   = $client->get_event();
+
+	if ( Client::EVENT_GOT_HEADERS === $event ) {
+		echo "ok: " . $request->url . " HTTP " . $request->response->status_code . "\n";
+	} elseif ( Client::EVENT_FAILED === $event ) {
+		echo "failed: " . $request->url . " (" . $request->error->message . ")\n"; // Log the reason with the URL, then keep processing the queue.
+	} elseif ( Client::EVENT_FINISHED === $event ) {
+		echo "finished: " . $request->url . "\n";
+	}
+}
+</script>
+</php-snippet>
+		<h2 id="monitor-download-progress">Monitor download progress</h2>
+		<p>When you care about progress, use the event loop directly. Count bytes from each <code>EVENT_BODY_CHUNK_AVAILABLE</code> event and compare them with <code>Content-Length</code> when the server provides one.</p>
+<php-snippet blueprint="toolkit-setup" name="progress.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$url  = 'https://raw.githubusercontent.com/WordPress/php-toolkit/trunk/components/Zip/Tests/fixtures/childrens-literature.zip';
+$dest = sys_get_temp_dir() . '/progress-' . uniqid() . '.zip';
+
+$client  = new Client();
+$request = new Request( $url );
+$client->enqueue( array( $request ) );
+
+$downloaded = 0; // Running total of body bytes received.
+$last_step  = -1; // Percentage shown on the last progress line; -1 means none printed yet.
+@unlink( $dest ); // Make sure the FILE_APPEND writes below start from an empty file.
+
+while ( $client->await_next_event() ) { // Each iteration handles one event.
+	$event   = $client->get_event();
+	$request = $client->get_request(); // Reuses $request for whichever request this event belongs to.
+
+	if ( Client::EVENT_GOT_HEADERS === $event ) {
+		echo "status: " . $request->response->status_code . "\n";
+		continue;
+	}
+
+	if ( Client::EVENT_BODY_CHUNK_AVAILABLE === $event ) {
+		$chunk       = $client->get_response_body_chunk();
+		$downloaded += strlen( $chunk );
+		file_put_contents( $dest, $chunk, FILE_APPEND ); // Write each chunk straight to disk instead of buffering the body.
+
+		$total = $request->response->total_bytes; // NOTE(review): presumably taken from Content-Length; falsy when the size is unknown - confirm.
+		if ( $total ) {
+			$step = min( 100, (int) floor( $downloaded / $total * 100 ) ); // Whole percent, capped at 100.
+			if ( $step >= $last_step + 25 || 100 === $step ) { // Throttle output: at least 25 points since the last line, or the final 100%.
+				echo "progress: {$step}% ({$downloaded}/{$total} bytes)\n";
+				$last_step = $step;
+			}
+		} else {
+			echo "downloaded: {$downloaded} bytes\n"; // No total available, so report the raw byte count per chunk.
+		}
+		continue;
+	}
+
+	if ( Client::EVENT_FINISHED === $event ) {
+		echo "saved: {$dest}\n";
+	} elseif ( Client::EVENT_FAILED === $event ) {
+		echo "failed: " . $request->error->message . "\n"; // Bytes already appended to $dest are left in place.
+	}
+}
+</script>
+</php-snippet>
+		<h2 id="keep-a-sliding-window-of-10-requests">Keep a sliding window of 10 requests</h2>
+		<p>For large queues, do not enqueue everything at once. Keep at most ten active requests, enqueue another as each one finishes, and let the client multiplex only that window.</p>
+<php-snippet blueprint="toolkit-setup" name="sliding-window.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$urls = array();
+for ( $i = 1; $i <= 25; $i++ ) {
+	$urls[] = 'https://example.com/?request=' . $i;
+}
+
+$client  = new Client( array( 'concurrency' => 10 ) );
+$pending = $urls; // URLs that have not been enqueued yet.
+$active  = array(); // Enqueued requests that have not finished, keyed by request id.
+$done    = 0; // Requests that finished or failed so far.
+
+$enqueue_next = function () use ( &$pending, &$active, $client ) { // Moves one URL from $pending into the active window.
+	if ( ! $pending ) {
+		return;
+	}
+	$url     = array_shift( $pending );
+	$request = new Request( $url, array( 'method' => 'HEAD' ) );
+	$active[ $request->id ] = $request;
+	$client->enqueue( array( $request ) );
+};
+
+for ( $i = 0; $i < 10; $i++ ) { // Prime the window with the first ten requests.
+	$enqueue_next();
+}
+
+while ( $active && $client->await_next_event() ) { // Stop as soon as nothing is in flight.
+	$request = $client->get_request();
+	$event   = $client->get_event();
+
+	if ( Client::EVENT_GOT_HEADERS === $event ) {
+		echo "headers {$request->id}: " . $request->response->status_code . "\n";
+		continue;
+	}
+
+	if ( Client::EVENT_FINISHED === $event || Client::EVENT_FAILED === $event ) { // Either outcome frees a slot in the window.
+		unset( $active[ $request->id ] );
+		$done++;
+		echo "finished {$done}/" . count( $urls ) . ", active=" . count( $active ) . "\n"; // Total comes from the URL list, so it tracks the queue size.
+		$enqueue_next();
+	}
+}
+</script>
+</php-snippet>
+		<h2 id="resume-a-partial-download">Resume a partial download</h2>
+		<p>Resuming is an HTTP contract between you and the server. Save what you already have, send a <code>Range</code> request for the remaining bytes, and append only if the server returns <code>206 Partial Content</code>.</p>
+<php-snippet blueprint="toolkit-setup" name="resume-download.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$url  = 'https://raw.githubusercontent.com/WordPress/php-toolkit/trunk/components/Zip/Tests/fixtures/childrens-literature.zip';
+$dest = sys_get_temp_dir() . '/resume-' . uniqid() . '.zip';
+
+$client = new Client();
+
+// Simulate an interrupted first attempt by downloading only the first 32 KB.
+$first = new Request( $url, array(
+	'headers' => array( 'range' => 'bytes=0-32767' ), // Byte ranges are inclusive: 0-32767 is 32768 bytes.
+) );
+$stream   = $client->fetch( $first );
+$response = $stream->await_response();
+file_put_contents( $dest, $stream->consume_all() ); // NOTE(review): written before the 206 check, so a non-206 body also lands in $dest.
+
+if ( 206 !== $response->status_code ) {
+	echo "Server did not honor Range; start over with a full download.\n";
+	exit;
+}
+
+$downloaded = filesize( $dest ); // Size on disk is the offset of the first missing byte.
+echo "partial file: {$downloaded} bytes\n";
+
+$resume = new Request( $url, array(
+	'headers' => array( 'range' => 'bytes=' . $downloaded . '-' ), // Open-ended range: from that offset to the end.
+) );
+$stream   = $client->fetch( $resume );
+$response = $stream->await_response();
+
+if ( 206 !== $response->status_code ) { // Checked before anything is appended to the partial file.
+	echo "Server did not resume; discard partial file and retry from byte 0.\n";
+	exit; // NOTE(review): the partial file is left on disk here; the message leaves cleanup to the caller.
+}
+
+while ( ! $stream->reached_end_of_data() ) {
+	$n = $stream->pull( 8192 ); // Request up to 8192 bytes; $n is the amount passed to consume() below.
+	if ( 0 === $n ) {
+		break;
+	}
+	file_put_contents( $dest, $stream->consume( $n ), FILE_APPEND ); // Append the remainder after the bytes already saved.
+}
+
+echo "complete file: " . filesize( $dest ) . " bytes\n";
+echo "saved: {$dest}\n";
+</script>
+</php-snippet>
+		<h2 id="stream-unzip-a-remote-archive">Stream-unzip a remote archive</h2>
+		<p>Mount the remote archive with <code>ZipFilesystem</code>, then copy it into any writable filesystem. <code>SeekableRequestReadStream</code> caches received bytes to a temporary file so <code>ZipFilesystem</code> can read the central directory and seek to entries without first writing the ZIP yourself.</p>
+<php-snippet blueprint="toolkit-setup" name="stream-unzip.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\ByteStream\SeekableRequestReadStream;
+use WordPress\HttpClient\Request;
+use WordPress\Filesystem\LocalFilesystem;
+use WordPress\Zip\ZipFilesystem;
+use function WordPress\Filesystem\copy_between_filesystems;
+use function WordPress\Filesystem\ls_recursive;
+
+$url  = 'https://raw.githubusercontent.com/WordPress/php-toolkit/trunk/components/Zip/Tests/fixtures/childrens-literature.zip';
+$root = sys_get_temp_dir() . '/remote-zip-' . uniqid(); // Unique extraction directory per run.
+mkdir( $root );
+
+$client = new Client();
+$reader = new SeekableRequestReadStream( // Wraps the request so the ZIP reader below can read it as a stream.
+	new Request( $url ),
+	array( 'client' => $client )
+);
+
+$response = $reader->await_response();
+if ( ! $response->ok() ) { // Print the status and stop rather than parse a non-OK body as a ZIP.
+	echo "HTTP " . $response->status_code . "\n";
+	exit;
+}
+
+$zip   = ZipFilesystem::create( $reader ); // Source: the remote archive.
+$local = LocalFilesystem::create( $root ); // Target: the temp directory created above.
+
+copy_between_filesystems( array( // Copy everything from the archive root into the target root.
+	'source_filesystem' => $zip,
+	'source_path'       => '/',
+	'target_filesystem' => $local,
+	'target_path'       => '/',
+) );
+
+$tree  = ls_recursive( $local, '/' );
+$files = 0;
+array_walk_recursive( $tree, function ( $value, $key ) use ( &$files ) { // Visit every leaf value of the listing.
+	if ( 'type' === $key && 'file' === $value ) { // Count each 'type' => 'file' pair.
+		$files++;
+	}
+} );
+
+echo "extracted {$files} files\n";
+echo "root: {$root}\n";
+</script>
+</php-snippet>
+		<h2 id="parallel-fan-out-fetch-many-urls-at-once">Parallel fan-out: fetch many URLs at once</h2>
+		<p>Enqueue a batch of requests and react to events as they fire. The client multiplexes them — total wall time is roughly the slowest request, not the sum.</p>
+<php-snippet blueprint="toolkit-setup" name="fan-out.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$urls = array(
+	'https://wordpress.org/',
+	'https://make.wordpress.org/',
+	'https://developer.wordpress.org/',
+);
+
+$client = new Client();
+$client->enqueue( array_map( function ( $url ) { // One HEAD request per URL, all enqueued before the loop starts.
+	return new Request( $url, array( 'method' => 'HEAD' ) );
+}, $urls ) );
+
+$results = array(); // Request URL => status code, or an 'ERR ...' string on failure.
+while ( $client->await_next_event() ) {
+	$request = $client->get_request();
+	if ( Client::EVENT_GOT_HEADERS === $client->get_event() ) {
+		$results[ $request->url ] = $request->response->status_code;
+	} elseif ( Client::EVENT_FAILED === $client->get_event() ) {
+		$results[ $request->url ] = 'ERR ' . $request->error->message; // Record the failure and keep draining events.
+	}
+}
+
+foreach ( $results as $url => $status ) { // Entries appear in the order their events arrived.
+	printf( "%-40s %s\n", $url, $status ); // Left-align the URL in a 40-character column.
+}
+</script>
+</php-snippet>
+		<h2 id="stream-a-download-to-disk-without-oom">Stream a download to disk without OOM</h2>
+		<p>Process the body chunk-by-chunk via the event loop. Memory stays flat regardless of file size.</p>
+<php-snippet blueprint="toolkit-setup" name="stream-to-disk.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$dest   = sys_get_temp_dir() . '/wp-readme.html';
+$client = new Client();
+$client->enqueue( array( new Request( 'https://wordpress.org/' ) ) );
+
+$bytes = 0; // Running total of body bytes written.
+@unlink( $dest ); // The file name is fixed, so clear any previous run before appending.
+
+while ( $client->await_next_event() ) {
+	switch ( $client->get_event() ) { // NOTE(review): EVENT_FAILED has no case; a failed request prints only the memory line.
+		case Client::EVENT_BODY_CHUNK_AVAILABLE:
+			$chunk  = $client->get_response_body_chunk();
+			$bytes += strlen( $chunk );
+			file_put_contents( $dest, $chunk, FILE_APPEND ); // Only the current chunk is held in a variable.
+			break;
+		case Client::EVENT_FINISHED:
+			echo "Wrote {$bytes} bytes to {$dest}\n";
+			break;
+	}
+}
+
+echo "Peak memory: " . round( memory_get_peak_usage( true ) / 1024 / 1024, 2 ) . " MB\n"; // true = real allocated size; converted from bytes to MB.
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../bytestream/">ByteStream</a><span>Stream request and response bodies.</span></li>
+			<li><a href="../filesystem/">Filesystem</a><span>Persist large downloads without buffering them in memory.</span></li>
+			<li><a href="../corsproxy/">CORSProxy</a><span>Bridge browser-side tools to servers without CORS headers.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/httpserver/index.html b/docs/_legacy/httpserver/index.html
new file mode 100644
index 000000000..08df63089
--- /dev/null
+++ b/docs/_legacy/httpserver/index.html
@@ -0,0 +1,176 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>HttpServer — PHP Toolkit</title>
+<meta name="description" content="A minimal blocking TCP HTTP server in pure PHP. For CLI tools and tests, not for production traffic.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li class="current"><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>HttpServer</h1>
+		<p class="lede">A minimal blocking TCP HTTP server in pure PHP. For CLI tools and tests, not for production traffic.</p>
+		<code class="install">composer require wp-php-toolkit/http-server</code>
+		<p>Sometimes a PHP tool needs a tiny local HTTP surface: a test fixture server, a webhook receiver during development, a CLI tool with a browser UI, or a demo endpoint for another component. Pulling in a production web framework would obscure the example and add dependencies the toolkit avoids.</p><p>The HttpServer component is intentionally small: a blocking TCP server, incoming request objects, and response writers. It is useful for local tools and tests. It is not a replacement for nginx, Apache, php-fpm, RoadRunner, Swoole, or a production application server.</p>
+		<p>Use HttpServer when a PHP tool needs one local endpoint. A CLI command can open <code>http://127.0.0.1:8765/callback</code> for an OAuth flow, serve fixture JSON to HttpClient tests, or expose a tiny status page during an import.</p><p>The server accepts a connection, parses one request, and gives your handler a response writer. Keep the process lifetime and shutdown rule in your command.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Serve one response</li>
+			<li>Route a small local API</li>
+			<li>Buffer when headers depend on the body</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="hello-world-on-port-8080">Hello world on port 8080</h2>
+		<p class="callout"><strong>Run on your machine:</strong> the Playground sandbox does not allow processes to bind listening TCP ports. Save this snippet locally and run <code>php hello-server.php</code>.</p>
+<php-snippet blueprint="toolkit-setup" name="hello-server.php" runnable="false">
+<script type="application/x-php">
+<?php
+require __DIR__ . '/vendor/autoload.php';
+
+use WordPress\HttpServer\TcpServer;
+use WordPress\HttpServer\IncomingRequest;
+use WordPress\HttpServer\Response\ResponseWriteStream;
+
+$server = new TcpServer( '127.0.0.1', 8080 ); // Loopback address, port 8080.
+
+$server->set_handler( function ( IncomingRequest $request, ResponseWriteStream $response ) { // Receives the request and a writer for its response.
+	$response->send_http_code( 200 ); // Status, then headers, then body bytes.
+	$response->send_header( 'Content-Type', 'text/plain' );
+	$response->append_bytes( "Hello from " . $request->method . " " . $request->url . "\n" ); // Echo back the method and URL that were requested.
+} );
+
+$server->serve( function ( $host, $port ) { // serve() hands this callback the host and port.
+	echo "Listening on http://{$host}:{$port}\n";
+} );
+</script>
+</php-snippet>
+		<h2 id="a-tiny-json-router">A tiny JSON router</h2>
+		<p class="callout"><strong>Run on your machine:</strong> needs a listening port. Once running, try <code>curl localhost:8080/api/status</code>.</p><p>Build a CLI tool with a web UI by switching on the parsed path and method.</p>
+<php-snippet blueprint="toolkit-setup" name="mini-router.php" runnable="false">
+<script type="application/x-php">
+<?php
+require __DIR__ . '/vendor/autoload.php';
+
+use WordPress\HttpServer\TcpServer;
+use WordPress\HttpServer\IncomingRequest;
+use WordPress\HttpServer\Response\ResponseWriteStream;
+
+$server = new TcpServer( '127.0.0.1', 8080 );
+
+$server->set_handler( function ( IncomingRequest $request, ResponseWriteStream $response ) {
+	$path = $request->get_parsed_url()->pathname; // Routing below compares against the pathname of the parsed URL.
+
+	if ( '/api/status' === $path ) { // Matches on path alone, whatever the HTTP method.
+		$response->send_http_code( 200 );
+		$response->send_header( 'Content-Type', 'application/json' );
+		$response->append_bytes( json_encode( array(
+			'ok'     => true,
+			'pid'    => getmypid(),
+			'memory' => memory_get_usage( true ),
+		) ) );
+		return; // Each route returns early so the 404 fallback is reached only when nothing matched.
+	}
+
+	if ( '/api/echo' === $path && 'POST' === $request->method ) {
+		$body = '';
+		while ( ! $request->body_stream->reached_end_of_data() ) { // Drain the request body in reads of up to 4096 bytes.
+			$n = $request->body_stream->pull( 4096 );
+			if ( $n > 0 ) $body .= $request->body_stream->consume( $n ); // NOTE(review): no exit if pull() keeps returning 0 before end of data - confirm it cannot.
+		}
+		$response->send_http_code( 200 );
+		$response->send_header( 'Content-Type', 'text/plain' );
+		$response->append_bytes( $body ); // Send the collected body back unchanged.
+		return;
+	}
+
+	$response->send_http_code( 404 ); // Fallback: unknown path, or /api/echo with a method other than POST.
+	$response->append_bytes( "Not found\n" );
+} );
+
+$server->serve();
+</script>
+</php-snippet>
+		<h2 id="buffered-response-with-auto-content-length">Buffered response with auto Content-Length</h2>
+		<p>Use <code>BufferingResponseWriter</code> when you want the writer to compute <code>Content-Length</code> for you, or when the runtime is CGI-shaped and expects the full body up front. This one runs anywhere — no socket required.</p>
+<php-snippet blueprint="toolkit-setup" name="buffered-writer.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpServer\Response\BufferingResponseWriter;
+
+$writer = new BufferingResponseWriter();
+$writer->send_http_code( 200 );
+$writer->send_header( 'Content-Type', 'text/html' );
+$writer->append_bytes( '<!doctype html><title>Hi</title><h1>Hello</h1>' ); // Body pieces are appended in order.
+$writer->append_bytes( '<p>Buffered body, sent at the end.</p>' );
+
+ob_start(); // Capture whatever close_writing() prints.
+$writer->close_writing();
+$response_body = ob_get_clean(); // Holds the captured output, printed under "body:" below.
+
+echo "headers before send:\n";
+foreach ( $writer->get_buffered_headers() as $name => $value ) { // NOTE(review): read after close_writing(), although the label says "before send".
+	echo "{$name}: {$value}\n";
+}
+echo "\nbody:\n" . $response_body;
+</script>
+<script type="text/expected-output">
+headers before send:
+Content-Type: text/html
+
+body:
+<!doctype html><title>Hi</title><h1>Hello</h1><p>Buffered body, sent at the end.</p>
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../cli/">CLI</a><span>Expose a local browser UI from a command-line tool.</span></li>
+			<li><a href="../httpclient/">HttpClient</a><span>Test client code against a small local fixture server.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/index.html b/docs/_legacy/index.html
new file mode 100644
index 000000000..a79f1dff9
--- /dev/null
+++ b/docs/_legacy/index.html
@@ -0,0 +1,60 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>PHP Toolkit — runnable docs</title>
+<meta name="description" content="Guided docs for eighteen pure-PHP libraries for WordPress and general PHP, with runnable examples powered by WordPress Playground.">
+<link rel="stylesheet" href="assets/style.css?v=20260429-concept-guide">
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="./">PHP Toolkit</a>
+	<nav>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<main class="landing">
+	<h1>PHP Toolkit</h1>
+	<p class="lede">Eighteen standalone pure-PHP libraries for WordPress and general PHP, with no extension or Composer dependencies. Each guide starts with the story for that component, outlines the route through the page, names the main APIs, and then uses examples only where code clarifies the idea.</p>
+
+	<h2>Choose a Path</h2>
+	<ul class="starter-paths">
+		<li><strong>Content and migration</strong><span>Start here when you are importing, exporting, rewriting, or auditing WordPress content.</span><nav aria-label="Content and migration path"><a href="html/">HTML</a> <a href="blockparser/">BlockParser</a> <a href="markdown/">Markdown</a> <a href="xml/">XML</a> <a href="dataliberation/">DataLiberation</a></nav></li>
+		<li><strong>Streams and storage</strong><span>Use this path for archives, large files, testable storage backends, and pure-PHP file movement.</span><nav aria-label="Streams and storage path"><a href="bytestream/">ByteStream</a> <a href="filesystem/">Filesystem</a> <a href="zip/">Zip</a> <a href="git/">Git</a> <a href="merge/">Merge</a></nav></li>
+		<li><strong>Networked tools</strong><span>Use this path for clients, local fixture servers, browser-facing proxies, and CLI workflows.</span><nav aria-label="Networked tools path"><a href="httpclient/">HttpClient</a> <a href="httpserver/">HttpServer</a> <a href="corsproxy/">CORSProxy</a> <a href="cli/">CLI</a></nav></li>
+		<li><strong>WordPress runtime support</strong><span>Use this path when your code needs WordPress-shaped helpers, repeatable sites, or project-specific review rules.</span><nav aria-label="WordPress runtime support path"><a href="polyfill/">Polyfill</a> <a href="blueprints/">Blueprints</a> <a href="coding-standards/">ToolkitCodingStandards</a></nav></li>
+	</ul>
+
+	<h2>Components</h2>
+	<ul class="components">
+		<li><a href="html/"><strong>HTML</strong><span>A pure-PHP HTML5 parser and tag rewriter mirroring WordPress core&#x27;s HTML API.</span></a></li>
+		<li><a href="zip/"><strong>Zip</strong><span>Read and write ZIP archives in pure PHP — no libzip, no ZipArchive.</span></a></li>
+		<li><a href="bytestream/"><strong>ByteStream</strong><span>Composable streaming primitives for reading, writing, transforming, hashing, and compressing byte data.</span></a></li>
+		<li><a href="filesystem/"><strong>Filesystem</strong><span>One Filesystem interface across local disk, in-memory trees, SQLite databases, and ZIP archives.</span></a></li>
+		<li><a href="blockparser/"><strong>BlockParser</strong><span>WordPress core&#x27;s block parser, packaged as a standalone library.</span></a></li>
+		<li><a href="markdown/"><strong>Markdown</strong><span>Bidirectional converter between Markdown and WordPress block markup.</span></a></li>
+		<li><a href="xml/"><strong>XML</strong><span>A streaming, namespace-aware XML processor in pure PHP.</span></a></li>
+		<li><a href="encoding/"><strong>Encoding</strong><span>UTF-8 validation and scrubbing with a pure-PHP fallback when mbstring is unavailable.</span></a></li>
+		<li><a href="dataliberation/"><strong>DataLiberation</strong><span>Streaming WordPress import/export.</span></a></li>
+		<li><a href="git/"><strong>Git</strong><span>A pure-PHP Git client and server.</span></a></li>
+		<li><a href="merge/"><strong>Merge</strong><span>Three-way merge and diff.</span></a></li>
+		<li><a href="httpclient/"><strong>HttpClient</strong><span>Async HTTP client that works without curl.</span></a></li>
+		<li><a href="httpserver/"><strong>HttpServer</strong><span>A minimal blocking TCP HTTP server in pure PHP.</span></a></li>
+		<li><a href="corsproxy/"><strong>CORSProxy</strong><span>A small PHP CORS proxy intended for browser-side code that needs to reach servers without CORS headers.</span></a></li>
+		<li><a href="cli/"><strong>CLI</strong><span>POSIX-style argument parser.</span></a></li>
+		<li><a href="polyfill/"><strong>Polyfill</strong><span>PHP 8 string functions on PHP 7.</span></a></li>
+		<li><a href="blueprints/"><strong>Blueprints</strong><span>Declarative WordPress site provisioning.</span></a></li>
+		<li><a href="coding-standards/"><strong>ToolkitCodingStandards</strong><span>PHP_CodeSniffer sniffs used by this project: enforce Yoda comparisons and ban the short ternary where it…</span></a></li>
+	</ul>
+
+	<h2>How these examples work</h2>
+	<p>Most PHP examples embed <code>&lt;php-snippet&gt;</code> elements from <a href="https://playground.wordpress.net/">WordPress Playground</a>. The first <em>Run</em> click on a page boots a single shared PHP+WordPress runtime in your browser via WebAssembly and unzips the toolkit into it. Subsequent snippets reuse the same runtime, so only the first run pays the boot cost.</p>
+	<p>Examples that need a local listening port, a web server, or deployment-specific config are presented as static code blocks so the page does not imply they can run in the browser sandbox.</p>
+	<p>The toolkit bundle (<code>docs/assets/php-toolkit.zip</code>, ≈1.8&nbsp;MB) ships with the docs, so no third-party CDN is involved.</p>
+</main>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/markdown/index.html b/docs/_legacy/markdown/index.html
new file mode 100644
index 000000000..a433368a0
--- /dev/null
+++ b/docs/_legacy/markdown/index.html
@@ -0,0 +1,242 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Markdown — PHP Toolkit</title>
+<meta name="description" content="Bidirectional converter between Markdown and WordPress block markup. Useful for moving content between Markdown files and WordPress while preserving the structures both formats can express.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li class="current"><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>Markdown</h1>
+		<p class="lede">Bidirectional converter between Markdown and WordPress block markup. Useful for moving content between Markdown files and WordPress while preserving the structures both formats can express.</p>
+		<code class="install">composer require wp-php-toolkit/markdown</code>
+		<p>Many publishing workflows start in Markdown: documentation sites, static-site generators, Git-backed editorial workflows, Obsidian vaults, and developer notes. WordPress stores editor content as block markup. Moving between those worlds by string replacement loses metadata and quickly breaks on lists, tables, code blocks, and frontmatter.</p><p>The Markdown component provides a structured bridge. <code>MarkdownConsumer</code> turns Markdown plus frontmatter into block markup and metadata; <code>MarkdownProducer</code> turns supported block markup back into Markdown. The conversion is meant for practical content workflows, not byte-identical round-tripping of every custom block attribute.</p>
+		<p>Use Markdown for files that humans edit and block markup for content that WordPress stores. This component translates the supported middle ground: headings, paragraphs, lists, code blocks, links, images, and frontmatter-backed metadata.</p><p>Keep unsupported syntax visible. A migration tool should tell you that a file contains a construct it cannot convert instead of silently dropping it before publishing.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Convert one document</li>
+			<li>Carry metadata beside content</li>
+			<li>Prepare a folder import</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="markdown-to-blocks">Markdown to blocks</h2>
+		<p>Feed Markdown into <code>MarkdownConsumer</code>, get block markup back. The result is a <code>BlocksWithMetadata</code> object that holds both the rendered blocks and any frontmatter parsed from the document.</p>
+<php-snippet blueprint="toolkit-setup" name="quickstart.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+
+// Parse a heading plus a paragraph and print the block markup in one chain.
+echo ( new MarkdownConsumer( "# Hello\n\nWelcome to **WordPress**." ) )->consume()->get_block_markup();
+</script>
+<script type="text/expected-output">
+<!-- wp:heading {"level":1} -->
+<h1 class="wp-block-heading" id="hello">Hello</h1>
+<!-- /wp:heading -->
+
+<!-- wp:paragraph -->
+<p>Welcome to <b>WordPress</b>.</p>
+<!-- /wp:paragraph -->
+</script>
+</php-snippet>
+		<h2 id="round-trip-blocks-back-to-markdown">Round-trip: blocks back to Markdown</h2>
+		<p>Pair <code>MarkdownProducer</code> with <code>MarkdownConsumer</code> to convert in either direction. Round-tripping is lossy for block attributes that have no Markdown representation (custom classes, alignment), so do not expect byte-perfect equality.</p>
+<php-snippet blueprint="toolkit-setup" name="roundtrip.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+use WordPress\Markdown\MarkdownProducer;
+
+// Markdown is consumed into blocks, then the producer writes Markdown again.
+$source   = "## Round trip\n\n- one\n- two\n- three\n";
+$consumer = new MarkdownConsumer( $source );
+$producer = new MarkdownProducer( $consumer->consume() );
+echo $producer->produce();
+</script>
+<script type="text/expected-output">
+## Round trip
+
+- one
+- two
+- three
+</script>
+</php-snippet>
+		<h2 id="reading-yaml-frontmatter-as-post-meta">Reading YAML frontmatter as post meta</h2>
+		<p>Frontmatter values come back wrapped in arrays, so a single key can hold multiple values. Use <code>get_meta_value()</code> when you only want the first scalar.</p>
+<php-snippet blueprint="toolkit-setup" name="frontmatter.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+
+$document = <<<'MD'
+---
+post_title: "The Name of the Wind"
+post_status: publish
+tags: [fantasy, kingkiller]
+---
+
+Once upon a time...
+MD;
+
+$consumer = new MarkdownConsumer( $document );
+$consumer->consume();
+
+echo 'Title: ', $consumer->get_meta_value( 'post_title' ), "\n";
+echo 'Status: ', $consumer->get_meta_value( 'post_status' ), "\n";
+$tags = $consumer->get_all_metadata()['tags'][0];
+echo 'Tags: ', implode( ', ', $tags ), "\n";
+</script>
+<script type="text/expected-output">
+Title: The Name of the Wind
+Status: publish
+Tags: fantasy, kingkiller
+</script>
+</php-snippet>
+		<h2 id="migrating-an-obsidian-or-hugo-folder-of-markdown">Migrating an Obsidian or Hugo folder of Markdown</h2>
+		<p>Walk a directory of <code>.md</code> files (Obsidian vault, Hugo <code>content/</code>, Jekyll <code>_posts</code>) and emit one block-markup record per file.</p>
+<php-snippet blueprint="toolkit-setup" name="migrate-folder.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+
+is_dir( '/tmp/vault' ) || mkdir( '/tmp/vault', 0777, true );
+file_put_contents( '/tmp/vault/welcome.md', "---\ntitle: Welcome\n---\n\nHello world." );
+file_put_contents( '/tmp/vault/roadmap.md', "# Roadmap\n\n1. Ship\n2. Iterate" );
+// Convert every file; use the frontmatter title, else fall back to the file name.
+foreach ( glob( '/tmp/vault/*.md' ) as $path ) {
+	$consumer = new MarkdownConsumer( file_get_contents( $path ) );
+	$consumer->consume();
+	$title = $consumer->get_meta_value( 'title' );
+	$title = $title ? $title : basename( $path, '.md' );
+	echo "=== $title ($path) ===\n";
+	echo substr( $consumer->get_block_markup(), 0, 120 ) . "...\n\n";
+}
+</script>
+<script type="text/expected-output">
+=== roadmap (/tmp/<tempfile>/roadmap.md) ===
+<!-- wp:heading {"level":1} -->
+<h1 class="wp-block-heading" id="roadmap">Roadmap</h1>
+<!-- /wp:heading -->
+
+<!-- wp:lis...
+
+=== Welcome (/tmp/<tempfile>/welcome.md) ===
+<!-- wp:paragraph -->
+<p>Hello world.</p>
+<!-- /wp:paragraph -->
+
+...
+</script>
+</php-snippet>
+		<h2 id="counting-blocks-produced-by-a-markdown-document">Counting blocks produced by a Markdown document</h2>
+		<p>After conversion, the block markup is plain WordPress block markup, so <code>parse_blocks()</code> works on it directly. This is the standard way to introspect what the converter emitted before saving to the database.</p>
+<php-snippet blueprint="toolkit-setup" name="count-blocks.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+
+$md = <<<MD
+# Title
+
+A paragraph with **bold** and *italics*.
+
+| Col A | Col B |
+|-------|-------|
+| 1     | 2     |
+
+```php
+echo 'hi';
+```
+
+> A quote.
+MD;
+
+$markup  = ( new MarkdownConsumer( $md ) )->consume()->get_block_markup();
+$tally   = array();
+$pending = parse_blocks( $markup );
+// Breadth-first walk: count each named block, then enqueue its children.
+while ( ! empty( $pending ) ) {
+	$current = array_shift( $pending );
+	$type    = $current['blockName'];
+	if ( null !== $type ) {
+		$tally[ $type ] = ( isset( $tally[ $type ] ) ? $tally[ $type ] : 0 ) + 1;
+	}
+	// Inner blocks go to the back of the queue so they are visited later.
+	$pending = array_merge( $pending, $current['innerBlocks'] );
+}
+
+foreach ( $tally as $type => $total ) {
+	echo "{$type}: {$total}\n";
+}
+</script>
+<script type="text/expected-output">
+core/heading: 1
+core/paragraph: 2
+core/table: 1
+core/code: 1
+core/quote: 1
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../blockparser/">BlockParser</a><span>Understand the block tree created from Markdown output.</span></li>
+			<li><a href="../html/">HTML</a><span>Rewrite rendered HTML fragments without using DOMDocument.</span></li>
+			<li><a href="../dataliberation/">DataLiberation</a><span>Turn Markdown folders into import/export streams.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/merge/index.html b/docs/_legacy/merge/index.html
new file mode 100644
index 000000000..f9b1b0553
--- /dev/null
+++ b/docs/_legacy/merge/index.html
@@ -0,0 +1,266 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Merge — PHP Toolkit</title>
+<meta name="description" content="Three-way merge and diff. Pluggable differ + merger + optional validator.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li class="current"><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>Merge</h1>
+		<p class="lede">Three-way merge and diff. Pluggable differ + merger + optional validator.</p>
+		<code class="install">composer require wp-php-toolkit/merge</code>
+		<p>Content synchronization needs more than "last write wins." A Markdown file changes in Git while the same post changes in WordPress. A generated config changes through both a CLI tool and a UI. In those cases you need a common ancestor, two edited versions, and a way to explain conflicts to a human.</p><p>The Merge component provides the diff and three-way merge primitives used by those workflows. The default examples are line-oriented because that is the most familiar shape, but the strategy is intentionally pluggable: choose the differ, choose the merger, and optionally validate the merged result before accepting it.</p><p>Use the merge result to auto-accept independent edits and to show structured conflicts when a person must decide.</p>
+		<p>A three-way merge needs the common base, your version, and their version. The base tells the merger whether two lines changed independently or collided.</p><p>Start with line merges for Markdown, config files, and generated PHP. Move to a domain-specific differ only when lines hide the real unit of change.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>See the edit</li>
+			<li>Auto-merge independent lines</li>
+			<li>Surface conflicts</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="diff-two-strings-line-by-line">Diff two strings line by line</h2>
+		<p>Feed two strings to <code>LineDiffer</code> and inspect the operations. Every <code>get_changes()</code> entry is a <code>[op, text]</code> pair.</p>
+<php-snippet blueprint="toolkit-setup" name="line-diff.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Merge\Diff\Diff;
+use WordPress\Merge\Diff\LineDiffer;
+
+$before  = "alpha\nbeta\ngamma\n";
+$after   = "alpha\nBETA\ngamma\ndelta\n";
+$changes = ( new LineDiffer() )->diff( $before, $after )->get_changes();
+
+// Map each operation constant to the marker printed in front of the text.
+$markers = array( Diff::DIFF_EQUAL => '=', Diff::DIFF_DELETE => '-', Diff::DIFF_INSERT => '+' );
+foreach ( $changes as list( $operation, $text ) ) {
+	echo $markers[ $operation ], ' ', rtrim( $text ), "\n";
+}
+</script>
+<script type="text/expected-output">
+= alpha
+- beta
++ BETA
+= gamma
++ delta
+=
+</script>
+</php-snippet>
+		<h2 id="render-a-unified-patch">Render a unified patch</h2>
+		<p><code>format_as_git_patch()</code> produces output that mirrors <code>git diff</code>, including hunk headers — handy for emails, CI annotations, or a "what changed?" panel.</p>
+<php-snippet blueprint="toolkit-setup" name="git-patch.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Merge\Diff\LineDiffer;
+
+// Two revisions of the same post header, plus the labels used in the patch.
+$original = "title: Hello\nauthor: Alice\nstatus: draft\n";
+$revised  = "title: Hello, world\nauthor: Alice\nstatus: published\ntags: greeting\n";
+$sources  = array( 'a_source' => 'a/post.yml', 'b_source' => 'b/post.yml' );
+
+$differ = new LineDiffer();
+$patch  = $differ->diff( $original, $revised )->format_as_git_patch( $sources );
+echo $patch;
+</script>
+<script type="text/expected-output">
+diff --git a/post.yml b/post.yml
+--- a/post.yml
++++ b/post.yml
+@@ -1,4 +1,5 @@- title: Hello
++ title: Hello, world
+  author: Alice
+- status: draft
++ status: published
++ tags: greeting
+</script>
+</php-snippet>
+		<h2 id="three-way-merge-with-no-conflicts">Three-way merge with no conflicts</h2>
+		<p>The classic case: each branch changes a different region. Pass the common ancestor plus both edits to <code>MergeStrategy::merge()</code> and read the merged result.</p>
+<php-snippet blueprint="toolkit-setup" name="three-way.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Merge\Diff\LineDiffer;
+use WordPress\Merge\Merge\LineMerger;
+use WordPress\Merge\MergeStrategy;
+
+// Common ancestor plus two edits that touch different lines.
+$base   = "intro\nbody\noutro\n";
+$ours   = "intro updated\nbody\noutro\n";
+$theirs = "intro\nbody\noutro\nappendix\n";
+
+$merger = new MergeStrategy( new LineDiffer(), new LineMerger() );
+$merged = $merger->merge( $base, $ours, $theirs );
+$status = $merged->has_conflicts() ? "conflicts!\n" : "clean merge:\n";
+
+echo $status . $merged->get_merged_content();
+</script>
+<script type="text/expected-output">
+clean merge:
+intro updated
+body
+outro
+appendix
+</script>
+</php-snippet>
+		<h2 id="inspect-and-surface-conflicts">Inspect and surface conflicts</h2>
+		<p>When both sides edit the same region, the merger produces a <code>MergeConflict</code>. The merged content carries Git-style markers, but the structured <code>get_conflicts()</code> output is what you want for a UI that lets the user pick a side.</p>
+<php-snippet blueprint="toolkit-setup" name="conflicts.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Merge\Diff\LineDiffer;
+use WordPress\Merge\Merge\LineMerger;
+use WordPress\Merge\MergeStrategy;
+
+$base  = "line 1\nline 2\n";
+$alice = "line 1\nline 2 from Alice\n";
+$bob   = "line 1\nline 2 from Bob\n";
+
+$merge = ( new MergeStrategy( new LineDiffer(), new LineMerger() ) )->merge( $base, $alice, $bob );
+
+// Structured view: print both sides of every conflict the merger reported.
+$conflicts = $merge->has_conflicts() ? $merge->get_conflicts() : array();
+foreach ( $conflicts as $conflict ) {
+	echo "ours:   ", trim( $conflict->ours ), "\n";
+	echo "theirs: ", trim( $conflict->theirs ), "\n";
+}
+
+// Textual view: the merged content with conflict markers embedded.
+echo "\n--- merged content with markers ---\n", $merge->get_merged_content();
+</script>
+<script type="text/expected-output">
+ours:   line 2 from Alice
+theirs: line 2 from Bob
+
+--- merged content with markers ---
+line 1
+
+<<<<<<< HEAD
+line 2 from Alice
+
+=======
+line 2 from Bob
+
+>>>>>>> incoming
+</script>
+</php-snippet>
+		<h2 id="sync-a-markdown-folder-against-an-edited-db-copy">Sync a Markdown folder against an edited DB copy</h2>
+		<p>A real-world scenario: posts live both in a Git-tracked Markdown folder and in WordPress, and someone edits each. Three-way-merge each post against its common ancestor.</p>
+<php-snippet blueprint="toolkit-setup" name="sync-folder-vs-db.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Merge\Diff\LineDiffer;
+use WordPress\Merge\Merge\LineMerger;
+use WordPress\Merge\MergeStrategy;
+
+$merger = new MergeStrategy( new LineDiffer(), new LineMerger() );
+// Each post carries the common ancestor (base), the on-disk edit, and the DB edit.
+$revisions = array(
+	'hello.md' => array(
+		'base' => "# Hello\nDraft body.\n",
+		'disk' => "# Hello\nDraft body, expanded on disk.\n",
+		'db'   => "# Hello\nDraft body.\nNew section from the editor.\n",
+	),
+	'about.md' => array(
+		'base' => "# About\nWho we are.\n",
+		'disk' => "# About\nWho *they* are.\n",
+		'db'   => "# About\nWho we really are.\n",
+	),
+);
+
+foreach ( $revisions as $file => $copy ) {
+	$outcome = $merger->merge( $copy['base'], $copy['disk'], $copy['db'] );
+	$verdict = $outcome->has_conflicts() ? "(conflict — needs review)\n" : "(auto-merged)\n";
+	echo "=== {$file} ===\n", $verdict;
+	echo $outcome->get_merged_content(), "\n";
+}
+</script>
+<script type="text/expected-output">
+=== hello.md ===
+(conflict — needs review)
+# Hello
+
+<<<<<<< HEAD
+Draft body, expanded on disk.
+
+=======
+New section from the editor.
+
+>>>>>>> incoming 
+
+
+=== about.md ===
+(conflict — needs review)
+# About
+
+<<<<<<< HEAD
+Who *they* are.
+
+=======
+Who we really are.
+
+>>>>>>> incoming
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../git/">Git</a><span>Merge file contents discovered through repository history.</span></li>
+			<li><a href="../markdown/">Markdown</a><span>Resolve file-based editorial workflows before converting to blocks.</span></li>
+			<li><a href="../dataliberation/">DataLiberation</a><span>Make content synchronization conflicts visible.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/polyfill/index.html b/docs/_legacy/polyfill/index.html
new file mode 100644
index 000000000..3711a0749
--- /dev/null
+++ b/docs/_legacy/polyfill/index.html
@@ -0,0 +1,194 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Polyfill — PHP Toolkit</title>
+<meta name="description" content="PHP 8 string functions on PHP 7.2+, WordPress hook stubs, and translation/escaping passthroughs so toolkit code runs without WordPress.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li class="current"><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>Polyfill</h1>
+		<p class="lede">PHP 8 string functions on PHP 7.2+, WordPress hook stubs, and translation/escaping passthroughs so toolkit code runs without WordPress.</p>
+		<code class="install">composer require wp-php-toolkit/polyfill</code>
+		<p>A lot of WordPress-adjacent code wants to call <code>esc_html()</code>, <code>__()</code>, or <code>apply_filters()</code> without booting WordPress. The polyfill component provides minimal but real implementations so that code runs unchanged outside WordPress, and stays out of the way when WordPress is loaded (every function uses <code>function_exists()</code> guards).</p>
+		<p>Load Polyfill when toolkit code runs outside WordPress but still calls WordPress-shaped helpers. Standalone tests can call <code>esc_html()</code>, add a filter, or use a translation stub without booting WordPress.</p><p>The component defines only missing functions. If WordPress or the current PHP runtime already provides a function, the polyfill leaves it alone.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Backfill missing PHP helpers</li>
+			<li>Keep familiar WordPress calls</li>
+			<li>Expose extension points</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="php-8-string-functions-on-php-72">PHP 8 string functions on PHP 7.2</h2>
+		<p>The polyfills define the PHP 8 string functions <code>str_contains</code>, <code>str_starts_with</code>, and <code>str_ends_with</code>, plus PHP 7.3's <code>array_key_first</code>, only when they are missing.</p>
+<php-snippet blueprint="toolkit-setup" name="php8-strings.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+// Collect the three string checks first, then dump them with a single call.
+$has_prefix = str_starts_with( '/var/www/html', '/var' );
+$has_suffix = str_ends_with( 'image.png', '.png' );
+$has_needle = str_contains( 'WordPress Toolkit', 'Toolkit' );
+var_dump( $has_prefix, $has_suffix, $has_needle );
+$leading_key = array_key_first( array( 'alpha' => 1, 'beta' => 2 ) );
+echo "first key: {$leading_key}\n";
+</script>
+<script type="text/expected-output">
+bool(true)
+bool(true)
+bool(true)
+first key: alpha
+</script>
+</php-snippet>
+		<h2 id="escaping-and-translation-stubs">Escaping and translation stubs</h2>
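+		<p>Lightweight implementations let you write code that looks WordPressy and runs anywhere: the translation function returns its text unchanged, while the escaping helpers really escape their input.</p>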
+<php-snippet blueprint="toolkit-setup" name="wp-stubs.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+// One line per helper: the translation call first, then the three escapers.
+echo __( 'Hello, world' ), "\n";
+echo esc_html( '<script>alert("xss")<\/script>' ), "\n";
+echo esc_attr( 'a "quoted" value' ), "\n";
+echo esc_url( 'https://example.com/?a=1&b=2' ), "\n";
+</script>
+<script type="text/expected-output">
+Hello, world
+&lt;script&gt;alert(&quot;xss&quot;)&lt;/script&gt;
+a &quot;quoted&quot; value
+https://example.com/?a=1&amp;b=2
+</script>
+</php-snippet>
+		<h2 id="a-simple-filter-chain">A simple filter chain</h2>
+		<p>The hook system is a real implementation of the WordPress filter API: registered callbacks get applied in priority order, and each one transforms the running value.</p>
+<php-snippet blueprint="toolkit-setup" name="filter-chain.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+// Register three callbacks on one hook: trim, lowercase, then hyphenate.
+$hyphenate = function ( $title ) {
+	return preg_replace( '/\s+/', '-', $title );
+};
+foreach ( array( 'trim', 'strtolower', $hyphenate ) as $callback ) {
+	add_filter( 'sanitize_title', $callback );
+}
+echo apply_filters( 'sanitize_title', '  My Post Title  ' ), "\n";
+</script>
+<script type="text/expected-output">
+my-post-title
+</script>
+</php-snippet>
+		<h2 id="priority-ordering-and-multi-arg-passing">Priority ordering and multi-arg passing</h2>
+		<p>Lower priority numbers run first. The fourth argument to <code>add_filter</code> controls how many arguments the callback receives: the filtered value plus any extra context values passed to <code>apply_filters</code>.</p>
+<php-snippet blueprint="toolkit-setup" name="priority-args.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+// Registration order differs from run order: priorities 10, 20, 30 set the sequence.
+add_filter( 'render_price', function ( $html, $price, $currency ) {
+	return $html . " ({$currency} markup)";
+}, 30, 3 );
+
+add_filter( 'render_price', function ( $html, $price ) {
+	return "<strong>{$html}</strong>";
+}, 10, 2 );
+
+add_filter( 'render_price', function ( $html, $price, $currency ) {
+	// The currency code arrives as the third argument, so no per-currency branch is needed.
+	return $html . " {$currency}";
+}, 20, 3 );
+
+echo apply_filters( 'render_price', '19.99', 19.99, 'EUR' ) . "\n";
+</script>
+<script type="text/expected-output">
+<strong>19.99</strong> EUR (EUR markup)
+</script>
+</php-snippet>
+		<h2 id="hook-based-extension-points-in-standalone-libraries">Hook-based extension points in standalone libraries</h2>
+		<p>Use <code>do_action</code> and <code>apply_filters</code> as cheap extension points in your own code, without depending on WordPress.</p>
+<php-snippet blueprint="toolkit-setup" name="library-hooks.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+// A library class that exposes one filter and one action as extension points.
+class ImportPipeline {
+	public function process( array $row ) {
+		$normalized = apply_filters( 'import_pipeline_normalize', $row );
+		do_action( 'import_pipeline_row_processed', $normalized );
+		return $normalized;
+	}
+}
+
+add_filter( 'import_pipeline_normalize', function ( $record ) {
+	$record['email'] = strtolower( trim( $record['email'] ) );
+	return $record;
+} );
+
+$seen = array();
+add_action( 'import_pipeline_row_processed', function ( $record ) use ( &$seen ) {
+	array_push( $seen, $record['email'] );
+} );
+
+$importer = new ImportPipeline();
+foreach ( array( '  USER@EXAMPLE.COM  ', 'OTHER@example.com' ) as $raw_email ) {
+	$importer->process( array( 'email' => $raw_email ) );
+}
+echo implode( "\n", $seen ), "\n";
+</script>
+<script type="text/expected-output">
+user@example.com
+other@example.com
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../html/">HTML</a><span>Run WordPress-shaped escaping and translation helpers beside HTML processors.</span></li>
+			<li><a href="../blockparser/">BlockParser</a><span>Keep standalone block tooling familiar outside WordPress.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/xml/index.html b/docs/_legacy/xml/index.html
new file mode 100644
index 000000000..facff8a2b
--- /dev/null
+++ b/docs/_legacy/xml/index.html
@@ -0,0 +1,210 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>XML — PHP Toolkit</title>
+<meta name="description" content="A streaming, namespace-aware XML processor in pure PHP. Read and modify huge feeds, WXR exports, ePub manifests, and Office Open XML parts without ever loading the document into memory and without depending on libxml2.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li class="current"><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>XML</h1>
+		<p class="lede">A streaming, namespace-aware XML processor in pure PHP. Read and modify huge feeds, WXR exports, ePub manifests, and Office Open XML parts without ever loading the document into memory and without depending on <code>libxml2</code>.</p>
+		<code class="install">composer require wp-php-toolkit/xml</code>
+		<p><code>SimpleXMLElement</code> and <code>DOMDocument</code> both need <code>libxml2</code> and both build a complete in-memory tree. <code>XMLProcessor</code> walks the document forward as a cursor, keeps modifications in a side buffer, and emits the full updated XML with <code>get_updated_xml()</code> only when you ask for it.</p><p>This design came from WordPress-scale documents such as WXR exports. A migration may only need to rewrite <code>wp:attachment_url</code> values or bump a feed attribute, so the processor optimizes for targeted cursor edits instead of a full validating XML stack.</p><p><strong>Footgun #1:</strong> namespace-aware methods use the namespace name declared in <code>xmlns</code>, not the prefix written in the tag. In WXR, <code>get_attribute( 'wp', 'status' )</code> looks for a namespace literally named <code>wp</code>; for the usual WXR declaration you want <code>get_attribute( 'http://wordpress.org/export/1.2/', 'status' )</code>.</p><p><strong>Footgun #2:</strong> in streaming mode <code>next_tag()</code> can return false because input ran out, not because the document ended. Check <code>is_paused_at_incomplete_input()</code> before assuming you're done.</p>
+		<p><code>XMLProcessor</code> walks XML as a cursor. It reads the next tag, exposes attributes and text, records edits, and emits updated XML only when you call <code>get_updated_xml()</code>.</p><p>Query namespaces by URI, not by prefix. In WXR, look for <code>http://wordpress.org/export/1.2/</code> even when the source file writes the prefix as <code>wp:</code>.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Edit one attribute</li>
+			<li>Read namespaced exports</li>
+			<li>Process export-sized files</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="bump-every-price-in-a-catalog">Bump every price in a catalog</h2>
+		<p>Find each <code>&lt;book&gt;</code>, read its price, write a new one, emit the updated document.</p>
+<php-snippet blueprint="toolkit-setup" name="bump-prices.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\XML\XMLProcessor;
+
+$xml = '<catalog>'
+	. '<book sku="A1" price="29.99"><title>PHP Internals</title></book>'
+	. '<book sku="A2" price="14.50"><title>WordPress at Scale</title></book>'
+	. '</catalog>';
+
+$p = XMLProcessor::create_from_string( $xml );
+while ( $p->next_tag( 'book' ) ) { // Visit each book tag in turn.
+	$old = (float) $p->get_attribute( '', 'price' ); // First argument is the namespace name; '' because these attributes are unprefixed.
+	$new = number_format( $old * 1.10, 2, '.', '' ); // +10%, two decimals, '.' as decimal point, no thousands separator.
+	$p->set_attribute( '', 'price', $new );
+}
+
+echo $p->get_updated_xml(); // Emits the document with the recorded attribute edits applied.
+</script>
+<script type="text/expected-output">
+<catalog><book sku="A1" price="32.99"><title>PHP Internals</title></book><book sku="A2" price="15.95"><title>WordPress at Scale</title></book></catalog>
+</script>
+</php-snippet>
+		<h2 id="read-namespaced-attributes-from-a-wxr-export">Read namespaced attributes from a WXR export</h2>
+		<p>WordPress's WXR commonly uses <code>wp:</code>, <code>dc:</code>, and <code>content:</code> prefixes bound to namespace names such as <code>http://wordpress.org/export/1.2/</code>. Pass that expanded namespace name, not the prefix; the processor handles whichever prefix the document actually uses.</p>
+<php-snippet blueprint="toolkit-setup" name="wxr-namespaces.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\XML\XMLProcessor;
+
+$wxr = '<?xml version="1.0"?>'
+	. '<rss xmlns:wp="http://wordpress.org/export/1.2/" xmlns:dc="http://purl.org/dc/elements/1.1/">'
+	. '<channel><item>'
+	. '<title>Hello World</title>'
+	. '<dc:creator>admin</dc:creator>'
+	. '<wp:post_id>42</wp:post_id>'
+	. '<wp:status>publish</wp:status>'
+	. '</item></channel></rss>';
+
+$WP = 'http://wordpress.org/export/1.2/'; // Namespace name bound to the wp: prefix in the sample above.
+$DC = 'http://purl.org/dc/elements/1.1/'; // Namespace name bound to the dc: prefix in the sample above.
+
+$p = XMLProcessor::create_from_string( $wxr );
+while ( $p->next_tag( 'item' ) ) {
+	while ( $p->next_token() ) {
+		if ( $p->is_tag_closer() && 'item' === $p->get_tag_local_name() ) break; // Stop at the closing item tag.
+		if ( ! $p->is_tag_opener() ) continue; // Only opening tags start a "name: value" line.
+		$ns = $p->get_tag_namespace();
+		$local = $p->get_tag_local_name();
+		$prefix = ( $WP === $ns ) ? 'wp/' : ( ( $DC === $ns ) ? 'dc/' : '' ); // Label is chosen by namespace name, not by the prefix written in the document.
+		echo "{$prefix}{$local}: ";
+		while ( $p->next_token() && '#text' !== $p->get_token_name() ) {} // Advance until the next text token (or the end of input).
+		echo trim( $p->get_modifiable_text() ) . "\n";
+	}
+}
+</script>
+<script type="text/expected-output">
+title: Hello World
+dc/creator: admin
+wp/post_id: 42
+wp/status: publish
+</script>
+</php-snippet>
+		<h2 id="rewrite-urls-across-an-entire-wxr-export">Rewrite URLs across an entire WXR export</h2>
+		<p>Large WXR exports can hold many URLs in <code>&lt;link&gt;</code>, <code>&lt;guid&gt;</code>, and post content. Streaming the file lets you rewrite large exports without loading the whole XML document into memory.</p>
+<php-snippet blueprint="toolkit-setup" name="rewrite-wxr-urls.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\XML\XMLProcessor;
+
+$wxr = '<?xml version="1.0"?><rss xmlns:wp="http://wordpress.org/export/1.2/"><channel>'
+	. '<wp:base_site_url>https://old.example.com</wp:base_site_url>'
+	. '<item><link>https://old.example.com/2024/post-1</link>'
+	. '<guid>https://old.example.com/?p=1</guid></item>'
+	. '</channel></rss>';
+
+$from = 'https://old.example.com'; // Origin to search for.
+$to   = 'https://new.example.com'; // Origin to substitute.
+
+$p = XMLProcessor::create_from_string( $wxr );
+$rewritten = 0; // Number of text tokens that were changed.
+
+while ( $p->next_token() ) {
+	if ( '#text' !== $p->get_token_name() ) continue; // Only text tokens are inspected here; attribute values are not.
+	$text = $p->get_modifiable_text();
+	if ( false === strpos( $text, $from ) ) continue; // Leave text that lacks the old origin untouched.
+	$p->set_modifiable_text( str_replace( $from, $to, $text ) );
+	$rewritten++;
+}
+
+echo "rewrote {$rewritten} text nodes\n\n";
+echo $p->get_updated_xml(); // Full document with the recorded text edits applied.
+</script>
+<script type="text/expected-output">
+rewrote 3 text nodes
+
+<?xml version="1.0"?><rss xmlns:wp="http://wordpress.org/export/1.2/"><channel><wp:base_site_url>https://new.example.com</wp:base_site_url><item><link>https://new.example.com/2024/post-1</link><guid>https://new.example.com/?p=1</guid></item></channel></rss>
+</script>
+</php-snippet>
+		<h2 id="parse-opml-to-extract-feed-urls">Parse OPML to extract feed URLs</h2>
+		<p>OPML is the format Feedly and many other feed readers use to import and export feed lists. It is flat, attribute-heavy XML — exactly what a tag processor handles best.</p>
+<php-snippet blueprint="toolkit-setup" name="opml.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\XML\XMLProcessor;
+
+$opml = '<?xml version="1.0"?><opml version="2.0"><head><title>My Feeds</title></head>'
+	. '<body>'
+	. '<outline text="Tech"><outline text="Hacker News" type="rss" xmlUrl="https://news.ycombinator.com/rss"/>'
+	. '<outline text="LWN" type="rss" xmlUrl="https://lwn.net/headlines/rss"/></outline>'
+	. '<outline text="WordPress" type="rss" xmlUrl="https://wordpress.org/news/feed/"/>'
+	. '</body></opml>';
+
+$p = XMLProcessor::create_from_string( $opml );
+while ( $p->next_tag( 'outline' ) ) { // Matches nested outlines too, not just top-level ones.
+	$url = $p->get_attribute( '', 'xmlUrl' );
+	if ( null === $url ) continue; // Grouping outlines such as "Tech" carry no xmlUrl; skip them.
+	echo $p->get_attribute( '', 'text' ) . "\t" . $url . "\n"; // Tab-separated: title, then feed URL.
+}
+</script>
+<script type="text/expected-output">
+Hacker News	https://news.ycombinator.com/rss
+LWN	https://lwn.net/headlines/rss
+WordPress	https://wordpress.org/news/feed/
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../dataliberation/">DataLiberation</a><span>Read and write WXR-sized WordPress exports as entities.</span></li>
+			<li><a href="../encoding/">Encoding</a><span>Validate and scrub text before strict XML processing.</span></li>
+			<li><a href="../bytestream/">ByteStream</a><span>Keep large XML reads incremental.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/_legacy/zip/index.html b/docs/_legacy/zip/index.html
new file mode 100644
index 000000000..9d0d1b1d3
--- /dev/null
+++ b/docs/_legacy/zip/index.html
@@ -0,0 +1,378 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Zip — PHP Toolkit</title>
+<meta name="description" content="Read and write ZIP archives in pure PHP — no libzip, no ZipArchive. Streams entries one at a time, so you can build EPUBs, .docx files, and multi-gigabyte plugin bundles without buffering the archive in memory.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-concept-guide">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-concept-guide" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../">Components</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+<div class="layout">
+	<aside class="sidebar" aria-label="Component navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="../html/">HTML</a></li>
+			<li class="current"><a href="../zip/">Zip</a></li>
+			<li><a href="../bytestream/">ByteStream</a></li>
+			<li><a href="../filesystem/">Filesystem</a></li>
+			<li><a href="../blockparser/">BlockParser</a></li>
+			<li><a href="../markdown/">Markdown</a></li>
+			<li><a href="../xml/">XML</a></li>
+			<li><a href="../encoding/">Encoding</a></li>
+			<li><a href="../dataliberation/">DataLiberation</a></li>
+			<li><a href="../git/">Git</a></li>
+			<li><a href="../merge/">Merge</a></li>
+			<li><a href="../httpclient/">HttpClient</a></li>
+			<li><a href="../httpserver/">HttpServer</a></li>
+			<li><a href="../corsproxy/">CORSProxy</a></li>
+			<li><a href="../cli/">CLI</a></li>
+			<li><a href="../polyfill/">Polyfill</a></li>
+			<li><a href="../blueprints/">Blueprints</a></li>
+			<li><a href="../coding-standards/">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+		<h1>Zip</h1>
+		<p class="lede">Read and write ZIP archives in pure PHP — no <code>libzip</code>, no <code>ZipArchive</code>. Streams entries one at a time, so you can build EPUBs, .docx files, and multi-gigabyte plugin bundles without buffering the archive in memory.</p>
+		<code class="install">composer require wp-php-toolkit/zip</code>
+		<p>Common PHP ZIP workflows rely on the <code>ZipArchive</code> extension or shelling out to <code>zip</code>. Those are awkward in hosts without libzip, WebAssembly builds, and code paths that need to stream archive data through toolkit byte streams.</p><p>The Zip component reads and writes Stored and Deflate archives in pure PHP. The decoder is pull-based, so listing the central directory of a 2 GB ZIP costs roughly the size of the directory itself. The encoder accepts any <code>ByteWriteStream</code> as a sink and writes one entry at a time.</p>
+		<p>Treat a ZIP as a small filesystem with a table of contents at the end. Read the central directory, open one entry stream, and copy that entry where it belongs.</p><p>Use <code>ZipFilesystem</code> when your code wants <code>get_contents()</code> and <code>ls()</code>. Use <code>ZipEncoder</code> and <code>ZipDecoder</code> when the archive format matters, such as an EPUB that must store <code>mimetype</code> first and uncompressed.</p>
+		<p class="you-will-learn-label">You will learn to:</p>
+		<ul class="you-will-learn">
+			<li>Open an archive as files</li>
+			<li>Write a format with rules</li>
+			<li>Move archives through streams</li>
+		</ul>
+		<p class="runtime-note">Most snippets below run in the browser through WordPress Playground. Click <em>Run</em> on any example to execute it; edit the code and run again to see what changes. Static snippets show config or shell commands that need a real local environment.</p>
+		<h2 id="read-a-file-out-of-a-zip">Read a file out of a ZIP</h2>
+		<p><code>ZipFilesystem</code> implements this toolkit's <code>Filesystem</code> interface, so once you wrap the byte reader you can call <code>get_contents()</code>, <code>ls()</code>, and <code>is_dir()</code> just like the other filesystem backends.</p><p><strong>Try this:</strong> after <em>Run</em>, add a second <code>append_file()</code> call before <code>$enc-&gt;close()</code> for a <code>notes.md</code> entry, then call <code>print_r( $zip-&gt;ls( '/' ) )</code> at the end. The directory listing reflects the new entry without re-reading the file.</p>
+<php-snippet blueprint="toolkit-setup" name="teaser-read.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+
+$path = tempnam( sys_get_temp_dir(), 'demo' ) . '.zip'; // tempnam() also creates an empty file at the un-suffixed name; the archive is written to that name plus ".zip".
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out ); // The encoder writes archive bytes into $out.
+$enc->append_file( new FileEntry( array(
+	'path'               => 'readme.txt',
+	'compression_method' => ZipDecoder::COMPRESSION_NONE, // Store this entry without compression.
+	'body_reader'        => new MemoryPipe( 'Hello from inside the zip.' ),
+) ) );
+$enc->close();
+$out->close_writing(); // Finish writing before the archive is reopened for reading below.
+
+$zip = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+echo $zip->get_contents( 'readme.txt' );
+</script>
+<script type="text/expected-output">
+Hello from inside the zip.
+</script>
+</php-snippet>
+		<h2 id="build-an-epub-from-scratch">Build an EPUB from scratch</h2>
+		<p>An EPUB follows one strict ZIP rule: write the <code>mimetype</code> entry first and store it without compression. Deflate the rest of the archive normally.</p><p>Gotcha: e-readers reject EPUBs whose <code>mimetype</code> entry has compression. Use <code>COMPRESSION_NONE</code> for that single entry.</p>
+<php-snippet blueprint="toolkit-setup" name="epub.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+
+$path = tempnam( sys_get_temp_dir(), 'book' ) . '.epub'; // tempnam() also creates an empty file at the un-suffixed name; the book is written to that name plus ".epub".
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+
+// 1) The mimetype entry MUST be first and stored uncompressed.
+$enc->append_file( new FileEntry( array(
+	'path'               => 'mimetype',
+	'compression_method' => ZipDecoder::COMPRESSION_NONE,
+	'body_reader'        => new MemoryPipe( 'application/epub+zip' ),
+) ) );
+
+$container = '<?xml version="1.0"?>' // 2) container.xml names EPUB/package.opf as the root file.
+	. '<container version="1.0" xmlns="urn:oasis:names:tc:opendocument:xmlns:container">'
+	. '<rootfiles><rootfile full-path="EPUB/package.opf" media-type="application/oebps-package+xml"/></rootfiles>'
+	. '</container>';
+
+foreach ( array( // 3) Remaining entries, appended in this order after mimetype.
+	'META-INF/container.xml' => $container,
+	'EPUB/package.opf'       => '<package version="3.0" xmlns="http://www.idpf.org/2007/opf"><metadata/><manifest/><spine/></package>',
+	'EPUB/chapter1.xhtml'    => '<html xmlns="http://www.w3.org/1999/xhtml"><body><h1>Chapter 1</h1><p>It was a dark and stormy night.</p></body></html>',
+) as $name => $body ) {
+	$enc->append_file( new FileEntry( array(
+		'path'               => $name,
+		'compression_method' => ZipDecoder::COMPRESSION_DEFLATE, // Everything except mimetype is deflated.
+		'body_reader'        => new MemoryPipe( $body ),
+	) ) );
+}
+$enc->close();
+$out->close_writing(); // Finish writing before the archive is reopened for reading below.
+
+$zip = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+printf( "mimetype: %s\n", $zip->get_contents( 'mimetype' ) );
+printf( "size on disk: %d bytes\n", filesize( $path ) ); // Size of the finished archive file.
+</script>
+<script type="text/expected-output">
+mimetype: application/epub+zip
+size on disk: 839 bytes
+</script>
+</php-snippet>
+		<h2 id="stream-a-large-entry-without-buffering-it">Stream a large entry without buffering it</h2>
+		<p>Calling <code>get_contents()</code> on a 500 MB CSV inside a ZIP would eat 500 MB of RAM. Use <code>open_read_stream()</code> instead and inflate the entry as you go.</p><p>Gotcha: only one entry stream can be open at a time. Drain or finish the previous stream before opening the next.</p>
+<php-snippet blueprint="toolkit-setup" name="stream-large.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+
+$path = tempnam( sys_get_temp_dir(), 'big' ) . '.zip'; // tempnam() also creates an empty file at the un-suffixed name; the archive is written to that name plus ".zip".
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+$enc->append_file( new FileEntry( array(
+	'path'               => 'data.csv',
+	'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+	'body_reader'        => new MemoryPipe( str_repeat( "id,value,timestamp\n1,foo,2024\n2,bar,2024\n", 5000 ) ), // 41 bytes x 5000 = 205000 bytes, 15000 lines.
+) ) );
+$enc->close();
+$out->close_writing();
+
+$zip    = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+$stream = $zip->open_read_stream( 'data.csv' ); // Read the entry incrementally instead of via get_contents().
+
+$rows  = 0;  // Complete lines seen so far.
+$bytes = 0;  // Bytes consumed so far.
+$tail  = ''; // Partial line carried from one chunk to the next.
+while ( ! $stream->reached_end_of_data() ) {
+	$n = $stream->pull( 8192 ); // Ask for up to 8192 bytes; $n is used below as the byte count to consume.
+	if ( 0 === $n ) break;
+	$chunk  = $tail . $stream->consume( $n ); // Prepend the partial line left over from the previous chunk.
+	$lines  = explode( "\n", $chunk );
+	$tail   = array_pop( $lines ); // Text after the last newline is incomplete; keep it for the next pass.
+	$rows  += count( $lines );
+	$bytes += $n;
+}
+printf( "Inflated %d bytes in 8 KB chunks, parsed %d rows.\n", $bytes, $rows ); // NOTE: a final line without a trailing newline would stay in $tail uncounted; the sample data ends with a newline.
+</script>
+<script type="text/expected-output">
+Inflated 205000 bytes in 8 KB chunks, parsed 15000 rows.
+</script>
+</php-snippet>
+		<h2 id="repack-modify-one-file-copy-the-rest">Repack: modify one file, copy the rest</h2>
+		<p>Updating one file in a ZIP without rewriting the others is impossible at the format level — the central directory points at byte offsets. The pragmatic answer is repack: stream the source archive into a new one, swapping the file you care about.</p>
+<php-snippet blueprint="toolkit-setup" name="repack.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+
+$src_path = tempnam( sys_get_temp_dir(), 'orig' ) . '.zip'; // tempnam() also creates an empty file at the un-suffixed name; the archive is written to that name plus ".zip".
+$src_out  = FileWriteStream::from_path( $src_path, 'truncate' );
+$src_enc  = new ZipEncoder( $src_out );
+foreach ( array( // Build a small source archive to repack.
+	'config.json'   => '{"debug":false,"version":"1.0"}',
+	'app/index.php' => '<?php echo "hello";',
+	'app/style.css' => 'body{color:#333}',
+) as $name => $body ) {
+	$src_enc->append_file( new FileEntry( array(
+		'path'               => $name,
+		'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+		'body_reader'        => new MemoryPipe( $body ),
+	) ) );
+}
+$src_enc->close();
+$src_out->close_writing();
+
+$source   = ZipFilesystem::create( FileReadStream::from_path( $src_path ) );
+$dst_path = tempnam( sys_get_temp_dir(), 'repacked' ) . '.zip';
+$dst_out  = FileWriteStream::from_path( $dst_path, 'truncate' );
+$dst_enc  = new ZipEncoder( $dst_out );
+
+$dirs = array( '/' ); // Queue of directories still to list, starting at the archive root.
+while ( $dirs ) {
+	$dir = array_shift( $dirs ); // Take from the front: breadth-first walk.
+	foreach ( $source->ls( $dir ) as $name ) {
+		$path = rtrim( $dir, '/' ) . '/' . $name; // Join without doubling the slash at the root.
+		if ( $source->is_dir( $path ) ) {
+			$dirs[] = $path; // Descend later; only files are written as entries.
+			continue;
+		}
+		$rel  = ltrim( $path, '/' ); // Entry paths are written without a leading slash.
+		$body = ( 'config.json' === $rel )
+			? '{"debug":true,"version":"1.0.1"}' // The one file being replaced.
+			: $source->get_contents( $rel ); // Every other file is copied as-is (read fully into memory here).
+		$dst_enc->append_file( new FileEntry( array(
+			'path'               => $rel,
+			'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+			'body_reader'        => new MemoryPipe( $body ),
+		) ) );
+	}
+}
+$dst_enc->close();
+$dst_out->close_writing();
+
+$repacked = ZipFilesystem::create( FileReadStream::from_path( $dst_path ) ); // Reopen the new archive to verify the result.
+echo "new config.json: " . $repacked->get_contents( 'config.json' ) . "\n";
+echo "untouched: " . $repacked->get_contents( 'app/index.php' ) . "\n";
+</script>
+<script type="text/expected-output">
+new config.json: {"debug":true,"version":"1.0.1"}
+untouched: <?php echo "hello";
+</script>
+</php-snippet>
+		<h2 id="defend-against-zip-slip">Defend against zip-slip</h2>
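+		<p>A malicious archive can name an entry <code>../../etc/passwd</code> and trick a naive extractor into clobbering files outside the destination. <code>ZipDecoder::sanitize_path()</code> strips leading <code>../</code> segments and collapses internal <code>/../</code> sequences before exposing the path. The result is not guaranteed to be free of dot segments — in the output below, <code>a/../../b/secret</code> becomes <code>a/../b/secret</code> and <code>./safe/path.txt</code> is returned unchanged — so still resolve the final path against the destination directory before writing.</p>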
+<php-snippet blueprint="toolkit-setup" name="zip-slip.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Zip\ZipDecoder;
+
+$evil_inputs = array( // Sample entry names, including traversal attempts and redundant slashes.
+	'../../etc/passwd',
+	'./safe/path.txt',
+	'a/../../b/secret',
+	'a//b///c.txt',
+	'../../../../root/.ssh/authorized_keys',
+);
+foreach ( $evil_inputs as $name ) {
+	printf( "%-45s => %s\n", $name, ZipDecoder::sanitize_path( $name ) ); // %-45s left-aligns the input in a 45-character column.
+}
+</script>
+<script type="text/expected-output">
+../../etc/passwd                              => etc/passwd
+./safe/path.txt                               => ./safe/path.txt
+a/../../b/secret                              => a/../b/secret
+a//b///c.txt                                  => a/b/c.txt
+../../../../root/.ssh/authorized_keys         => root/.ssh/authorized_keys
+</script>
+</php-snippet>
+		<h2 id="pipe-zip-entries-into-an-inmemoryfilesystem">Pipe ZIP entries into an InMemoryFilesystem</h2>
+		<p>Real-world recipe: take an uploaded plugin ZIP, expand it into an <code>InMemoryFilesystem</code> so you can validate, edit, or scan it before it ever touches disk. Three components compose into something you couldn't build with <code>ZipArchive</code> alone.</p>
+<php-snippet blueprint="toolkit-setup" name="zip-to-memfs.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+use function WordPress\Filesystem\copy_between_filesystems;
+
+$path = tempnam( sys_get_temp_dir(), 'app' ) . '.zip'; // tempnam() also creates an empty file at the un-suffixed name; the archive is written to that name plus ".zip".
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+foreach ( array( // Build a small "uploaded plugin" archive to expand.
+	'app/index.php'        => '<?php echo "ok";',
+	'app/lib/util.php'     => '<?php // util',
+	'app/assets/style.css' => 'body{margin:0}',
+	'app/README.md'        => '# App',
+) as $name => $body ) {
+	$enc->append_file( new FileEntry( array(
+		'path'               => $name,
+		'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+		'body_reader'        => new MemoryPipe( $body ),
+	) ) );
+}
+$enc->close();
+$out->close_writing(); // Finish writing before the archive is reopened for reading below.
+
+$zip = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+$mem = InMemoryFilesystem::create();
+copy_between_filesystems( array( // Copy the archive root into the root of the in-memory filesystem.
+	'source_filesystem' => $zip,
+	'source_path'       => '/',
+	'target_filesystem' => $mem,
+	'target_path'       => '/',
+) );
+
+$mem->put_contents( '/app/VERSION', '1.0.0' ); // Edit the in-memory copy; the ZIP on disk is not touched by this call.
+echo "files now in memory:\n";
+$dirs = array( '/' ); // Queue of directories still to list.
+$files = array();
+while ( $dirs ) {
+	$dir = array_shift( $dirs ); // Take from the front: breadth-first walk.
+	foreach ( $mem->ls( $dir ) as $name ) {
+		$p = rtrim( $dir, '/' ) . '/' . $name; // Join without doubling the slash at the root.
+		if ( $mem->is_dir( $p ) ) {
+			$dirs[] = $p;
+			continue;
+		}
+		$files[] = $p;
+	}
+}
+sort( $files ); // Sort so the printed listing does not depend on ls() order.
+foreach ( $files as $file ) { // Separate loop variable so $path keeps pointing at the archive file.
+	echo "  " . $file . "\n";
+}
+</script>
+<script type="text/expected-output">
+files now in memory:
+  /app/README.md
+  /app/VERSION
+  /app/assets/style.css
+  /app/index.php
+  /app/lib/util.php
+</script>
+</php-snippet>
+		<h2 id="see-also">See also</h2>
+		<ul class="related-components">
+			<li><a href="../filesystem/">Filesystem</a><span>Treat an archive like a swappable filesystem backend.</span></li>
+			<li><a href="../bytestream/">ByteStream</a><span>Feed readers and writers without whole-file buffers.</span></li>
+			<li><a href="../httpclient/">HttpClient</a><span>Stream downloaded archives into validation or extraction workflows.</span></li>
+		</ul>
+	</article>
+</div>
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/assets/page.js b/docs/assets/page.js
new file mode 100644
index 000000000..440756e2c
--- /dev/null
+++ b/docs/assets/page.js
@@ -0,0 +1,196 @@
+// Per-page wiring: blueprint, editable snippets, sticky TOC, mobile sidebar toggle.
+//
+// Pages declare their h2/h3 structure plainly; this script:
+//   1. Fills the shared <script id="toolkit-setup"> blueprint with a runtime-resolved
+//      absolute URL to docs/assets/php-toolkit.zip (must be absolute since the
+//      Playground iframe is cross-origin).
+//   2. Builds a sticky table of contents from <h2>/<h3> headings inside .content.
+//   3. Patches each <php-snippet>'s shadow DOM to make the rendered code editable
+//      and to reflect the user's edits back into the runner. This is a stopgap
+//      until <php-snippet> ships an `editable` attribute.
+//   4. Wires the .sidebar-toggle button that shows or hides the sidebar on
+//      narrow screens.
+
+(function () {
+	'use strict';
+
+	// ---------- Blueprint URL injection ----------
+	const setup = document.getElementById('toolkit-setup');
+	if (setup) {
+		const zipUrl = new URL('../assets/php-toolkit.zip', location.href).toString();
+		setup.textContent = JSON.stringify({
+			steps: [
+				{
+					step: 'unzip',
+					zipFile: { resource: 'url', url: zipUrl },
+					extractToPath: '/wordpress/wp-content/php-toolkit',
+				},
+			],
+		});
+	}
+
+	// ---------- Table of contents ----------
+	function buildToc() {
+		const container = document.querySelector('.toc');
+		const content = document.querySelector('.content');
+		if (!container || !content) return;
+
+		const headings = content.querySelectorAll('h2[id], h2, h3[id], h3');
+		if (!headings.length) {
+			container.remove();
+			return;
+		}
+
+		const list = document.createElement('ol');
+		const links = [];
+		headings.forEach(function (h) {
+			if (!h.id) {
+				h.id = h.textContent
+					.toLowerCase()
+					.replace(/[^\w\s-]/g, '')
+					.trim()
+					.replace(/\s+/g, '-');
+			}
+			const li = document.createElement('li');
+			li.className = 'toc-depth-' + h.tagName.substring(1);
+			const a = document.createElement('a');
+			a.href = '#' + h.id;
+			a.textContent = h.textContent;
+			li.appendChild(a);
+			list.appendChild(li);
+			links.push({ a, target: h });
+		});
+
+		const title = document.createElement('p');
+		title.className = 'toc-title';
+		title.textContent = 'On this page';
+		container.replaceChildren(title, list);
+
+		// Active-section tracking via IntersectionObserver.
+		const byId = new Map();
+		links.forEach(function (l) { byId.set(l.target.id, l.a); });
+
+		const observer = new IntersectionObserver(
+			function (entries) {
+				const visible = entries
+					.filter(function (e) { return e.isIntersecting; })
+					.sort(function (a, b) { return a.target.offsetTop - b.target.offsetTop; });
+				if (!visible.length) return;
+				links.forEach(function (l) { l.a.classList.remove('active'); });
+				const a = byId.get(visible[0].target.id);
+				if (a) a.classList.add('active');
+			},
+			{ rootMargin: '-80px 0px -70% 0px', threshold: 0 }
+		);
+		links.forEach(function (l) { observer.observe(l.target); });
+	}
+
+	// ---------- Editable snippet shim ----------
+	// <php-snippet> renders into shadow DOM:
+	//   <pre><code>...highlighted PHP...</code></pre>
+	// We make that <code> element contentEditable in place and patch _code on input.
+	function patchSnippet(el) {
+		if (el._editablePatched) return;
+		const root = el.shadowRoot;
+		if (!root) {
+			// Wait until the component renders.
+			const obs = new MutationObserver(function () {
+				if (el.shadowRoot && el.shadowRoot.querySelector('pre code')) {
+					obs.disconnect();
+					patchSnippet(el);
+				}
+			});
+			obs.observe(el, { attributes: true, childList: true, subtree: true });
+			return;
+		}
+		const code = root.querySelector('pre code');
+		if (!code) return;
+
+		if (el.getAttribute('runnable') === 'false') {
+			root.querySelectorAll('button').forEach(function (button) {
+				if (/run/i.test(button.textContent || button.getAttribute('aria-label') || '')) {
+					button.style.display = 'none';
+				}
+			});
+			el.setAttribute('data-static-snippet', '');
+			el._editablePatched = true;
+			return;
+		}
+
+		code.setAttribute('contenteditable', 'plaintext-only');
+		code.setAttribute('spellcheck', 'false');
+		code.style.outline = 'none';
+		code.style.caretColor = 'currentColor';
+		el.setAttribute('data-editable', '');
+
+		// On every edit, push the plain text back into the component's internal
+		// _code field so client.run({ code }) sees the new value. The component's
+		// highlightPhp() output stays as-is until the user reloads — that's fine
+		// for an editing session and the highlighter resyncs on next render.
+		code.addEventListener('input', function () {
+			el._code = code.textContent.trim();
+		});
+
+		// Re-highlight on blur so the colors track the user's edits.
+		code.addEventListener('blur', function () {
+			if (typeof el._render === 'function') {
+				const previous = el._code;
+				el._code = code.textContent.trim();
+				// Avoid clobbering output panel state — only the code area is reset.
+				const output = root.querySelector('.output');
+				const wasVisible = output && output.classList.contains('visible');
+				const outputBody = root.querySelector('.output-body');
+				const previousOutput = outputBody ? outputBody.textContent : '';
+				el._render();
+				if (wasVisible) {
+					root.querySelector('.output').classList.add('visible');
+					root.querySelector('.output-body').textContent = previousOutput;
+				}
+				// Re-patch the freshly rendered code element.
+				el._editablePatched = false;
+				patchSnippet(el);
+				el._code = previous;
+			}
+		});
+
+		el._editablePatched = true;
+	}
+
+	function patchAllSnippets() {
+		document.querySelectorAll('php-snippet').forEach(patchSnippet);
+	}
+
+	if (window.customElements && customElements.whenDefined) {
+		customElements.whenDefined('php-snippet').then(function () {
+			// Defer past the component's first render.
+			requestAnimationFrame(patchAllSnippets);
+			// Also catch any late-defined snippets.
+			new MutationObserver(patchAllSnippets).observe(document.body, {
+				childList: true,
+				subtree: true,
+			});
+		});
+	}
+
+	// ---------- Sidebar mobile toggle ----------
+	function wireTocToggle() {
+		const toggle = document.querySelector('.sidebar-toggle');
+		const sidebar = document.querySelector('.sidebar');
+		if (!toggle || !sidebar) return;
+		toggle.addEventListener('click', function () {
+			sidebar.classList.toggle('open');
+			toggle.setAttribute(
+				'aria-expanded',
+				sidebar.classList.contains('open') ? 'true' : 'false'
+			);
+		});
+	}
+
+	if (document.readyState === 'loading') {
+		document.addEventListener('DOMContentLoaded', function () {
+			buildToc();
+			wireTocToggle();
+		});
+	} else {
+		buildToc();
+		wireTocToggle();
+	}
+})();
diff --git a/docs/assets/php-toolkit.zip b/docs/assets/php-toolkit.zip
new file mode 100644
index 000000000..2c3b2a2e0
Binary files /dev/null and b/docs/assets/php-toolkit.zip differ
diff --git a/docs/assets/style.css b/docs/assets/style.css
new file mode 100644
index 000000000..ad3b5a970
--- /dev/null
+++ b/docs/assets/style.css
@@ -0,0 +1,816 @@
+:root {
+	--bg: #ffffff;
+	--fg: #1a1a1a;
+	--muted: #5a5a5a;
+	--border: #e3e3e3;
+	--accent: #2563eb;
+	--accent-hover: #1d4ed8;
+	--code-bg: #f6f8fa;
+	--code-fg: #24292f;
+	--toc-fg: #444;
+	--toc-active: var(--accent);
+}
+
+@media (prefers-color-scheme: dark) {
+	:root {
+		--bg: #0d1117;
+		--fg: #e6edf3;
+		--muted: #8b949e;
+		--border: #30363d;
+		--accent: #58a6ff;
+		--accent-hover: #79b8ff;
+		--code-bg: #161b22;
+		--code-fg: #e6edf3;
+		--toc-fg: #b3becd;
+	}
+}
+
+* { box-sizing: border-box; }
+
+/* Leave room for the sticky header when jumping to an anchor. */
+html { scroll-padding-top: 5rem; }
+
+/* Animate in-page jumps only for readers who have not asked for reduced motion. */
+@media (prefers-reduced-motion: no-preference) {
+	html { scroll-behavior: smooth; }
+}
+
+body {
+	font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
+	background: var(--bg);
+	color: var(--fg);
+	margin: 0;
+	line-height: 1.65;
+	-webkit-font-smoothing: antialiased;
+	font-size: 16px;
+}
+
+a { color: var(--accent); text-decoration: none; }
+a:hover { color: var(--accent-hover); text-decoration: underline; }
+
+header.site {
+	position: sticky;
+	top: 0;
+	z-index: 10;
+	background: var(--bg);
+	border-bottom: 1px solid var(--border);
+	padding: 1rem 1.75rem;
+	display: flex;
+	justify-content: space-between;
+	align-items: center;
+	font-size: 1rem;
+	box-shadow: 0 1px 0 rgba(0, 0, 0, 0.02);
+}
+
+header.site a.brand {
+	color: var(--fg);
+	font-weight: 700;
+	letter-spacing: -0.015em;
+	font-size: 1.08rem;
+}
+
+header.site nav { display: flex; gap: 0.4rem; align-items: center; }
+header.site nav a {
+	color: var(--fg);
+	font-weight: 500;
+	padding: 0.45rem 0.85rem;
+	border-radius: 6px;
+	transition: background 0.12s, color 0.12s;
+}
+header.site nav a:hover {
+	background: var(--code-bg);
+	color: var(--accent);
+	text-decoration: none;
+}
+header.site nav a.github {
+	background: var(--accent);
+	color: white;
+	margin-left: 0.4rem;
+}
+header.site nav a.github:hover { background: var(--accent-hover); color: white; }
+@media (max-width: 600px) {
+	header.site { padding: 0.75rem 1rem; flex-wrap: wrap; }
+	header.site nav { gap: 0.2rem; }
+	header.site nav a { padding: 0.35rem 0.6rem; font-size: 0.92rem; }
+}
+
+footer.site {
+	border-top: 1px solid var(--border);
+	padding: 1.5rem;
+	text-align: center;
+	font-size: 0.85rem;
+	color: var(--muted);
+	margin-top: 4rem;
+}
+
+/* ---------- Landing page ---------- */
+
+.landing {
+	max-width: 880px;
+	margin: 0 auto;
+	padding: 4rem 1.5rem 3rem;
+}
+
+.landing h1 {
+	font-size: 2.6rem;
+	margin: 0 0 0.5rem;
+	letter-spacing: -0.025em;
+	font-weight: 700;
+}
+
+.landing .lede {
+	font-size: 1.15rem;
+	color: var(--muted);
+	margin: 0 0 2rem;
+	max-width: 60ch;
+}
+
+.landing h2 {
+	font-size: 1.35rem;
+	margin: 3rem 0 1rem;
+	letter-spacing: -0.01em;
+	font-weight: 600;
+}
+
+.components {
+	display: grid;
+	grid-template-columns: repeat(auto-fill, minmax(260px, 1fr));
+	gap: 0.75rem;
+	margin: 1.5rem 0;
+	padding: 0;
+	list-style: none;
+}
+
+.components a {
+	display: block;
+	border: 1px solid var(--border);
+	border-radius: 8px;
+	padding: 1rem 1.1rem;
+	color: var(--fg);
+	transition: border-color 0.15s, transform 0.15s;
+}
+
+.components a:hover {
+	border-color: var(--accent);
+	transform: translateY(-1px);
+	text-decoration: none;
+}
+
+.components strong { display: block; font-size: 1rem; margin-bottom: 0.2rem; font-weight: 600; }
+.components span { display: block; font-size: 0.85rem; color: var(--muted); line-height: 1.45; }
+
+.starter-paths {
+	display: grid;
+	grid-template-columns: repeat(auto-fit, minmax(280px, 1fr));
+	gap: 0.85rem;
+	margin: 1.25rem 0 2rem;
+	padding: 0;
+	list-style: none;
+}
+
+.starter-paths li {
+	border: 1px solid var(--border);
+	border-radius: 8px;
+	padding: 1rem 1.1rem;
+}
+
+.starter-paths strong {
+	display: block;
+	font-size: 1rem;
+	margin-bottom: 0.2rem;
+}
+
+.starter-paths span {
+	display: block;
+	color: var(--muted);
+	font-size: 0.88rem;
+	line-height: 1.5;
+}
+
+.starter-paths nav {
+	display: flex;
+	flex-wrap: wrap;
+	gap: 0.45rem;
+	margin-top: 0.8rem;
+}
+
+.starter-paths nav a {
+	border: 1px solid var(--border);
+	border-radius: 4px;
+	padding: 0.18rem 0.55rem;
+	font-size: 0.78rem;
+	color: var(--fg);
+}
+
+.starter-paths nav a:hover {
+	border-color: var(--accent);
+	color: var(--accent);
+	text-decoration: none;
+}
+
+/* ---------- Component page layout ---------- */
+
+.layout {
+	display: grid;
+	grid-template-columns: 240px minmax(0, 1fr);
+	gap: 3rem;
+	max-width: 1180px;
+	margin: 0 auto;
+	padding: 2.5rem 1.5rem 4rem;
+}
+
+.sidebar {
+	position: sticky;
+	top: 5rem;
+	align-self: start;
+	max-height: calc(100vh - 6rem);
+	overflow-y: auto;
+	padding-left: 0.5rem;
+	font-size: 0.88rem;
+	line-height: 1.5;
+}
+
+.components-nav {
+	margin-top: 1.75rem;
+	padding-top: 1.25rem;
+	border-top: 1px solid var(--border);
+}
+
+.components-nav summary {
+	text-transform: uppercase;
+	font-size: 0.72rem;
+	font-weight: 600;
+	letter-spacing: 0.06em;
+	color: var(--muted);
+	cursor: pointer;
+	list-style: none;
+	margin: 0 0 0.6rem;
+	user-select: none;
+}
+
+.components-nav summary::-webkit-details-marker { display: none; }
+.components-nav summary::before {
+	content: "▸";
+	display: inline-block;
+	width: 1em;
+	transition: transform 0.15s;
+	color: var(--muted);
+}
+.components-nav[open] summary::before { transform: rotate(90deg); }
+
+.components-nav ol { list-style: none; padding: 0; margin: 0; }
+.components-nav li { margin: 0; }
+.components-nav a {
+	display: block;
+	padding: 0.18rem 0.65rem;
+	color: var(--toc-fg);
+	border-left: 2px solid transparent;
+	margin-left: -0.65rem;
+	font-size: 0.85rem;
+}
+.components-nav a:hover { color: var(--fg); text-decoration: none; }
+.components-nav li.current a {
+	color: var(--toc-active);
+	border-left-color: var(--toc-active);
+	font-weight: 600;
+}
+
+.toc {
+	font-size: 0.88rem;
+	line-height: 1.5;
+}
+
+.toc-title {
+	text-transform: uppercase;
+	font-size: 0.72rem;
+	font-weight: 600;
+	letter-spacing: 0.06em;
+	color: var(--muted);
+	margin: 0 0 0.6rem;
+}
+
+.toc ol { list-style: none; padding: 0; margin: 0; }
+.toc li { margin: 0; }
+.toc a {
+	display: block;
+	padding: 0.25rem 0;
+	color: var(--toc-fg);
+	border-left: 2px solid transparent;
+	padding-left: 0.65rem;
+	margin-left: -0.65rem;
+}
+.toc a:hover { color: var(--fg); text-decoration: none; }
+.toc a.active { color: var(--toc-active); border-left-color: var(--toc-active); font-weight: 500; }
+.toc .toc-depth-3 a {
+	font-size: 0.82rem;
+	line-height: 1.35;
+	padding-left: 1.35rem;
+}
+
+.sidebar-toggle {
+	display: none;
+	background: transparent;
+	border: 1px solid var(--border);
+	border-radius: 4px;
+	color: var(--fg);
+	font-size: 0.85rem;
+	padding: 0.4rem 0.7rem;
+	cursor: pointer;
+	margin-bottom: 0.5rem;
+}
+
+@media (max-width: 880px) {
+	.layout { grid-template-columns: 1fr; gap: 1rem; padding-top: 1.5rem; }
+	.sidebar {
+		position: static;
+		max-height: none;
+		padding: 0;
+	}
+	.sidebar-toggle { display: block; }
+	.sidebar > .components-nav,
+	.sidebar > .toc { display: none; }
+	.sidebar.open > .components-nav,
+	.sidebar.open > .toc { display: block; }
+}
+
+.content {
+	min-width: 0;
+	max-width: 720px;
+}
+
+.content h1 {
+	font-size: 2.1rem;
+	margin: 0 0 0.4rem;
+	letter-spacing: -0.02em;
+	font-weight: 700;
+}
+
+.content > .lede {
+	font-size: 1.08rem;
+	color: var(--muted);
+	margin: 0 0 0.5rem;
+	max-width: 60ch;
+}
+
+.content .install {
+	display: inline-block;
+	font-family: ui-monospace, "SF Mono", Menlo, monospace;
+	font-size: 0.85rem;
+	background: var(--code-bg);
+	color: var(--code-fg);
+	padding: 0.35rem 0.7rem;
+	border-radius: 5px;
+	border: 1px solid var(--border);
+	margin: 1rem 0 1.5rem;
+}
+
+.content h2 {
+	font-size: 1.4rem;
+	margin: 3rem 0 0.5rem;
+	letter-spacing: -0.012em;
+	font-weight: 600;
+	scroll-margin-top: 5rem;
+}
+
+.content h3 {
+	font-size: 1.05rem;
+	margin: 1.75rem 0 0.4rem;
+	font-weight: 600;
+}
+
+.content p { margin: 0 0 0.9rem; }
+
+.you-will-learn-label {
+	margin: 1.2rem 0 0.3rem;
+	font-weight: 600;
+	color: var(--muted);
+	text-transform: uppercase;
+	letter-spacing: 0.04em;
+	font-size: 0.78rem;
+}
+
+.you-will-learn {
+	margin: 0 0 1.5rem;
+	padding-left: 1.2rem;
+	display: grid;
+	gap: 0.3rem;
+}
+
+.you-will-learn li {
+	line-height: 1.5;
+}
+
+.learning-path {
+	display: grid;
+	gap: 0.85rem;
+	padding-left: 1.4rem;
+	margin: 0.5rem 0 1.5rem;
+}
+
+.learning-path li {
+	padding-left: 0.2rem;
+}
+
+.learning-path strong {
+	display: block;
+	margin-bottom: 0.15rem;
+}
+
+.learning-path span {
+	display: block;
+	color: var(--muted);
+}
+
+.related-components {
+	display: grid;
+	gap: 0.65rem;
+	margin: 0.75rem 0 1.5rem;
+	padding: 0;
+	list-style: none;
+}
+
+.related-components li {
+	border-left: 3px solid var(--border);
+	padding-left: 0.85rem;
+}
+
+.related-components a {
+	display: inline-block;
+	font-weight: 600;
+}
+
+.related-components span {
+	display: block;
+	color: var(--muted);
+	font-size: 0.9rem;
+	line-height: 1.5;
+}
+
+p code, li code, td code {
+	background: var(--code-bg);
+	padding: 0.12em 0.4em;
+	border-radius: 4px;
+	font-family: ui-monospace, "SF Mono", Menlo, monospace;
+	font-size: 0.88em;
+}
+
+.content blockquote {
+	border-left: 3px solid var(--border);
+	margin: 1rem 0;
+	padding: 0.05rem 0 0.05rem 1rem;
+	color: var(--muted);
+}
+
+.content table {
+	border-collapse: collapse;
+	margin: 1rem 0;
+	font-size: 0.92rem;
+	width: 100%;
+}
+.content th, .content td {
+	border: 1px solid var(--border);
+	padding: 0.4rem 0.7rem;
+	text-align: left;
+	vertical-align: top;
+}
+.content th { background: var(--code-bg); font-weight: 600; }
+
+.runtime-note {
+	font-size: 0.85rem;
+	color: var(--muted);
+	background: var(--code-bg);
+	border: 1px solid var(--border);
+	border-radius: 6px;
+	padding: 0.65rem 0.85rem;
+	margin: 0 0 2rem;
+}
+
+.runtime-note strong { color: var(--fg); }
+
+php-snippet { display: block; margin: 1rem 0 1.75rem; }
+
+.code-example {
+	margin: 1rem 0 1.75rem;
+	border: 1px solid var(--border);
+	border-radius: 6px;
+	overflow: hidden;
+	background: var(--code-bg);
+}
+
+.code-example figcaption {
+	border-bottom: 1px solid var(--border);
+	color: var(--muted);
+	font-family: ui-monospace, "SF Mono", Menlo, monospace;
+	font-size: 0.78rem;
+	padding: 0.45rem 0.7rem;
+}
+
+.code-example pre {
+	margin: 0;
+	padding: 0.9rem;
+	overflow-x: auto;
+}
+
+.code-example code {
+	font-family: ui-monospace, "SF Mono", Menlo, monospace;
+	font-size: 0.85rem;
+	color: var(--code-fg);
+}
+
+/* When the editable hack is wired, hint at it without nagging. */
+php-snippet[data-editable] { position: relative; }
+php-snippet[data-editable]::after {
+	content: "Editable — click in the code to change it";
+	position: absolute;
+	right: 0.75rem;
+	bottom: -1.2rem;
+	font-size: 0.72rem;
+	color: var(--muted);
+	pointer-events: none;
+}
+
+.callout {
+	border: 1px solid var(--border);
+	border-left: 3px solid var(--accent);
+	background: var(--code-bg);
+	padding: 0.65rem 0.85rem;
+	border-radius: 4px;
+	font-size: 0.92rem;
+	margin: 1rem 0;
+}
+
+.callout strong { color: var(--fg); }
+
+/* ============================================================
+ * Rewritten docs surface (April 2026)
+ * Landing page, learn track, reference pages, callouts.
+ * ============================================================ */
+
+/* ----- Landing page ----- */
+
+main.landing {
+	max-width: 980px;
+	margin: 0 auto;
+	padding: 2.5rem 1.5rem 4rem;
+}
+
+main.landing h1 {
+	font-size: 2.6rem;
+	line-height: 1.15;
+	margin: 0 0 1rem;
+	letter-spacing: -0.02em;
+}
+
+main.landing .lede {
+	font-size: 1.15rem;
+	color: var(--muted);
+	max-width: 70ch;
+	margin: 0 0 2rem;
+}
+
+.cta-row {
+	display: flex;
+	gap: 0.75rem;
+	flex-wrap: wrap;
+	margin: 1.5rem 0 3rem;
+}
+
+.cta {
+	display: inline-block;
+	padding: 0.7rem 1.2rem;
+	border: 1px solid var(--border);
+	border-radius: 6px;
+	font-weight: 500;
+	color: var(--fg);
+}
+
+.cta:hover { border-color: var(--accent); text-decoration: none; }
+
+.cta.primary {
+	background: var(--accent);
+	color: white;
+	border-color: var(--accent);
+}
+
+.cta.primary:hover { background: var(--accent-hover); border-color: var(--accent-hover); color: white; }
+
+.origins, .insight, .two-doors, .proofs, .how-runnable, .prereqs, .path, .canonical-artifact, .next, .ref-group {
+	margin: 2.5rem 0;
+}
+
+main.landing h2,
+main.learn-landing h2,
+main.reference-landing h2 {
+	font-size: 1.6rem;
+	margin: 0 0 1rem;
+	letter-spacing: -0.01em;
+}
+
+.component-summary {
+	list-style: none;
+	padding: 0;
+	display: grid;
+	gap: 0.6rem;
+	margin: 1rem 0;
+}
+
+.component-summary li {
+	padding: 0.7rem 0.9rem;
+	border-left: 3px solid var(--border);
+	background: var(--code-bg);
+	border-radius: 0 4px 4px 0;
+}
+
+.component-summary strong { display: inline-block; min-width: 9rem; }
+
+.doors {
+	display: grid;
+	gap: 1rem;
+	grid-template-columns: 1fr 1fr;
+	margin: 1rem 0;
+}
+
+@media (max-width: 720px) { .doors { grid-template-columns: 1fr; } }
+
+.door {
+	display: block;
+	padding: 1.4rem;
+	border: 1px solid var(--border);
+	border-radius: 8px;
+	color: var(--fg);
+	transition: border-color 0.15s, transform 0.15s;
+}
+
+.door:hover { border-color: var(--accent); text-decoration: none; transform: translateY(-2px); }
+.door strong { display: block; font-size: 1.1rem; margin-bottom: 0.5rem; }
+.door span { display: block; color: var(--muted); margin-bottom: 0.7rem; }
+.door em { color: var(--accent); font-style: normal; font-weight: 500; }
+
+.proof-table {
+	border-collapse: collapse;
+	width: 100%;
+	margin: 1rem 0;
+	font-size: 0.93rem;
+}
+
+.proof-table td {
+	padding: 0.55rem 0.75rem;
+	border-bottom: 1px solid var(--border);
+	vertical-align: top;
+}
+
+.proof-table td:first-child { white-space: nowrap; color: var(--muted); }
+.proof-table td:nth-child(2) { color: var(--muted); width: 1.5rem; }
+
+/* ----- Learn landing ----- */
+
+main.learn-landing, main.reference-landing {
+	max-width: 880px;
+	margin: 0 auto;
+	padding: 2.5rem 1.5rem 4rem;
+}
+
+ol.chapters {
+	list-style: none;
+	counter-reset: ch;
+	padding: 0;
+	display: grid;
+	gap: 0.7rem;
+	margin: 1rem 0;
+}
+
+ol.chapters li { counter-increment: ch; }
+
+ol.chapters a {
+	display: block;
+	padding: 1rem 1.2rem;
+	border: 1px solid var(--border);
+	border-radius: 6px;
+	color: var(--fg);
+}
+
+ol.chapters a:hover { border-color: var(--accent); text-decoration: none; }
+ol.chapters strong { display: block; margin-bottom: 0.3rem; }
+ol.chapters span { display: block; color: var(--muted); font-size: 0.93rem; }
+
+.canonical-artifact pre {
+	background: var(--code-bg);
+	padding: 1rem;
+	border-radius: 6px;
+	overflow-x: auto;
+	border: 1px solid var(--border);
+	font-size: 0.88rem;
+	line-height: 1.55;
+}
+
+/* ----- Reference landing ----- */
+
+.ref-grid {
+	list-style: none;
+	padding: 0;
+	display: grid;
+	grid-template-columns: repeat(auto-fill, minmax(260px, 1fr));
+	gap: 0.7rem;
+	margin: 1rem 0 1.5rem;
+}
+
+.ref-grid a {
+	display: block;
+	padding: 0.9rem 1rem;
+	border: 1px solid var(--border);
+	border-radius: 6px;
+	color: var(--fg);
+	height: 100%;
+}
+
+.ref-grid a:hover { border-color: var(--accent); text-decoration: none; }
+.ref-grid strong { display: block; margin-bottom: 0.3rem; }
+.ref-grid span { display: block; color: var(--muted); font-size: 0.88rem; line-height: 1.5; }
+
+.legacy-note {
+	margin-top: 2rem;
+	padding: 0.75rem 1rem;
+	background: var(--code-bg);
+	border-left: 3px solid var(--border);
+	color: var(--muted);
+	font-size: 0.92rem;
+}
+
+/* ----- Article chrome (shared with reference + learn pages) ----- */
+
+.breadcrumb {
+	color: var(--muted);
+	font-size: 0.85rem;
+	text-transform: uppercase;
+	letter-spacing: 0.06em;
+	margin: 0 0 0.5rem;
+}
+
+.chapter-nav {
+	display: flex;
+	justify-content: space-between;
+	gap: 1rem;
+	margin: 2.5rem 0 0.5rem;
+	padding-top: 1.5rem;
+	border-top: 1px solid var(--border);
+	font-weight: 500;
+	flex-wrap: wrap;
+}
+
+.chapter-nav .prev { margin-right: auto; }
+/* The section-level `.next` rule (margin: 2.5rem 0) also matches this link.
+ * Zero its vertical margins so it lines up with `.prev` in the flex row. */
+.chapter-nav .next { margin: 0 0 0 auto; }
+
+.next-preview {
+	color: var(--muted);
+	font-size: 0.95rem;
+	margin: 0.5rem 0 0;
+	max-width: 65ch;
+}
+
+/* ----- Callouts ----- */
+
+.callout {
+	display: block;
+	margin: 1.2rem 0;
+	padding: 0.85rem 1rem;
+	border-left: 4px solid var(--border);
+	background: var(--code-bg);
+	border-radius: 0 4px 4px 0;
+	font-size: 0.96rem;
+}
+
+.callout strong { display: inline; margin-right: 0.3rem; }
+
+.callout.try { border-left-color: #10b981; }
+.callout.pitfall { border-left-color: #ef4444; }
+.callout.warning { border-left-color: #f59e0b; }
+.callout.note { border-left-color: var(--accent); }
+
+.callout.you-will-learn { border-left-color: var(--accent); }
+.callout.you-will-learn ul { margin: 0.5rem 0 0; padding-left: 1.2rem; }
+.callout.you-will-learn li { margin: 0.2rem 0; }
+
+/* ----- API tables on reference pages ----- */
+
+.api-table {
+	border-collapse: collapse;
+	width: 100%;
+	margin: 1rem 0 1.5rem;
+	font-size: 0.93rem;
+}
+
+.api-table th, .api-table td {
+	padding: 0.6rem 0.8rem;
+	border-bottom: 1px solid var(--border);
+	vertical-align: top;
+	text-align: left;
+}
+
+.api-table th {
+	font-size: 0.78rem;
+	text-transform: uppercase;
+	letter-spacing: 0.05em;
+	color: var(--muted);
+	font-weight: 600;
+}
+
+.api-table td:first-child { white-space: nowrap; }
+
+.callout.credit {
+	border-left-color: #8b5cf6;
+	background: linear-gradient(to right, rgba(139, 92, 246, 0.06), transparent);
+}
diff --git a/docs/index.html b/docs/index.html
new file mode 100644
index 000000000..d39d364b0
--- /dev/null
+++ b/docs/index.html
@@ -0,0 +1,145 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>PHP Toolkit — pure-PHP libraries for WordPress and the open web</title>
+<meta name="description" content="A pure-PHP toolkit for parsing HTML, reading and writing ZIP archives, streaming bytes, importing content, and a dozen other jobs that PHP normally outsources to extensions. No libxml2, no libzip, no curl, no database. Runs on PHP 7.2 through 8.3 and inside the browser via WordPress Playground.">
+<link rel="stylesheet" href="assets/style.css?v=20260429-credits">
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="./">PHP Toolkit</a>
+	<nav>
+		<a href="learn/">Learn</a>
+		<a href="reference/">Reference</a>
+		<a class="github" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<main class="landing">
+
+<section class="hero">
+	<h1>The pieces of WordPress, without the dependencies.</h1>
+	<p class="lede">PHP Toolkit is a set of small, pure-PHP libraries for the work that WordPress core does every day — parsing HTML, reading ZIP archives, streaming bytes, importing content, making HTTP requests. No <code>libxml2</code>. No <code>libzip</code>. No <code>curl</code>. No database. Runs on PHP 7.2 through 8.3, on Linux, macOS, Windows, and inside the browser via WordPress Playground.</p>
+
+	<div class="cta-row">
+		<a class="cta primary" href="learn/quickstart.html">Quickstart →</a>
+		<a class="cta" href="learn/">Take the tutorial</a>
+		<a class="cta" href="reference/">Browse components</a>
+	</div>
+</section>
+
+<section class="origins">
+	<h2>The problem</h2>
+
+	<p>The PHP ecosystem has spent twenty years assuming the host will provide the hard parts. Need to parse HTML? Install <code>libxml2</code> and reach for <code>DOMDocument</code>. Need a ZIP? Hope <code>ZipArchive</code> is compiled in. Need to fetch a URL? Pray <code>curl</code> is available, then handle the cases where it isn't.</p>
+
+	<p>This works fine until it doesn't. Shared hosts disable extensions. WebAssembly runtimes don't have them at all. WordPress Playground runs in your browser and can't shell out to <code>libzip</code>. New PHP releases break old C bindings. Every extension is a dependency that some user, somewhere, can't satisfy.</p>
+
+	<p>Meanwhile WordPress core has quietly built its own answers: <code>WP_HTML_Tag_Processor</code> and <code>WP_HTML_Processor</code> for HTML, <code>WP_Block_Parser</code> for the editor's serialized content, hand-rolled archive helpers for plugin and theme updates. Pure PHP, no extensions, written carefully because they have to work everywhere from cheap shared hosting to a Raspberry Pi.</p>
+
+	<p>PHP Toolkit lifts those answers out of WordPress and turns them into libraries you can use anywhere.</p>
+</section>
+
+<section class="insight">
+	<h2>The shape of it</h2>
+
+	<p>Eighteen components. Each is a small library focused on one job, distributable as its own Composer package, depending only on PHP itself plus other toolkit components — no Composer packages outside the <code>wp-php-toolkit/*</code> family, no PHP extensions beyond <code>json</code> and <code>mbstring</code>.</p>
+</section>
+
+<section class="all-components">
+	<h2>All eighteen components</h2>
+
+	<h3>Content and migration</h3>
+	<ul class="ref-grid">
+		<li><a href="reference/html.html"><strong>HTML</strong><span>Browser-grade HTML5 parser and tag rewriter. Cursor model, byte-for-byte edits.</span></a></li>
+		<li><a href="reference/blockparser.html"><strong>BlockParser</strong><span>Parse WordPress block markup into a structured tree.</span></a></li>
+		<li><a href="reference/markdown.html"><strong>Markdown</strong><span>Bidirectional Markdown ↔ block markup with frontmatter as metadata.</span></a></li>
+		<li><a href="reference/xml.html"><strong>XML</strong><span>Streaming, namespace-aware XML processor. Edit WXR exports without a tree.</span></a></li>
+		<li><a href="reference/encoding.html"><strong>Encoding</strong><span>UTF-8 validation and scrubbing with a pure-PHP fallback.</span></a></li>
+		<li><a href="reference/dataliberation.html"><strong>DataLiberation</strong><span>Stream WordPress entities between sites; rewrite URLs across an export.</span></a></li>
+	</ul>
+
+	<h3>Streams and storage</h3>
+	<ul class="ref-grid">
+		<li><a href="reference/bytestream.html"><strong>ByteStream</strong><span>Pull / peek / consume primitives. Gzip, hash, limit, window filters compose.</span></a></li>
+		<li><a href="reference/filesystem.html"><strong>Filesystem</strong><span>One interface across disk, memory, SQLite, and ZIP-backed storage.</span></a></li>
+		<li><a href="reference/zip.html"><strong>Zip</strong><span>Read and write ZIP archives one entry at a time. EPUB, .docx, plugin bundles.</span></a></li>
+		<li><a href="reference/git.html"><strong>Git</strong><span>Pure-PHP Git: commits, branches, merges, HTTP push/pull, no shelling out.</span></a></li>
+		<li><a href="reference/merge.html"><strong>Merge</strong><span>Three-way diff and merge with explicit conflict records.</span></a></li>
+	</ul>
+
+	<h3>Networked tools</h3>
+	<ul class="ref-grid">
+		<li><a href="reference/httpclient.html"><strong>HttpClient</strong><span>Async HTTP with progress, redirects, ranged resume, concurrent requests.</span></a></li>
+		<li><a href="reference/httpserver.html"><strong>HttpServer</strong><span>Tiny blocking TCP server for OAuth callbacks, fixtures, status pages.</span></a></li>
+		<li><a href="reference/corsproxy.html"><strong>CORSProxy</strong><span>Server-side fetch for browser apps that can't bypass same-origin.</span></a></li>
+		<li><a href="reference/cli.html"><strong>CLI</strong><span>POSIX argv parser. Long options, short bundles, one static call.</span></a></li>
+	</ul>
+
+	<h3>WordPress runtime support</h3>
+	<ul class="ref-grid">
+		<li><a href="reference/polyfill.html"><strong>Polyfill</strong><span>WordPress-shaped helpers (<code>esc_html</code>, hooks, translations) outside WordPress.</span></a></li>
+		<li><a href="reference/blueprints.html"><strong>Blueprints</strong><span>Versioned recipes for spinning up a WordPress site, plugins, options, content.</span></a></li>
+		<li><a href="reference/coding-standards.html"><strong>ToolkitCodingStandards</strong><span>PHPCS sniffs that encode the project's review feedback as rules.</span></a></li>
+	</ul>
+</section>
+
+<section class="two-doors">
+	<h2>Where to start</h2>
+
+	<div class="doors">
+		<a class="door" href="learn/">
+			<strong>I want to learn the toolkit.</strong>
+			<span>Build a real content importer across four short chapters. We'll start with one HTML rewrite and finish with a ZIP-packaged WXR export. Every code block runs in the browser; every chapter ends with something you can keep.</span>
+			<em>~45 minutes →</em>
+		</a>
+
+		<a class="door" href="reference/">
+			<strong>I'm here to look something up.</strong>
+			<span>Eighteen component pages, each with a one-line definition, a minimal runnable example, refinements, the pitfalls people actually trip on, and links back to the tutorial chapters where the concept first appears.</span>
+			<em>Browse all components →</em>
+		</a>
+	</div>
+</section>
+
+<section class="proofs">
+	<h2>The toolkit in one line each</h2>
+	<table class="proof-table">
+	<tr><td><code>preg_replace</code> for HTML</td><td>→</td><td>HTML's <code>WP_HTML_Tag_Processor</code> rewrites attributes byte-for-byte without re-serializing. Untouched markup stays byte-identical.</td></tr>
+	<tr><td><code>ZipArchive::open()</code></td><td>→</td><td>Zip's <code>ZipFilesystem</code> opens a 2 GB archive using memory proportional to the central directory's size, not the archive's.</td></tr>
+	<tr><td><code>file_get_contents</code> on a URL</td><td>→</td><td>HttpClient streams the response body, supports <code>Range</code> resume, reports progress, and uses curl when available or PHP stream sockets when it isn't.</td></tr>
+	<tr><td><code>DOMDocument::loadHTML</code></td><td>→</td><td>HTML's <code>WP_HTML_Processor</code> parses HTML5 the way browsers do — fragments, implicit tags, the works.</td></tr>
+	<tr><td><code>simplexml_load_string</code></td><td>→</td><td>XML's <code>XMLProcessor</code> walks WXR exports as a cursor and rewrites attributes byte-for-byte, never building a full tree.</td></tr>
+	</table>
+</section>
+
+<section class="credits">
+	<h2>Credits</h2>
+
+	<p>Several toolkit components are PHP ports or wrappers of upstream code:</p>
+
+	<ul class="component-summary">
+		<li><strong>HTML</strong> is a port of WordPress core's <code>WP_HTML_Tag_Processor</code> and <code>WP_HTML_Processor</code>. The toolkit version tracks core; bug fixes and improvements flow in both directions. Source: <a href="https://github.com/WordPress/wordpress-develop/tree/trunk/src/wp-includes/html-api">WordPress/wordpress-develop</a>.</li>
+		<li><strong>BlockParser</strong> is WordPress core's block parser (<code>WP_Block_Parser</code>) packaged as a standalone library so importers and linters can read <a href="https://developer.wordpress.org/block-editor/reference-guides/block-api/">block markup</a> without booting WordPress. Source: <a href="https://github.com/WordPress/wordpress-develop/blob/trunk/src/wp-includes/class-wp-block-parser.php">WordPress/wordpress-develop</a>.</li>
+		<li><strong>Markdown</strong> wraps <a href="https://commonmark.thephpleague.com/"><code>league/commonmark</code></a> for the Markdown parsing itself and <a href="https://github.com/webuni/front-matter"><code>webuni/front-matter</code></a> for the YAML frontmatter handling. The toolkit's own work is the bridge from CommonMark's AST into WordPress block markup, plus the reverse direction.</li>
+		<li><strong>Polyfill</strong>'s WordPress-shaped helpers (<code>esc_html</code>, <code>add_filter</code>, <code>__</code>) defer to WordPress when WordPress is loaded. The standalone implementations match WordPress's behavior so the same code runs both inside and outside the platform.</li>
+	</ul>
+
+	<p>The remaining components — Zip, ByteStream, Filesystem, XML, Encoding, DataLiberation, Git, Merge, HttpClient, HttpServer, CORSProxy, CLI, Blueprints, ToolkitCodingStandards — are toolkit originals, written for this project to fill gaps the PHP ecosystem leaves to extensions.</p>
+</section>
+
+<section class="how-runnable">
+	<h2>How the runnable examples work</h2>
+	<p>Most code blocks on this site are <code>&lt;php-snippet&gt;</code> elements from <a href="https://playground.wordpress.net/">WordPress Playground</a>. Click <em>Run</em> and the page boots a PHP+WordPress runtime in your browser via WebAssembly, unzips the toolkit into it, and executes the snippet. The first run on a page boots the runtime; later runs reuse it. Edit the code in place and click <em>Run</em> again to see what changes.</p>
+	<p>Static code blocks show shell commands, deployment config, or network-bound code that needs a real local environment.</p>
+</section>
+
+</main>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a> · runnable docs powered by <a href="https://wordpress.github.io/wordpress-playground/">WordPress Playground</a>
+</footer>
+</body>
+</html>
diff --git a/docs/learn/01-rewriting-html.html b/docs/learn/01-rewriting-html.html
new file mode 100644
index 000000000..4809b1c89
--- /dev/null
+++ b/docs/learn/01-rewriting-html.html
@@ -0,0 +1,363 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Chapter 1 — Rewriting HTML safely · PHP Toolkit</title>
+<meta name="description" content="Rewrite real-world HTML — lazy-load images, fix relative URLs, strip script tags — using WP_HTML_Tag_Processor's cursor model. Chapter 1 of a tutorial that builds a content importer.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="./">Learn</a>
+		<a href="../reference/">Reference</a>
+		<a class="github" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+
+<aside class="sidebar" aria-label="Tutorial navigation">
+	<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+	<nav class="toc" aria-label="Table of contents"></nav>
+	<details class="components-nav" open>
+		<summary>The path</summary>
+		<ol>
+			<li><a href="quickstart.html">Quickstart</a></li>
+			<li class="current"><a href="01-rewriting-html.html">1. Rewriting HTML</a></li>
+			<li><a href="02-streaming-archives.html">2. Streaming archives</a></li>
+			<li><a href="03-importing-content.html">3. Markdown to WXR</a></li>
+			<li><a href="04-talking-to-the-network.html">4. Talking to the network</a></li>
+			<li><a href="recap.html">Recap</a></li>
+		</ol>
+	</details>
+</aside>
+
+<article class="content">
+
+<p class="breadcrumb">Chapter 1 of 4</p>
+<h1>Rewriting HTML safely</h1>
+
+<p class="lede">In the quickstart you added a single attribute to a single tag. In this chapter we'll do the work the importer actually needs to do on real-world post content: add lazy loading to every image, rewrite relative links to absolute URLs, and strip the script tags and inline event handlers that creep into pasted HTML. By the end you'll have a <code>clean_post_html()</code> function the next chapter will plug into the importer.</p>
+
+<aside class="callout you-will-learn">
+	<strong>You will learn to:</strong>
+	<ul>
+		<li>Walk every tag of a given name with <code>next_tag()</code>, and every tag and text node with <code>next_token()</code>.</li>
+		<li>Add, replace, and remove attributes without disturbing the surrounding bytes.</li>
+		<li>Use <code>get_attribute_names_with_prefix()</code> to remove every <code>on*</code> handler in one pass.</li>
+		<li>Recognize when the tag-level cursor is the right tool, and when to reach for <code>WP_HTML_Processor</code> instead.</li>
+	</ul>
+</aside>
+
+<h2 id="the-input">The input we're cleaning</h2>
+
+<p>The importer's job is to read a folder of Markdown posts. Each post has frontmatter, prose, and inline HTML that survived from a previous CMS — a mix of helpful markup, sloppy markup, and the occasional <code>&lt;script&gt;</code> tag someone pasted from Stack Overflow. Here's a representative example:</p>
+
+<php-snippet blueprint="toolkit-setup" name="raw-post.php" runnable="false">
+<script type="application/x-php">
+<?php
+// Slightly abridged. Real posts can be 5–10 KB of HTML.
+$post_html = <<<HTML
+<p>A weeknight pasta that takes 20 minutes start to finish.
+See <a href="/recipes/sauces">our sauce primer</a> for context,
+or <a href="https://example.com/elsewhere">skip to the canonical version</a>.</p>
+
+<figure>
+	<img src="/uploads/2024/pasta-hero.jpg" alt="Plated pasta">
+	<figcaption onmouseover="trackHover()">Photo: ours.</figcaption>
+</figure>
+
+<p>Watch the <a href="video.html">technique video</a>
+or <a href="https://other.test/x">jump to the discussion</a>.</p>
+
+<script>trackPageview('/recipes/weeknight-pasta');</script>
+HTML;
+</script>
+</php-snippet>
+
+<p>Three things need fixing before this HTML belongs in a database:</p>
+
+<ol>
+	<li>The <code>&lt;img&gt;</code> has no <code>loading</code> hint, so it'll fetch eagerly even when it's far below the fold.</li>
+	<li>Two of the four <code>&lt;a&gt;</code> tags use relative URLs. They were correct on the source site; on the destination site they'll point to nothing.</li>
+	<li>There's a <code>&lt;script&gt;</code> tag and an <code>onmouseover</code> handler. They have to go.</li>
+</ol>
+
+<p>Each of the next three sections fixes one of these. They all use the same component — <code>WP_HTML_Tag_Processor</code> — and the same shape: open a processor over the HTML, walk it, ask the cursor to make edits, then call <code>get_updated_html()</code> for the result.</p>
+
+<h2 id="lazy-load">Lazy-load every image</h2>
+
+<p>Start with the most ergonomic fix: add <code>loading="lazy"</code> to every image that doesn't already have a <code>loading</code> attribute. The processor's filter argument lets us skip everything that isn't an <code>&lt;img&gt;</code>:</p>
+
+<php-snippet blueprint="toolkit-setup" name="lazy-images.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$post_html = <<<HTML
+<figure>
+	<img src="/uploads/2024/pasta-hero.jpg" alt="Plated pasta">
+	<figcaption>Photo: ours.</figcaption>
+</figure>
+<p>Body copy with an inline <img src="emoji.png" alt="" loading="eager"> image.</p>
+HTML;
+
+// Walk only the <img> tags; the tag-name filter skips everything else.
+$tags = new WP_HTML_Tag_Processor( $post_html );
+while ( $tags->next_tag( 'img' ) ) {
+	// Respect an author-provided loading value; only fill in a missing one.
+	if ( null === $tags->get_attribute( 'loading' ) ) {
+		$tags->set_attribute( 'loading', 'lazy' );
+	}
+	// Unconditional: every image gets decoding="async".
+	$tags->set_attribute( 'decoding', 'async' );
+}
+
+// The edits land in the string only when get_updated_html() is called.
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<figure>
+	<img src="/uploads/2024/pasta-hero.jpg" alt="Plated pasta" loading="lazy" decoding="async">
+	<figcaption>Photo: ours.</figcaption>
+</figure>
+<p>Body copy with an inline <img src="emoji.png" alt="" loading="eager" decoding="async"> image.</p>
+</script>
+</php-snippet>
+
+<p>Notice three things in the output. The first <code>&lt;img&gt;</code> gained both <code>loading="lazy"</code> and <code>decoding="async"</code>. The second <code>&lt;img&gt;</code> kept its author-provided <code>loading="eager"</code> — the <code>null === get_attribute( 'loading' )</code> guard saw it and skipped the lazy line — but still gained <code>decoding="async"</code>, because that's an unconditional <code>set_attribute()</code> call. And every byte that wasn't an image attribute came through untouched: the <code>&lt;figure&gt;</code>, the whitespace, the <code>&lt;figcaption&gt;</code>, the <code>&lt;p&gt;</code>, even the prose inside it.</p>
+
+<aside class="callout try">
+	<strong>Try this:</strong> change the second image to also lack a <code>loading</code> attribute, then add a third <code>&lt;img&gt;</code> wrapped in <code>&lt;picture&gt;&lt;source&gt;&lt;img&gt;&lt;/picture&gt;</code>. Run again. The processor walks all of them.
+</aside>
+
+<aside class="callout pitfall">
+	<strong>Pitfall — mutations are buffered.</strong> If you read <code>get_attribute('loading')</code> after a <code>set_attribute('loading', 'lazy')</code> on the same tag, you'll see <code>'lazy'</code>. But if a different bit of code reads the original <code>$post_html</code> string, it sees the unmodified HTML — the edits only land in the string when you call <code>get_updated_html()</code>. This trips people up when they pass the source HTML to a logger or a hash function and wonder why the output doesn't match.
+</aside>
+
+<h2 id="absolute-urls">Rewrite relative URLs to absolute</h2>
+
+<p>The importer needs every link in a post to be addressable from the destination site. <code>/recipes/sauces</code> meant something on the source site; on the destination it points to nothing. We'll resolve every relative <code>href</code> against a base URL — and leave protocol-relative URLs, fragments, and absolute URLs alone.</p>
+
+<php-snippet blueprint="toolkit-setup" name="absolute-urls.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$post_html = '<p>See <a href="/recipes/sauces">our sauce primer</a>, '
+	. 'or <a href="https://other.test/x">the canonical version</a>, '
+	. 'or <a href="video.html">the video</a>, '
+	. 'or <a href="#footnote-1">footnote 1</a>.</p>';
+
+$base = 'https://recipes.example.com/';
+
+// Resolve every relative <a href> against $base. Links that already carry a
+// scheme, scheme-relative links, and same-page fragments are left as written.
+$tags = new WP_HTML_Tag_Processor( $post_html );
+while ( $tags->next_tag( 'a' ) ) {
+	$href = $tags->get_attribute( 'href' );
+	// get_attribute() returns null for a missing attribute and true for a
+	// valueless one (<a href>); only a non-empty string can be resolved.
+	if ( ! is_string( $href ) || '' === $href ) {
+		continue;
+	}
+	// Already a scheme (https:, mailto:, javascript:), or scheme-relative,
+	// or a same-page fragment? Leave it alone.
+	if ( preg_match( '#^[a-z][a-z0-9+.\-]*:#i', $href )
+		|| 0 === strpos( $href, '//' )
+		|| 0 === strpos( $href, '#' ) ) {
+		continue;
+	}
+	// Join base and path with exactly one slash, whichever side supplied it.
+	$tags->set_attribute( 'href', rtrim( $base, '/' ) . '/' . ltrim( $href, '/' ) );
+}
+
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<p>See <a href="https://recipes.example.com/recipes/sauces">our sauce primer</a>, or <a href="https://other.test/x">the canonical version</a>, or <a href="https://recipes.example.com/video.html">the video</a>, or <a href="#footnote-1">footnote 1</a>.</p>
+</script>
+</php-snippet>
+
+<p>The pattern in the body of the loop is a small URL classifier: scheme-bearing URLs and scheme-relative ones (<code>//other.test/...</code>) are already absolute; fragments stay on the current document; everything else gets the base URL prepended. The classifier itself is forgettable boilerplate — what matters is that the processor lets us write it once and apply it to every <code>&lt;a&gt;</code> in the document with five lines of loop scaffolding.</p>
+
+<aside class="callout try">
+	<strong>Try this:</strong> add a <code>mailto:cooks@example.com</code> link and a <code>javascript:void(0)</code> link to the input. Run. The mailto stays intact (good); the javascript link also stays intact (less good — sanitization is the next section's problem, not this one's).
+</aside>
+
+<aside class="callout note">
+	<strong>Note.</strong> Real-world URL resolution has corners (relative paths with <code>..</code>, query-string-only URLs like <code>?page=2</code>, base elements). The toolkit ships a focused URL handling utility under DataLiberation that does the full job. We'll meet it in chapter 3. For now the simple classifier is good enough for the inputs the importer actually sees.
+</aside>
+
+<h2 id="strip-scripts">Strip script tags and inline event handlers</h2>
+
+<p>This is the security-shaped fix. A user pasted some HTML, and an <code>onmouseover</code> handler came along with it. Maybe a <code>&lt;script&gt;</code> tag too. The importer needs to neutralize both before the content lands in a database that will later be rendered into someone else's browser.</p>
+
+<p>For inline event handlers, <code>get_attribute_names_with_prefix( 'on' )</code> returns every attribute on the current tag whose name starts with <code>on</code> — that's <code>onclick</code>, <code>onmouseover</code>, <code>onerror</code>, every variant. We loop over the returned names and remove each.</p>
+
+<p>For <code>&lt;script&gt;</code> tags, <code>set_modifiable_text('')</code> blanks the script's body without disturbing the surrounding markup. Combined with stripping its attributes, the result is an inert <code>&lt;script&gt;&lt;/script&gt;</code> shell — readable, valid HTML that does nothing when a browser executes it.</p>
+
+<php-snippet blueprint="toolkit-setup" name="strip-scripts.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$untrusted = '<p>Hi <b onclick="steal()">friend</b>!</p>'
+	. '<figure><img src="x" onerror="boom()">'
+	. '<figcaption onmouseover="trackHover()">Photo</figcaption></figure>'
+	. '<script>alert("xss")</script>'
+	. '<script src="https://evil.test/x.js"></script>';
+
+// Visit every tag: scripts are emptied outright, every other tag loses its
+// on* attributes.
+$tags = new WP_HTML_Tag_Processor( $untrusted );
+while ( $tags->next_tag() ) {
+	// The input is lower-case; the name is compared in upper case below.
+	$tag = $tags->get_tag();
+
+	// 1. Neutralize script bodies and remove their attributes.
+	if ( 'SCRIPT' === $tag && ! $tags->is_tag_closer() ) {
+		$tags->set_modifiable_text( '' );
+		// The empty prefix is used to list all of the tag's attributes, src included.
+		foreach ( $tags->get_attribute_names_with_prefix( '' ) as $attr ) {
+			$tags->remove_attribute( $attr );
+		}
+		// Nothing is left on this tag for step 2 to strip.
+		continue;
+	}
+
+	// 2. Remove every on* handler on every other tag.
+	foreach ( $tags->get_attribute_names_with_prefix( 'on' ) as $handler ) {
+		$tags->remove_attribute( $handler );
+	}
+}
+
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<p>Hi <b>friend</b>!</p><figure><img src="x"><figcaption>Photo</figcaption></figure><script></script><script></script>
+</script>
+</php-snippet>
+
+<p>Read the output carefully. The <code>onclick</code>, <code>onerror</code>, and <code>onmouseover</code> attributes are gone. Both <code>&lt;script&gt;</code> tags survive structurally — empty, no <code>src</code>, no body — but they're inert. The surrounding <code>&lt;p&gt;</code>, <code>&lt;figure&gt;</code>, and <code>&lt;figcaption&gt;</code> markup is unchanged.</p>
+
+<aside class="callout pitfall">
+	<strong>Pitfall — script tag pairs.</strong> An HTML processor sees <code>&lt;script&gt;</code> twice: once as the opener, once as the closer. The <code>! $tags-&gt;is_tag_closer()</code> guard makes sure we only blank the body when we're sitting on the opener; calling <code>set_modifiable_text()</code> on a closer is a no-op, and the attribute-stripping loop would find nothing to remove, because closing tags carry no attributes. The same shape applies to <code>&lt;style&gt;</code>, <code>&lt;textarea&gt;</code>, and other elements with raw text content.
+</aside>
+
+<aside class="callout warning">
+	<strong>Warning — this is not a complete sanitizer.</strong> Stripping <code>on*</code> handlers and emptying <code>&lt;script&gt;</code> tags closes the most common pasted-HTML vectors. It does not close <code>javascript:</code> URLs in <code>href</code> and <code>src</code>, CSS expressions in <code>style</code>, or SVG-borne event handlers. If you're accepting untrusted HTML from end users (not just migrating known-author content like our importer is), use WordPress's <code>wp_kses_post()</code> after this pass, or build an explicit allowlist of tags and attributes. The Tag Processor gives you the surgical tool; a full sanitizer is a policy decision on top.
+</aside>
+
+<h2 id="combine">Combine the three into one function</h2>
+
+<p>Each of the three rewrites above used its own <code>WP_HTML_Tag_Processor</code> instance. That's fine for a tutorial, but the importer is going to call this on every post — twelve, then a hundred, then a thousand — and each instance allocates a little state. We'll fold all three into a single pass over a single processor.</p>
+
+<p>This is also the function chapter 2 will import and reuse. Save the shape:</p>
+
+<php-snippet blueprint="toolkit-setup" name="clean-post-html.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+/**
+ * Cleans one post's HTML in a single pass over a single tag processor.
+ *
+ * Per tag, in this order:
+ *  - SCRIPT openers have their body blanked and every attribute removed.
+ *  - Every other tag loses its on* attributes.
+ *  - IMG openers gain loading="lazy" (unless a loading attribute is already
+ *    present) and decoding="async".
+ *  - A openers with a relative href have it prefixed with $base_url.
+ *
+ * @param string $html     HTML to clean.
+ * @param string $base_url Base URL that relative hrefs are appended to.
+ * @return string The HTML with all edits applied.
+ */
+function clean_post_html( $html, $base_url ) {
+	$processor = new WP_HTML_Tag_Processor( $html );
+
+	while ( $processor->next_tag() ) {
+		$name      = $processor->get_tag();
+		$is_opener = ! $processor->is_tag_closer();
+
+		// Scripts: empty the body, drop every attribute, and move on.
+		if ( 'SCRIPT' === $name && $is_opener ) {
+			$processor->set_modifiable_text( '' );
+			$all_attributes = $processor->get_attribute_names_with_prefix( '' );
+			foreach ( $all_attributes as $attribute_name ) {
+				$processor->remove_attribute( $attribute_name );
+			}
+			continue;
+		}
+
+		// Every remaining tag loses its inline event handlers.
+		$handlers = $processor->get_attribute_names_with_prefix( 'on' );
+		foreach ( $handlers as $handler_name ) {
+			$processor->remove_attribute( $handler_name );
+		}
+
+		// The image and link rewrites below only apply to opening tags.
+		if ( ! $is_opener ) {
+			continue;
+		}
+
+		// Images: keep an existing loading value, always set decoding.
+		if ( 'IMG' === $name ) {
+			if ( null === $processor->get_attribute( 'loading' ) ) {
+				$processor->set_attribute( 'loading', 'lazy' );
+			}
+			$processor->set_attribute( 'decoding', 'async' );
+			continue;
+		}
+
+		if ( 'A' !== $name ) {
+			continue;
+		}
+
+		// Links: only a non-empty string href can be resolved.
+		$href = $processor->get_attribute( 'href' );
+		if ( ! is_string( $href ) || '' === $href ) {
+			continue;
+		}
+
+		// Scheme-bearing, scheme-relative, and fragment-only hrefs stay as-is.
+		if ( preg_match( '#^[a-z][a-z0-9+.\-]*:#i', $href )
+			|| 0 === strpos( $href, '//' )
+			|| 0 === strpos( $href, '#' ) ) {
+			continue;
+		}
+
+		// Join base and path with exactly one slash between them.
+		$absolute = rtrim( $base_url, '/' ) . '/' . ltrim( $href, '/' );
+		$processor->set_attribute( 'href', $absolute );
+	}
+
+	return $processor->get_updated_html();
+}
+
+$post_html = <<<HTML
+<p>A weeknight pasta. See <a href="/recipes/sauces">our sauce primer</a>.</p>
+<figure>
+	<img src="/uploads/pasta.jpg" alt="Plated pasta">
+	<figcaption onmouseover="trackHover()">Photo: ours.</figcaption>
+</figure>
+<script>trackPageview('/recipes/weeknight-pasta');</script>
+HTML;
+
+echo clean_post_html( $post_html, 'https://recipes.example.com/' );
+</script>
+<script type="text/expected-output">
+<p>A weeknight pasta. See <a href="https://recipes.example.com/recipes/sauces">our sauce primer</a>.</p>
+<figure>
+	<img src="/uploads/pasta.jpg" alt="Plated pasta" loading="lazy" decoding="async">
+	<figcaption>Photo: ours.</figcaption>
+</figure>
+<script></script>
+</script>
+</php-snippet>
+
+<p>One processor instance, one walk, one allocation of update state. Real importers run this on the body of every post they ingest — call it ten thousand times in a long export and the difference between one allocation per post and three is measurable.</p>
+
+<aside class="callout try">
+	<strong>Try this:</strong> add a <code>&lt;style&gt;</code> tag with a body to the input, then extend <code>clean_post_html()</code> to blank <code>&lt;style&gt;</code> bodies the same way it blanks <code>&lt;script&gt;</code> bodies. Run. CSS-borne attacks are rare in author-supplied content but they exist; the same surgical fix applies.
+</aside>
+
+<h2 id="when-tag-is-wrong">When the tag-level cursor is the wrong tool</h2>
+
+<p>Everything above used <code>WP_HTML_Tag_Processor</code>, which walks tags as a flat sequence. It doesn't know that <code>&lt;img&gt;</code> is inside <code>&lt;figure&gt;</code>; it just sees them in document order. For attribute rewriting that's perfect — fast, allocation-light, byte-honest.</p>
+
+<p>It's the wrong tool when ancestry matters. If you need "every <code>&lt;img&gt;</code> directly inside a <code>&lt;figure&gt;</code>, but not images in paragraphs," or "the <code>&lt;h1&gt;</code> at the top of the article body, ignoring <code>&lt;h1&gt;</code>s nested inside <code>&lt;blockquote&gt;</code>," reach for <code>WP_HTML_Processor</code> — the same component, one class up. It implements HTML5 tree construction, so you can query by ancestry (<code>breadcrumbs</code>) and trust that <code>&lt;p&gt;one&lt;p&gt;two</code> parses as two paragraphs the way a browser sees it.</p>
+
+<p>The reference page for the HTML component (<a href="../reference/html.html">reference/html.html</a>) shows both processors side by side with worked examples. We won't need the full processor in the importer.</p>
+
+<h2 id="recap">Recap</h2>
+
+<p>You can now:</p>
+
+<ul>
+	<li>Open a <code>WP_HTML_Tag_Processor</code> over an HTML string and walk it with <code>next_tag()</code>.</li>
+	<li>Add, replace, and remove attributes — and read the result with <code>get_updated_html()</code> — without disturbing untouched bytes.</li>
+	<li>Use <code>get_attribute_names_with_prefix()</code> to find and remove every <code>on*</code> handler in a single pass.</li>
+	<li>Blank the body of a special-content tag (<code>&lt;script&gt;</code>, <code>&lt;style&gt;</code>) with <code>set_modifiable_text('')</code>.</li>
+	<li>Combine multiple rewrites into a single processor walk for performance and clarity.</li>
+	<li>Recognize when the cursor model is the right tool and when ancestry-aware <code>WP_HTML_Processor</code> is.</li>
+</ul>
+
+<p>The <code>clean_post_html()</code> function is the importer's first real piece. We'll use it again in chapter 3.</p>
+
+<nav class="chapter-nav">
+	<a class="prev" href="quickstart.html">← Previous: Quickstart</a>
+	<a class="next" href="02-streaming-archives.html">Next: Chapter 2 — Streaming archives →</a>
+</nav>
+
+<p class="next-preview">In chapter 2 the importer's input becomes a real ZIP file: a thousand Markdown posts in a 40 MB archive that you can't afford to extract to disk on a memory-constrained host. We'll wrap the archive as a <code>Filesystem</code>, read entries one at a time, and pipe them into a memory-backed staging filesystem the next chapter will read from.</p>
+
+</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/learn/02-streaming-archives.html b/docs/learn/02-streaming-archives.html
new file mode 100644
index 000000000..5aaa3f566
--- /dev/null
+++ b/docs/learn/02-streaming-archives.html
@@ -0,0 +1,349 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Chapter 2 — Streaming archives · PHP Toolkit</title>
+<meta name="description" content="Read a ZIP archive without buffering it, mount it as a Filesystem, and stage entries in memory. Chapter 2 of the content-importer tutorial.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="./">Learn</a>
+		<a href="../reference/">Reference</a>
+		<a class="github" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+
+<aside class="sidebar" aria-label="Tutorial navigation">
+	<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+	<nav class="toc" aria-label="Table of contents"></nav>
+	<details class="components-nav" open>
+		<summary>The path</summary>
+		<ol>
+			<li><a href="quickstart.html">Quickstart</a></li>
+			<li><a href="01-rewriting-html.html">1. Rewriting HTML</a></li>
+			<li class="current"><a href="02-streaming-archives.html">2. Streaming archives</a></li>
+			<li><a href="03-importing-content.html">3. Markdown to WXR</a></li>
+			<li><a href="04-talking-to-the-network.html">4. Talking to the network</a></li>
+			<li><a href="recap.html">Recap</a></li>
+		</ol>
+	</details>
+</aside>
+
+<article class="content">
+
+<p class="breadcrumb">Chapter 2 of 4</p>
+<h1>Streaming archives</h1>
+
+<p class="lede">In chapter 1 you wrote <code>clean_post_html()</code>, a function that takes one HTML string and returns a clean one. The importer needs to run that on a thousand posts at a time. In this chapter the input becomes a real ZIP file: a folder of Markdown posts that you can't always extract to disk — the host might not give you a writable scratch directory, the runtime might not have a persistent filesystem at all. We'll wrap the archive as a <code>Filesystem</code>, read entries one at a time, and stage them in memory for chapter 3 to import.</p>
+
+<aside class="callout you-will-learn">
+	<strong>You will learn to:</strong>
+	<ul>
+		<li>Read a ZIP archive through <code>ZipFilesystem</code>, which implements the shared <code>Filesystem</code> interface — same calls as a local directory.</li>
+		<li>Stream a single large entry with <code>open_read_stream()</code> and the pull / consume loop.</li>
+		<li>Compose two filesystems with <code>copy_between_filesystems()</code> to move data between backends.</li>
+		<li>Recognize when an in-memory staging filesystem is the right tool, and what swaps out for production.</li>
+	</ul>
+</aside>
+
+<h2 id="why-streams">Why we don't extract to disk</h2>
+
+<p>The naive approach to importing a ZIP of posts is <code>$zip->extractTo('/tmp/staging')</code>, then walk the directory. That's fine if you control the host. The toolkit's whole point is that you often don't. Shared hosts ration disk quota; WebAssembly runtimes have no persistent disk; Docker containers running as non-root may not be able to write where you'd like.</p>
+
+<p>We sidestep the issue by never extracting. <code>ZipFilesystem</code> reads entry data on demand directly from the archive bytes, and an <code>InMemoryFilesystem</code> gives us a place to stage results that vanishes when the process ends. The importer reads from one and writes to the other; the disk is never involved.</p>
+
+<h2 id="open-zip">Open the input ZIP as a filesystem</h2>
+
+<p>The ZIP component's highest-level type is <code>ZipFilesystem</code> — an archive presented through the same <code>Filesystem</code> interface that <code>InMemoryFilesystem</code> and <code>LocalFilesystem</code> implement. Once you've wrapped it, you call <code>get_contents()</code>, <code>ls()</code>, and <code>is_dir()</code> the same way you would on disk:</p>
+
+<php-snippet blueprint="toolkit-setup" name="open-zip.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+
+// In a real importer this is `$argv[1]`. Here we synthesize the input ZIP
+// inline so the snippet runs end-to-end.
+$path = tempnam( sys_get_temp_dir(), 'posts' ) . '.zip'; // NOTE: tempnam() also creates the un-suffixed file; nothing here deletes it.
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+foreach ( array(
+	'posts/2024-01-pasta.md'   => "---\ntitle: Weeknight pasta\ntags: [dinner, quick]\n---\n\n# Weeknight pasta\n\nA 20-minute recipe.",
+	'posts/2024-02-soup.md'    => "---\ntitle: Carrot soup\ntags: [soup]\n---\n\n# Carrot soup\n\nA cold-day standby.",
+	'posts/2024-03-bread.md'   => "---\ntitle: No-knead bread\n---\n\n# No-knead bread\n\nA loaf in your sleep.",
+) as $name => $body ) { // one archive entry per element: the key is the entry path, the value its bytes
+	$enc->append_file( new FileEntry( array(
+		'path'               => $name,
+		'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+		'body_reader'        => new MemoryPipe( $body ),
+	) ) );
+}
+$enc->close();
+$out->close_writing();
+
+// And here's the part the importer actually does: wrap the archive, list /posts, read each entry whole.
+$zip = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+echo "entries in /posts:\n";
+foreach ( $zip->ls( '/posts' ) as $name ) {
+	$first_line = strtok( $zip->get_contents( '/posts/' . $name ), "\n" ); // text up to the first "\n"; for these posts that is the "---" frontmatter fence
+	echo "  {$name}  --  {$first_line}\n";
+}
+</script>
+<script type="text/expected-output">
+entries in /posts:
+  2024-01-pasta.md  --  ---
+  2024-02-soup.md  --  ---
+  2024-03-bread.md  --  ---
+</script>
+</php-snippet>
+
+<p>Three things matter in that snippet. The build-the-archive part (<code>ZipEncoder</code>, <code>FileEntry</code>, <code>MemoryPipe</code>) is scaffolding so the example runs end-to-end; in your real importer the ZIP comes from <code>argv</code>. The read part is one line: <code>ZipFilesystem::create( FileReadStream::from_path( $path ) )</code> wraps the archive bytes and gives you the interface. And the loop reads each entry's contents, <em>but doesn't extract</em> — the bytes get inflated on demand and discarded after we're done with them. Peak memory tracks the largest single entry rather than the size of the whole archive.</p>
+
+<aside class="callout pitfall">
+	<strong>Pitfall — one entry stream at a time.</strong> The decoder is positional. <code>get_contents()</code> opens an entry, reads it whole, and closes it. If you switch to <code>open_read_stream()</code> for a large entry (next section), you must drain or close that stream before opening another. Holding two open simultaneously is undefined.
+</aside>
+
+<h2 id="stream-large">Stream a large entry without buffering it</h2>
+
+<p>For our small Markdown posts <code>get_contents()</code> is fine. But the importer might also include a <code>data.csv</code> with twenty thousand rows of metadata, or a large JSON file describing categories. <code>open_read_stream()</code> returns a pull-based byte reader instead of a buffered string, so you can process the entry chunk-by-chunk:</p>
+
+<php-snippet blueprint="toolkit-setup" name="stream-large.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+
+$path = tempnam( sys_get_temp_dir(), 'big' ) . '.zip';
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+$enc->append_file( new FileEntry( array(
+	'path'               => 'metadata.csv',
+	'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+	'body_reader'        => new MemoryPipe( str_repeat( "id,slug,date\n1,pasta,2024-01\n", 5000 ) ), // 10,000 lines, each ending in "\n"
+) ) );
+$enc->close();
+$out->close_writing();
+// Open the entry as a pull-based stream instead of reading it whole.
+$zip    = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+$stream = $zip->open_read_stream( 'metadata.csv' );
+// $tail carries the unterminated end of one chunk into the next, so a row split across two chunks is counted once.
+$rows = 0;
+$tail = '';
+while ( ! $stream->reached_end_of_data() ) {
+	$n = $stream->pull( 8192 );
+	if ( 0 === $n ) break;
+	$chunk  = $tail . $stream->consume( $n );
+	$lines  = explode( "\n", $chunk );
+	$tail   = array_pop( $lines ); // the last piece has no "\n" after it yet; it may be '' or a partial row
+	$rows  += count( $lines );
+}
+if ( '' !== $tail ) $rows++; // a final row with no trailing "\n" is still sitting in $tail; count it
+printf( "parsed %d CSV rows in 8 KB chunks; peak memory ~%d KB\n", $rows, (int)( memory_get_peak_usage() / 1024 ) );
+</script>
+</php-snippet>
+
+<p>That pull-loop is the same shape every byte stream in the toolkit uses. <code>pull(8192)</code> means "buffer up to 8 KB"; <code>consume($n)</code> reads and advances. The trailing partial line gets carried into the next iteration. Memory used is the chunk size plus one partial line — the same regardless of whether the file is 50 KB or 5 GB.</p>
+
+<aside class="callout note">
+	<strong>Note.</strong> The reference page for ByteStream covers the same loop pattern in more detail, plus the filters that wrap streams: gzip, hash, limit, window. See <a href="../reference/bytestream.html">reference/bytestream.html</a>.
+</aside>
+
+<h2 id="staging">Stage the imports in memory</h2>
+
+<p>Now we connect the two halves. The input is the ZIP we just opened. The staging area is an <code>InMemoryFilesystem</code> — same interface, no disk. Walking the input and copying into the stage is one helper:</p>
+
+<php-snippet blueprint="toolkit-setup" name="stage-imports.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+use function WordPress\Filesystem\copy_between_filesystems;
+
+// Build a sample input ZIP: two Markdown posts and one placeholder image entry.
+$path = tempnam( sys_get_temp_dir(), 'posts' ) . '.zip';
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+foreach ( array(
+	'posts/pasta.md'  => "---\ntitle: Pasta\n---\n\nQuick pasta.",
+	'posts/soup.md'   => "---\ntitle: Soup\n---\n\nWarm soup.",
+	'images/hero.jpg' => "(fake jpeg bytes)", // placeholder text, not real image data
+) as $name => $body ) {
+	$enc->append_file( new FileEntry( array(
+		'path'               => $name,
+		'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+		'body_reader'        => new MemoryPipe( $body ),
+	) ) );
+}
+$enc->close();
+$out->close_writing();
+
+// Open the input ZIP and a fresh staging filesystem.
+$zip   = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+$stage = InMemoryFilesystem::create();
+
+// One call walks the source and writes to the destination. Both paths are '/', so the archive root maps onto the stage root.
+copy_between_filesystems( array(
+	'source_filesystem' => $zip,
+	'source_path'       => '/',
+	'target_filesystem' => $stage,
+	'target_path'       => '/',
+) );
+
+// The stage is now a writable in-memory tree mirroring the archive.
+echo "staged files:\n";
+foreach ( array( '/posts', '/images' ) as $dir ) { // the two directories created by the sample entries above
+	foreach ( $stage->ls( $dir ) as $name ) {
+		echo "  {$dir}/{$name}\n";
+	}
+}
+
+// You can still write to the stage afterwards — it's mutable.
+$stage->put_contents( '/MANIFEST', "imported " . date( 'c' ) ); // date( 'c' ) is the current ISO 8601 time, so this output differs on every run
+echo "manifest: " . $stage->get_contents( '/MANIFEST' ) . "\n";
+</script>
+</php-snippet>
+
+<p>Read that example carefully because it's the heart of how the importer composes. The input is read-only (a ZIP) and the output is writable (in-memory). Both expose the same interface, so a generic <code>copy_between_filesystems()</code> works on both. In chapter 3 we'll iterate the staged Markdown files and convert them; in chapter 4 we'll add downloaded media to the same stage. The shape doesn't change between chapters — only what's in the stage.</p>
+
+<aside class="callout try">
+	<strong>Try this:</strong> swap <code>InMemoryFilesystem::create()</code> for <code>LocalFilesystem::create($somePath)</code>. The rest of the example works identically — that's the point of the shared interface. For a CLI tool you'd ship to disk; for an in-process importer you'd stay in memory; for tests you'd use the in-memory backend so each test starts fresh.
+</aside>
+
+<h2 id="zip-slip">Defend against malicious archive paths</h2>
+
+<p>Every importer that accepts external ZIPs needs to defend against <em>zip-slip</em>: an archive containing an entry named <code>../../etc/passwd</code> that, if extracted naively, writes outside the intended destination. The toolkit ships a one-line defense:</p>
+
+<php-snippet blueprint="toolkit-setup" name="zip-slip-defense.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Zip\ZipDecoder;
+
+$inputs = array( // entry names as an untrusted archive might supply them
+	'../../etc/passwd', // leading parent-directory segments
+	'./safe/path.txt', // leading current-directory segment
+	'a/../../b/secret', // parent segments that climb past the first component
+	'a//b///c.txt', // repeated separators
+	'../../../../root/.ssh/authorized_keys', // 37 characters, so wider than the 30-column pad below
+);
+foreach ( $inputs as $name ) {
+	printf( "%-30s -> %s\n", $name, ZipDecoder::sanitize_path( $name ) ); // %-30s left-aligns the raw name in a 30-character column
+}
+</script>
+</php-snippet>
+
+<p>Run any entry path through <code>ZipDecoder::sanitize_path()</code> before using it as a key in your destination filesystem. <code>copy_between_filesystems()</code> already does this; if you build your own loop you must too.</p>
+
+<h2 id="combine">Folding it into the importer</h2>
+
+<p>The importer so far has chapter 1's <code>clean_post_html()</code> and chapter 2's stage. Combine them: open the input ZIP, copy it into the stage, then iterate the stage's <code>posts/</code> directory and remember to apply <code>clean_post_html()</code> when we render in chapter 3. We're not invoking it yet because the Markdown-to-HTML conversion is chapter 3's job — but we can already see the shape:</p>
+
+<php-snippet blueprint="toolkit-setup" name="importer-step-2.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\Filesystem\Filesystem;
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Zip\ZipFilesystem;
+use function WordPress\Filesystem\copy_between_filesystems;
+
+function open_input_zip( $path ) { // $path: location of the ZIP file, handed to FileReadStream::from_path().
+	return ZipFilesystem::create( FileReadStream::from_path( $path ) ); // wraps the file's read stream as a ZipFilesystem
+}
+
+function stage_input( Filesystem $input ) { // Accepts any Filesystem as the source, not only a ZipFilesystem.
+	$stage = InMemoryFilesystem::create(); // fresh in-memory target
+	copy_between_filesystems( array(
+		'source_filesystem' => $input,
+		'source_path'       => '/', // copy from the source root...
+		'target_filesystem' => $stage,
+		'target_path'       => '/', // ...to the root of the stage
+	) );
+	return $stage; // the populated InMemoryFilesystem
+}
+
+// Generator: lazily yields one array( 'name', 'markdown' ) record per entry listed under /posts.
+function each_post( Filesystem $stage ) {
+	$posts_dir = '/posts';
+	foreach ( $stage->ls( $posts_dir ) as $entry ) {
+		$markdown = $stage->get_contents( $posts_dir . '/' . $entry );
+		yield array( 'name' => $entry, 'markdown' => $markdown );
+	}
+}
+
+// Caller (omitted here; chapter 3 wires this in):
+//   $input  = open_input_zip( $argv[1] );
+//   $stage  = stage_input( $input );
+//   foreach ( each_post( $stage ) as $post ) {
+//       $blocks = markdown_to_blocks( $post['markdown'] );
+//       $html   = clean_post_html( render_blocks( $blocks ), $base_url );
+//       ...
+//   }
+</script>
+</php-snippet>
+
+<p>Three small functions, each with a single job. <code>open_input_zip()</code> is one line and exists mostly for readability. <code>stage_input()</code> is the composition we just built. <code>each_post()</code> is a generator so the caller can iterate without loading every post's text at once. The signatures take the abstract <code>Filesystem</code> type, not <code>InMemoryFilesystem</code>, which means a future version of the importer that stages on disk for a debugging session would not need any code change.</p>
+
+<h2 id="recap">Recap</h2>
+
+<p>You can now:</p>
+
+<ul>
+	<li>Wrap a ZIP archive as a <code>Filesystem</code> with <code>ZipFilesystem::create()</code> and read entries through the standard interface.</li>
+	<li>Stream a large entry with <code>open_read_stream()</code>, the <code>pull()</code> / <code>consume()</code> loop, and a trailing-partial-line carry.</li>
+	<li>Stage data in <code>InMemoryFilesystem</code> for in-process work, and swap to a different backend without changing the calling code.</li>
+	<li>Compose source and destination filesystems with <code>copy_between_filesystems()</code> in one helper call.</li>
+	<li>Defend against zip-slip with <code>ZipDecoder::sanitize_path()</code>.</li>
+</ul>
+
+<p>The stage is now ready to feed chapter 3, where the Markdown-to-blocks conversion actually happens.</p>
+
+<nav class="chapter-nav">
+	<a class="prev" href="01-rewriting-html.html">← Previous: Rewriting HTML</a>
+	<a class="next" href="03-importing-content.html">Next: Markdown to WXR →</a>
+</nav>
+
+<p class="next-preview">In chapter 3 we'll turn each Markdown post into WordPress block markup, run it through <code>clean_post_html()</code>, and stream the whole thing into a WXR file the WordPress importer plugin will accept. Three more components — Markdown, BlockParser, and DataLiberation — finally meet the importer.</p>
+
+</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/learn/03-importing-content.html b/docs/learn/03-importing-content.html
new file mode 100644
index 000000000..5a24f80ea
--- /dev/null
+++ b/docs/learn/03-importing-content.html
@@ -0,0 +1,452 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Chapter 3 — Markdown to WXR · PHP Toolkit</title>
+<meta name="description" content="Convert Markdown posts to WordPress block markup, audit the result with BlockParser, and stream a WXR export with DataLiberation. Chapter 3 of the importer tutorial.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="./">Learn</a>
+		<a href="../reference/">Reference</a>
+		<a class="github" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+
+<aside class="sidebar" aria-label="Tutorial navigation">
+	<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+	<nav class="toc" aria-label="Table of contents"></nav>
+	<details class="components-nav" open>
+		<summary>The path</summary>
+		<ol>
+			<li><a href="quickstart.html">Quickstart</a></li>
+			<li><a href="01-rewriting-html.html">1. Rewriting HTML</a></li>
+			<li><a href="02-streaming-archives.html">2. Streaming archives</a></li>
+			<li class="current"><a href="03-importing-content.html">3. Markdown to WXR</a></li>
+			<li><a href="04-talking-to-the-network.html">4. Talking to the network</a></li>
+			<li><a href="recap.html">Recap</a></li>
+		</ol>
+	</details>
+</aside>
+
+<article class="content">
+
+<p class="breadcrumb">Chapter 3 of 4</p>
+<h1>Markdown to blocks to WXR</h1>
+
+<p class="lede">Chapter 1 cleaned a single HTML string. Chapter 2 staged a folder of Markdown files in memory. This chapter turns each of those files into the actual format the WordPress importer plugin reads: WXR, an extended-RSS export. Along the way we meet three more components — Markdown, BlockParser, and DataLiberation — and watch them compose into something none of them could do alone.</p>
+
+<aside class="callout you-will-learn">
+	<strong>You will learn to:</strong>
+	<ul>
+		<li>Convert a Markdown document into WordPress block markup with <code>MarkdownConsumer</code>, including frontmatter as post metadata.</li>
+		<li>Inspect the produced blocks with <code>WP_Block_Parser</code> to count, audit, or rewrite them.</li>
+		<li>Stream a WXR export with <code>WXRWriter</code>, one entity at a time, with constant memory.</li>
+		<li>Combine those components into a single end-to-end pipeline: Markdown in, WXR out.</li>
+	</ul>
+</aside>
+
+<h2 id="markdown-to-blocks">Markdown to block markup</h2>
+
+<p>The <code>Markdown</code> component does one thing well: it bridges Markdown and <a href="https://developer.wordpress.org/block-editor/reference-guides/block-api/">WordPress block markup</a>, in either direction. The <code>MarkdownConsumer</code> class takes a Markdown string and returns a result object containing both the rendered block markup and any frontmatter parsed from the document's leading YAML.</p>
+
+<php-snippet blueprint="toolkit-setup" name="md-to-blocks.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+
+$markdown = <<<MD
+---
+title: Weeknight pasta
+status: publish
+tags: [dinner, quick]
+---
+
+# Weeknight pasta
+
+A 20-minute recipe for **busy nights**.
+
+## Ingredients
+
+- 200 g spaghetti
+- 2 cloves garlic
+- 50 g parmesan
+
+> Use a heavy pan; it makes a difference.
+MD;
+
+$consumer = new MarkdownConsumer( $markdown );
+$result   = $consumer->consume(); // frontmatter is read back from $consumer, block markup from $result
+
+echo "title:  " . $consumer->get_meta_value( 'title' ) . "\n";
+echo "status: " . $consumer->get_meta_value( 'status' ) . "\n\n";
+echo "block markup (first 400 chars):\n";
+echo substr( $result->get_block_markup(), 0, 400 ) . "...\n"; // substr() counts bytes; "..." is appended unconditionally
+</script>
+</php-snippet>
+
+<p>Two outputs come back: the post metadata (read with <code>get_meta_value()</code> for scalars, or <code>get_all_metadata()</code> for the raw structure) and the block markup itself, which is the <code>&lt;!-- wp:heading --&gt;…&lt;!-- /wp:heading --&gt;</code> string that WordPress stores in <code>post_content</code>. From here on we treat that string the way WordPress treats it.</p>
+
+<aside class="callout note">
+	<strong>Note — two ways to read frontmatter.</strong> <code>get_meta_value( 'title' )</code> returns the first occurrence of that key as a scalar; for everything else use <code>get_all_metadata()</code> and index into the resulting array. The toolkit wraps repeated keys so the same call works whether a key appears once or many times.
+</aside>
+
+<h2 id="audit-blocks">Audit the produced blocks</h2>
+
+<p>Before we ship the converted post into a WXR file, the importer should sanity-check what came out. Did Markdown conversion produce blocks the destination site can render? Are there headings out of order? Are there blocks the importer doesn't know how to handle? <code>WP_Block_Parser</code> walks the same block markup WordPress core uses and gives us a structured tree:</p>
+
+<php-snippet blueprint="toolkit-setup" name="audit-blocks.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+
+$markdown = "# Title\n\nIntro.\n\n## Section\n\nBody.\n\n#### Skipped a level\n\nDetails."; // H1, H2, then H4: the jump the linter below reports
+$blocks   = ( new MarkdownConsumer( $markdown ) )->consume()->get_block_markup();
+
+$tree = ( new WP_Block_Parser() )->parse( $blocks );
+
+// Count blocks by name, walking the whole tree breadth-first with a FIFO queue.
+$counts = array();
+$queue  = $tree;
+while ( $queue ) {
+	$block = array_shift( $queue );
+	if ( null !== $block['blockName'] ) { // entries without a block name are not counted
+		$name             = $block['blockName'];
+		$counts[ $name ] = isset( $counts[ $name ] ) ? $counts[ $name ] + 1 : 1;
+	}
+	foreach ( $block['innerBlocks'] as $inner ) {
+		$queue[] = $inner;
+	}
+}
+echo "block counts:\n";
+foreach ( $counts as $name => $n ) {
+	printf( "  %-20s %d\n", $name, $n );
+}
+
+// Lint heading levels: warn when a heading is more than one level deeper than the previous one. Only top-level blocks are inspected.
+$last = 1; // the first heading is compared against H1
+foreach ( $tree as $b ) {
+	if ( 'core/heading' !== $b['blockName'] ) continue;
+	$level = isset( $b['attrs']['level'] ) ? (int) $b['attrs']['level'] : 2; // a heading block with no level attribute is treated as H2
+	$text  = trim( strip_tags( $b['innerHTML'] ) );
+	if ( $level > $last + 1 ) {
+		echo "  WARN '{$text}': jumped from H{$last} to H{$level}\n";
+	}
+	$last = $level;
+}
+</script>
+</php-snippet>
+
+<p>Two patterns to keep. The flat counter (a queue that walks <code>innerBlocks</code>) answers any "how many" or "does it use" question. The level checker is a domain-specific rule — accessibility wants no jumps in heading depth — but every audit you'll write follows the same shape: walk the tree, gate by <code>blockName</code>, ask the question. The reference page for <a href="../reference/blockparser.html">BlockParser</a> covers both patterns in more depth.</p>
+
+<h2 id="clean-html-inside-blocks">Apply chapter 1's cleaner inside the blocks</h2>
+
+<p>Block markup is ordinary HTML delimited by HTML comments. Chapter 1's <code>clean_post_html()</code> takes an HTML string and returns a clean one — we can run it on the whole block-markup string in one pass, because <code>WP_HTML_Tag_Processor</code> is happy to walk the HTML between the block-comment delimiters. The block comments themselves don't look like tags to the processor, so they pass through untouched:</p>
+
+<php-snippet blueprint="toolkit-setup" name="clean-blocks.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+
+function clean_post_html( $html, $base_url ) { // Returns $html with scripts emptied, on* attributes removed, images lazy-loaded and relative links made absolute.
+	$tags = new WP_HTML_Tag_Processor( $html );
+	while ( $tags->next_tag() ) {
+		$tag = $tags->get_tag();
+		if ( 'SCRIPT' === $tag && ! $tags->is_tag_closer() ) {
+			$tags->set_modifiable_text( '' ); // blank the script body
+			foreach ( $tags->get_attribute_names_with_prefix( '' ) as $a ) { // empty prefix: every attribute on the tag
+				$tags->remove_attribute( $a );
+			}
+			continue; // the rules below do not apply to a stripped script tag
+		}
+		foreach ( $tags->get_attribute_names_with_prefix( 'on' ) as $a ) { // any attribute whose name starts with "on"
+			$tags->remove_attribute( $a );
+		}
+		if ( 'IMG' === $tag && ! $tags->is_tag_closer() ) {
+			if ( null === $tags->get_attribute( 'loading' ) ) { // keep an existing loading value
+				$tags->set_attribute( 'loading', 'lazy' );
+			}
+		}
+		if ( 'A' === $tag && ! $tags->is_tag_closer() ) {
+			$href = $tags->get_attribute( 'href' );
+			if ( is_string( $href ) && '' !== $href
+				&& ! preg_match( '#^[a-z][a-z0-9+.\-]*:#i', $href ) // no scheme such as https: or mailto:
+				&& 0 !== strpos( $href, '//' ) // not protocol-relative
+				&& 0 !== strpos( $href, '#' ) ) { // not a same-page fragment
+				$tags->set_attribute( 'href', rtrim( $base_url, '/' ) . '/' . ltrim( $href, '/' ) ); // join base and path with exactly one slash
+			}
+		}
+	}
+	return $tags->get_updated_html();
+}
+
+$markdown = <<<MD
+# Hello
+
+See [our docs](/docs) — and an inline image:
+
+![](photo.jpg)
+MD;
+
+$blocks = ( new MarkdownConsumer( $markdown ) )->consume()->get_block_markup(); // Markdown converted to block markup
+$cleaned = clean_post_html( $blocks, 'https://example.com' ); // relative hrefs are rebuilt on this base URL
+
+echo $cleaned;
+</script>
+</php-snippet>
+
+<p>Notice how <code>&lt;!-- wp:heading --&gt;</code> survived the walk verbatim. The Tag Processor only sees real HTML tags; comments and text aren't tags to it. That's why combining the two components here works without any special-casing — Markdown produces block markup, the cleaner walks the HTML inside it, and the comments pass through as plain bytes.</p>
+
+<h2 id="wxr">Stream a WXR file with DataLiberation</h2>
+
+<p>We have post titles, post content (clean block markup), post metadata. The format the WordPress importer reads is WXR — WordPress eXtended RSS — an XML dialect with a fixed shape. <code>DataLiberation</code>'s <code>WXRWriter</code> takes <code>ImportEntity</code> objects and streams them into a byte sink, one entity at a time, without ever holding the whole export in memory:</p>
+
+<php-snippet blueprint="toolkit-setup" name="wxr-stream.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\DataLiberation\EntityWriter\WXRWriter;
+use WordPress\DataLiberation\ImportEntity;
+
+$pipe   = new MemoryPipe(); // in-memory sink that receives the WXR bytes
+$writer = new WXRWriter( $pipe );
+
+$writer->append_entity( new ImportEntity( 'post', array(
+	'post_id'    => '1',
+	'post_title' => 'Weeknight pasta',
+	'content'    => '<!-- wp:paragraph --><p>Quick recipe.</p><!-- /wp:paragraph -->',
+	'status'     => 'publish',
+	'post_type'  => 'post',
+	'post_name'  => 'weeknight-pasta',
+) ) );
+$writer->append_entity( new ImportEntity( 'post', array(
+	'post_id'    => '2',
+	'post_title' => 'Carrot soup',
+	'content'    => '<!-- wp:paragraph --><p>Cold-day standby.</p><!-- /wp:paragraph -->',
+	'status'     => 'publish',
+	'post_type'  => 'post',
+	'post_name'  => 'carrot-soup',
+) ) );
+
+$writer->finalize(); // NOTE(review): presumably emits the closing XML — confirm against WXRWriter
+$writer->close_writing();
+$pipe->close_writing();
+
+$wxr = $pipe->consume_all(); // the whole document as one string, acceptable for a two-post example
+echo "WXR size: " . strlen( $wxr ) . " bytes\n";
+echo "items in WXR: " . substr_count( $wxr, '<item>' ) . "\n"; // counts literal item opening tags in the output
+echo "first 600 chars:\n" . substr( $wxr, 0, 600 ) . "...\n"; // byte-based cut; "..." is appended unconditionally
+</script>
+</php-snippet>
+
+<p>The writer holds only what it needs to close currently-open XML tags — fewer than ten kilobytes of state for any reasonable pipeline. Every <code>append_entity()</code> writes one item to the underlying byte sink and forgets it. You can build a WXR from twenty thousand posts on a host with sixty-four megabytes of RAM and the importer code looks no different from the two-post version above.</p>
+
+<aside class="callout note">
+	<strong>Note.</strong> The byte sink here is <code>MemoryPipe</code> for the example. In the real importer you'd pass <code>FileWriteStream::from_path( 'export.xml', 'truncate' )</code> and the WXR would stream straight to disk without ever existing as a single in-memory string.
+</aside>
+
+<h2 id="end-to-end">End-to-end: Markdown folder to WXR file</h2>
+
+<p>Now we wire it all together. The pipeline reads the staged Markdown files from chapter 2, converts each to block markup, cleans the HTML inside it, builds an <code>ImportEntity</code> with the title from frontmatter and the slug from the filename, and streams the whole thing into a WXR document. This is the importer's first complete end-to-end run:</p>
+
+<php-snippet blueprint="toolkit-setup" name="importer-step-3.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\DataLiberation\EntityWriter\WXRWriter;
+use WordPress\DataLiberation\ImportEntity;
+use WordPress\Markdown\MarkdownConsumer;
+
+// The combined cleaner from chapter 1, unchanged.
+function clean_post_html( $html, $base_url ) { // Single pass over $html; $base_url is the prefix applied to relative link targets.
+	$tags = new WP_HTML_Tag_Processor( $html );
+	while ( $tags->next_tag() ) {
+		$tag = $tags->get_tag();
+
+		if ( 'SCRIPT' === $tag && ! $tags->is_tag_closer() ) { // rule 1: empty scripts and strip all their attributes
+			$tags->set_modifiable_text( '' );
+			foreach ( $tags->get_attribute_names_with_prefix( '' ) as $a ) { // '' matches every attribute name
+				$tags->remove_attribute( $a );
+			}
+			continue;
+		}
+
+		foreach ( $tags->get_attribute_names_with_prefix( 'on' ) as $a ) { // rule 2: drop attributes whose name starts with "on"
+			$tags->remove_attribute( $a );
+		}
+
+		if ( 'IMG' === $tag && ! $tags->is_tag_closer() ) { // rule 3: default images to lazy loading
+			if ( null === $tags->get_attribute( 'loading' ) ) {
+				$tags->set_attribute( 'loading', 'lazy' );
+			}
+		}
+
+		if ( 'A' === $tag && ! $tags->is_tag_closer() ) { // rule 4: make relative hrefs absolute
+			$href = $tags->get_attribute( 'href' );
+			if ( is_string( $href ) && '' !== $href
+				&& ! preg_match( '#^[a-z][a-z0-9+.\-]*:#i', $href ) // skip hrefs that already carry a scheme
+				&& 0 !== strpos( $href, '//' ) // skip protocol-relative hrefs
+				&& 0 !== strpos( $href, '#' ) ) { // skip fragment-only hrefs
+				$tags->set_attribute( 'href', rtrim( $base_url, '/' ) . '/' . ltrim( $href, '/' ) );
+			}
+		}
+	}
+	return $tags->get_updated_html();
+}
+
+// Three sample Markdown posts. In the real importer these come from chapter 2's stage.
+$inputs = array(
+	'pasta.md' => "---\ntitle: Weeknight pasta\ntags: [dinner]\n---\n\n# Pasta\n\nA 20-minute recipe. See [our sauce primer](/sauces).",
+	'soup.md'  => "---\ntitle: Carrot soup\n---\n\n# Soup\n\nA cold-day standby with [a step-by-step video](video.html).",
+	'bread.md' => "---\ntitle: No-knead bread\n---\n\n# Bread\n\nA loaf in your sleep. ![](https://cdn.example.com/bread.jpg)",
+);
+
+$pipe   = new MemoryPipe();
+$writer = new WXRWriter( $pipe );
+$base   = 'https://recipes.example.com';
+
+$id = 1;
+foreach ( $inputs as $filename => $markdown ) {
+	$consumer = new MarkdownConsumer( $markdown );
+	$result   = $consumer->consume();
+	$cleaned  = clean_post_html( $result->get_block_markup(), $base );
+
+	$writer->append_entity( new ImportEntity( 'post', array(
+		'post_id'    => (string) $id++, // sequential IDs starting at 1, passed as strings
+		'post_title' => $consumer->get_meta_value( 'title' ) ?: basename( $filename, '.md' ), // filename stem when the title is falsy
+		'content'    => $cleaned,
+		'status'     => 'publish',
+		'post_type'  => 'post',
+		'post_name'  => basename( $filename, '.md' ), // the slug is the filename without ".md"
+	) ) );
+}
+
+$writer->finalize();
+$writer->close_writing();
+$pipe->close_writing();
+
+$wxr = $pipe->consume_all();
+echo "wrote WXR (" . count( $inputs ) . " posts, " . strlen( $wxr ) . " bytes)\n\n";
+
+// A snippet of the output so you can see what the importer plugin will read:
+$start = strpos( $wxr, '<item>' ); // false when no item tag is present; substr() then starts at offset 0
+echo substr( $wxr, $start, 800 ) . "...\n";
+</script>
+</php-snippet>
+
+<p>One pass. Three components composed (Markdown for parsing, HTML for cleaning, DataLiberation for WXR), each doing one thing well. The output is real WXR — drop it on a WordPress site through the importer plugin and you get three published posts with the cleaned content, the right slugs, and the frontmatter titles.</p>
+
+<aside class="callout try">
+	<strong>Try this:</strong> add a fourth Markdown post with an <code>onclick</code> handler in raw inline HTML. Run. The handler is gone in the WXR output — the cleaner is doing its job inside block markup the same way it did on a bare HTML string in chapter 1.
+</aside>
+
+<h2 id="rewriting-on-stream">Refinement: rewrite URLs across an existing WXR</h2>
+
+<p>The pattern above (build WXR from sources) is one half of DataLiberation. The other half is reading and transforming an existing WXR. <code>WXREntityReader</code> emits one entity at a time from a WXR document, and you can wire it to a <code>WXRWriter</code> to produce a transformed copy:</p>
+
+<php-snippet blueprint="toolkit-setup" name="wxr-rewrite.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\DataLiberation\EntityReader\WXREntityReader;
+use WordPress\DataLiberation\EntityWriter\WXRWriter;
+use WordPress\DataLiberation\ImportEntity;
+
+// A small staging-export WXR. In production this is your real export.
+$source = <<<XML
+<?xml version="1.0" encoding="UTF-8" ?>
+<rss version="2.0" xmlns:wp="http://wordpress.org/export/1.2/" xmlns:content="http://purl.org/rss/1.0/modules/content/">
+<channel>
+<item><title>About</title><wp:post_id>1</wp:post_id><wp:post_type>post</wp:post_type>
+<content:encoded>Visit https://staging.example.com/contact for details.</content:encoded></item>
+</channel>
+</rss>
+XML;
+// Input side: hand the reader the whole document at once, then tell it no more bytes are coming.
+$reader = WXREntityReader::create();
+$reader->append_bytes( $source );
+$reader->input_finished();
+// Output side: the writer streams into an in-memory pipe.
+$pipe   = new MemoryPipe();
+$writer = new WXRWriter( $pipe );
+// Copy every entity across, replacing the staging host in whichever of the text fields it carries.
+while ( $reader->next_entity() ) {
+	$entity = $reader->get_entity();
+	$data   = $entity->get_data();
+	foreach ( array( 'post_content', 'content', 'description' ) as $f ) {
+		if ( isset( $data[ $f ] ) ) {
+			$data[ $f ] = str_replace( 'staging.example.com', 'example.com', $data[ $f ] );
+		}
+	}
+	if ( 'post' === $entity->get_type() && isset( $data['post_content'] ) ) {
+		$data['content'] = $data['post_content']; // Pass the post body to the writer under 'content'.
+	}
+	$writer->append_entity( new ImportEntity( $entity->get_type(), $data ) );
+}
+// Finish the document and close both ends before reading the result back.
+$writer->finalize();
+$writer->close_writing();
+$pipe->close_writing();
+// Check the result: the production URL should be present and the staging host gone.
+$out = $pipe->consume_all();
+echo strpos( $out, 'https://example.com/contact' ) !== false ? "rewrite ok\n" : "rewrite missing\n";
+echo strpos( $out, 'staging.example.com' ) === false ? "old URL gone\n" : "old URL still present\n";
+</script>
+</php-snippet>
+
+<p>The same pattern handles every "transform an export between sites" job — staging-to-production URL rewrites, theme migrations, slug normalization. Reader on the left, writer on the right, your transformation in the middle. Feed the reader bytes incrementally (instead of <code>append_bytes( $source )</code> all at once) and pipe the writer to a file sink (instead of <code>MemoryPipe</code>), and the same code processes a 10 GB export with the memory footprint of one entity at a time.</p>
+
+<aside class="callout note">
+	<strong>Note — asymmetric field names.</strong> <code>WXREntityReader</code> emits the post body under <code>post_content</code> (matching WordPress's database column); <code>WXRWriter</code> reads it under <code>content</code> (matching its own internal mapping). Pipelines that read on one side and write on the other have to copy the value across, as the example does.
+</aside>
+
+<h2 id="recap">Recap</h2>
+
+<p>You can now:</p>
+
+<ul>
+	<li>Convert Markdown plus YAML frontmatter into block markup with <code>MarkdownConsumer</code>.</li>
+	<li>Walk the produced block tree with <code>WP_Block_Parser</code> to count, audit, or rewrite blocks.</li>
+	<li>Apply HTML rewrites to block markup without breaking the surrounding block comments.</li>
+	<li>Stream a WXR document with <code>WXRWriter</code> in constant memory regardless of input size.</li>
+	<li>Read an existing WXR with <code>WXREntityReader</code> and pipe its entities through a transformation into a new WXR.</li>
+</ul>
+
+<p>The importer is now functionally complete for text content. What's missing is the network — when a Markdown post references <code>![](https://cdn.example.com/bread.jpg)</code>, the destination site doesn't have that image. Chapter 4 fixes that.</p>
+
+<nav class="chapter-nav">
+	<a class="prev" href="02-streaming-archives.html">← Previous: Streaming archives</a>
+	<a class="next" href="04-talking-to-the-network.html">Next: Talking to the network →</a>
+</nav>
+
+<p class="next-preview">In chapter 4 the importer learns to fetch the images referenced from imported posts: ten downloads at a time, with progress reporting, ranged-resume on partial failures, and the option to mount a remote ZIP without downloading it first. The HttpClient component meets the importer.</p>
+
+</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/learn/04-talking-to-the-network.html b/docs/learn/04-talking-to-the-network.html
new file mode 100644
index 000000000..fd27a05cf
--- /dev/null
+++ b/docs/learn/04-talking-to-the-network.html
@@ -0,0 +1,372 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Chapter 4 — Talking to the network · PHP Toolkit</title>
+<meta name="description" content="Frontload images, run a sliding window of concurrent downloads, and stream-unzip a remote archive — all without requiring the curl extension. Chapter 4 of the importer tutorial.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="./">Learn</a>
+		<a href="../reference/">Reference</a>
+		<a class="github" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+
+<aside class="sidebar" aria-label="Tutorial navigation">
+	<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+	<nav class="toc" aria-label="Table of contents"></nav>
+	<details class="components-nav" open>
+		<summary>The path</summary>
+		<ol>
+			<li><a href="quickstart.html">Quickstart</a></li>
+			<li><a href="01-rewriting-html.html">1. Rewriting HTML</a></li>
+			<li><a href="02-streaming-archives.html">2. Streaming archives</a></li>
+			<li><a href="03-importing-content.html">3. Markdown to WXR</a></li>
+			<li class="current"><a href="04-talking-to-the-network.html">4. Talking to the network</a></li>
+			<li><a href="recap.html">Recap</a></li>
+		</ol>
+	</details>
+</aside>
+
+<article class="content">
+
+<p class="breadcrumb">Chapter 4 of 4</p>
+<h1>Talking to the network</h1>
+
+<p class="lede">By the end of chapter 3 the importer produces a valid WXR from a folder of Markdown. There's one loose thread: when a post references <code>![](https://cdn.example.com/bread.jpg)</code>, the destination site has no <code>bread.jpg</code> in its media library. The WordPress importer plugin will try to fetch each remote image as it runs, but that's a fragile thing to do during an import — slow, easy to rate-limit, easy to leave behind half-fetched media. The robust answer is to fetch the images <em>before</em> the import and stage them locally so the import can reference local paths. This chapter covers the fetch side of that work using HttpClient. We'll also see how the same client mounts a remote ZIP for streaming, which means in some workflows you don't need chapter 2's local archive at all.</p>
+
+<aside class="callout you-will-learn">
+	<strong>You will learn to:</strong>
+	<ul>
+		<li>Fetch a single URL and read the response as a byte stream.</li>
+		<li>Drive the event loop manually for progress reporting and concurrent downloads.</li>
+		<li>Maintain a sliding window of N concurrent requests, refilling as each completes.</li>
+		<li>Resume a partial download with the <code>Range</code> header.</li>
+		<li>Mount a remote ZIP through HttpClient and stream its entries with the same code from chapter 2.</li>
+	</ul>
+</aside>
+
+<h2 id="why-not-curl">Why a new HTTP client</h2>
+
+<p>The instinct is <code>file_get_contents( $url )</code> or <code>curl_exec()</code>. Both work — until they don't. <code>file_get_contents</code> on a URL needs <code>allow_url_fopen</code>, which security-conscious hosts disable. <code>curl_exec</code> needs the curl extension, which WebAssembly builds of PHP don't ship. And the simplest forms of both — no <code>CURLOPT_FILE</code>, no chunked stream wrapper — buffer the whole response into one PHP string, which is fatal for a 50 MB media file on a host with a 64 MB memory limit.</p>
+
+<p>HttpClient gives you the same shape regardless of host capabilities: an event loop, response objects with status codes and headers, response bodies as <code>ByteReadStream</code>s you can pipe somewhere instead of buffering. Under the hood it picks curl when available and PHP stream sockets otherwise. From your code's perspective those two transports are identical.</p>
+
+<h2 id="fetch-one">Fetch one URL</h2>
+
+<p>The smallest possible request: create a <code>Request</code>, hand it to <code>Client::fetch()</code>, wait for the response, read the body. The result of <code>fetch()</code> is a stream — the response headers arrive at <code>await_response()</code>, and the body bytes come through <code>consume_all()</code> or chunk-by-chunk via <code>pull()</code>/<code>consume()</code>:</p>
+
+<php-snippet blueprint="toolkit-setup" name="fetch-one.php" runnable="false">
+<script type="application/x-php">
+<?php
+// Snippets that talk to the open internet are static here because the in-page
+// runtime can't always reach external hosts. Run locally.
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$client   = new Client();
+$stream   = $client->fetch( new Request( 'https://example.com/' ) );
+$response = $stream->await_response(); // Returns once the response headers have arrived.
+$body     = $stream->consume_all();    // Then read the body to completion.
+echo "status: " . $response->status_code . "\n";
+echo "type:   " . $response->get_header( 'content-type' ) . "\n";
+echo "body:   " . strlen( $body ) . " bytes\n";
+</script>
+</php-snippet>
+
+<p>Read the lifecycle. <code>fetch()</code> returns immediately with a stream object — the request is queued, not yet executed. <code>await_response()</code> blocks until the response headers have arrived, then returns the <code>Response</code> object. <code>consume_all()</code> reads the body to completion. Splitting "headers" from "body" matters because for some workflows (progress reporting, redirect logging, content-type sniffing) you act on the headers before deciding what to do with the body.</p>
+
+<h2 id="frontload-one">Download an image to the stage</h2>
+
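+<p>The importer's job in this chapter is to take an image URL, fetch it, and place the bytes into the staging filesystem under a deterministic local path. To keep this first version short it buffers the whole body with <code>consume_all()</code> and writes it in one call; the next section shows how to write the bytes incrementally so a large response never has to fit into memory:</p>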
+
+<php-snippet blueprint="toolkit-setup" name="frontload-one.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\Filesystem;
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+// Fetches $url and stores the body at $local_path inside $stage; returns true when stored, false on a non-OK response.
+function frontload_attachment( Filesystem $stage, Client $client, $url, $local_path ) {
+	$stream   = $client->fetch( new Request( $url ) );
+	$response = $stream->await_response();
+	if ( $response->ok() ) {
+		// The body is buffered into a single string for simplicity; for very large files you'd write chunks via the event loop (next section).
+		$stage->put_contents( $local_path, $stream->consume_all() );
+		return true;
+	}
+	fwrite( STDERR, "skip {$url}: HTTP {$response->status_code}\n" );
+	return false;
+}
+
+$client = new Client();
+$stage  = InMemoryFilesystem::create();
+$stage->mkdir( '/uploads', array( 'recursive' => true ) );
+frontload_attachment( $stage, $client, 'https://example.com/hero.jpg', '/uploads/hero.jpg' );
+$staged = $stage->ls( '/uploads' ); // Names now present under /uploads.
+echo "staged: " . implode( ', ', $staged ) . "\n";
+</script>
+</php-snippet>
+
+<p>Notice the function signature. It takes a <code>Filesystem</code>, not a directory path; it takes a <code>Client</code> rather than constructing one internally. That keeps it testable — you can pass an <code>InMemoryFilesystem</code> and a mock client and the function doesn't know the difference. It also keeps the HTTP and storage decisions out of the function and in the caller's hands, so when you later swap the in-memory stage for <code>LocalFilesystem</code>, the function is unchanged.</p>
+
+<h2 id="event-loop">The event loop, with progress</h2>
+
+<p>For files small enough that you don't care about memory, <code>consume_all()</code> is fine. For big ones, you want to know how the download is going and write bytes as they arrive. Drop down a layer: <code>Client::enqueue()</code> + <code>await_next_event()</code> exposes every stage of the request as an event you can react to:</p>
+
+<php-snippet blueprint="toolkit-setup" name="progress.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$client = new Client();
+$client->enqueue( array( new Request( 'https://example.com/big-file.zip' ) ) );
+
+$dest       = sys_get_temp_dir() . '/big-file.zip';
+@unlink( $dest ); // Chunks are appended below, so clear any file left by an earlier run.
+$downloaded = 0;
+$last_step  = -1; // Highest progress figure printed so far; -1 means nothing yet.
+
+while ( $client->await_next_event() ) {
+	$event   = $client->get_event();
+	$request = $client->get_request();
+
+	if ( Client::EVENT_GOT_HEADERS === $event ) {
+		$total = $request->response->total_bytes;
+		echo "starting download (" . ( $total ?: 'unknown' ) . " bytes)\n";
+		continue;
+	}
+
+	if ( Client::EVENT_BODY_CHUNK_AVAILABLE === $event ) {
+		$chunk       = $client->get_response_body_chunk();
+		$downloaded += strlen( $chunk );
+		file_put_contents( $dest, $chunk, FILE_APPEND );
+		// Round progress down to a multiple of 10: at most one line per 10% bucket, and 100% when the last byte lands.
+		$total = $request->response->total_bytes;
+		if ( $total ) {
+			$step = min( 100, 10 * (int) floor( 10 * $downloaded / $total ) );
+			if ( $step > $last_step ) {
+				echo "  {$step}% ({$downloaded}/{$total})\n";
+				$last_step = $step;
+			}
+		}
+		continue;
+	}
+
+	if ( Client::EVENT_FINISHED === $event ) {
+		echo "done: {$dest}\n";
+	} elseif ( Client::EVENT_FAILED === $event ) {
+		echo "failed: " . $request->error->message . "\n";
+	}
+}
+</script>
+</php-snippet>
+
+<p>Read the event flow. <code>EVENT_GOT_HEADERS</code> fires once when headers come in — useful for sniffing <code>Content-Length</code> or rejecting based on status. <code>EVENT_BODY_CHUNK_AVAILABLE</code> fires repeatedly as the body comes in — that's where you write to disk, update progress, or compute a hash. <code>EVENT_FINISHED</code> or <code>EVENT_FAILED</code> ends the request. Memory use stays at one chunk at a time, so the importer can stream a 500 MB file under any memory limit large enough to hold a single chunk.</p>
+
+<h2 id="sliding-window">A sliding window of ten concurrent downloads</h2>
+
+<p>The importer might reference dozens of images. Doing them one at a time would be unnecessarily slow; firing all of them at once would hammer the upstream and risk being rate-limited. The polite move is a fixed-size window: keep ten requests in flight, and as each one finishes, enqueue the next:</p>
+
+<php-snippet blueprint="toolkit-setup" name="sliding-window.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$urls = array();
+for ( $i = 1; $i <= 25; $i++ ) {
+	$urls[] = 'https://example.com/image-' . $i . '.jpg';
+}
+
+$window  = 10; // Window size: the most requests kept in flight at once.
+$client  = new Client( array( 'concurrency' => $window ) );
+$pending = $urls;
+$active  = array();
+$done    = 0;
+
+$enqueue_next = function () use ( &$pending, &$active, $client ) {
+	if ( ! $pending ) return;
+	$request = new Request( array_shift( $pending ) );
+	$active[ $request->id ] = $request;
+	$client->enqueue( array( $request ) );
+};
+// Fill the window once; the loop below tops it up each time a request ends.
+for ( $i = 0; $i < $window; $i++ ) $enqueue_next();
+
+while ( $active && $client->await_next_event() ) {
+	$request = $client->get_request();
+	$event   = $client->get_event();
+	if ( Client::EVENT_FINISHED === $event || Client::EVENT_FAILED === $event ) {
+		unset( $active[ $request->id ] );
+		$done++;
+		echo "finished {$done}/" . count( $urls ) . " (active=" . count( $active ) . ")\n";
+		$enqueue_next();
+	}
+}
+</script>
+</php-snippet>
+
+<p>The sliding window is a small piece of bookkeeping — a pending queue, an active set, an "enqueue next" callback — wrapped around the same event loop you saw above. Real importers do exactly this for media frontloading. The <code>concurrency</code> option in the <code>Client</code> constructor is the upper bound; the bookkeeping enforces a moving window so you don't enqueue more work than the window holds.</p>
+
+<aside class="callout pitfall">
+	<strong>Pitfall — concurrency is not parallelism.</strong> HttpClient runs in a single PHP process; "concurrent" here means multiple requests in flight, not multiple PHP threads executing user code. Headers and body chunks for ten different requests interleave through one event loop. CPU-bound work in your handler still serializes — if you're doing image processing on each chunk, ten-way concurrency won't speed up the CPU work.
+</aside>
+
+<h2 id="resume">Resume a partial download</h2>
+
+<p>Long downloads fail. Sometimes the network drops, sometimes the host runs out of execution time. The importer should be able to resume rather than redownload. HTTP's contract for that is <code>Range: bytes=N-</code>. Sending it to a cooperating server returns a <code>206 Partial Content</code> response with the missing bytes:</p>
+
+<php-snippet blueprint="toolkit-setup" name="resume.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+// Downloads $url to $dest, resuming after the bytes already on disk. Returns the final file size, or false on failure.
+function resumable_download( Client $client, $url, $dest ) {
+	$existing = file_exists( $dest ) ? filesize( $dest ) : 0;
+	$headers  = $existing > 0 ? array( 'range' => "bytes={$existing}-" ) : array();
+	$stream   = $client->fetch( new Request( $url, array( 'headers' => $headers ) ) );
+	$response = $stream->await_response();
+	if ( $existing > 0 && 206 !== $response->status_code ) {
+		// Server didn't honor the Range request; restart from byte 0. Give up if the
+		// stale file can't be removed, otherwise the retry would recurse forever.
+		return @unlink( $dest ) ? resumable_download( $client, $url, $dest ) : false;
+	}
+	if ( 206 !== $response->status_code && ! $response->ok() ) return false; // Don't save an error page as the file.
+	$flag = $existing > 0 ? FILE_APPEND : 0;
+	while ( ! $stream->reached_end_of_data() ) {
+		$n = $stream->pull( 8192 );
+		if ( 0 === $n ) break;
+		file_put_contents( $dest, $stream->consume( $n ), $flag );
+		$flag = FILE_APPEND;
+	}
+	clearstatcache( true, $dest ); // filesize() results are cached; forget the size measured before appending.
+	return filesize( $dest );
+}
+
+$client = new Client();
+$bytes  = resumable_download( $client, 'https://example.com/big.zip', '/tmp/big.zip' );
+echo false === $bytes ? "download failed\n" : "saved {$bytes} bytes\n";
+</script>
+</php-snippet>
+
+<p>The defensive check matters: not every server respects <code>Range</code>, especially when sitting behind a CDN with caching that doesn't know how to pass the header upstream. If you ask for a partial response and the server hands you a fresh 200 instead, your existing bytes don't match what's coming and you have to start over. That's the recursion in <code>resumable_download()</code> — it's a one-line fallback rather than a separate retry path.</p>
+
+<h2 id="mount-remote-zip">Stream a remote ZIP through ZipFilesystem</h2>
+
+<p>The importer's input is a ZIP — chapter 2 read it from disk. But what if the ZIP lives on a URL? Downloading it whole, opening it with <code>ZipFilesystem</code>, then deleting the file afterwards works, but it asks you to coordinate a temp path the toolkit could manage for you. <code>SeekableRequestReadStream</code> wraps a <code>Request</code> as a seekable byte stream that <code>ZipFilesystem</code> can read directly: bytes are downloaded sequentially as the consumer reads, the class caches them in an internal temp file (cleaned up when you call <code>close_reading()</code>), and seeks back into already-downloaded ranges hit the cache instead of re-fetching:</p>
+
+<php-snippet blueprint="toolkit-setup" name="remote-zip.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\ByteStream\SeekableRequestReadStream;
+use WordPress\HttpClient\Request;
+use WordPress\Zip\ZipFilesystem;
+use function WordPress\Filesystem\copy_between_filesystems;
+
+$client = new Client();
+$reader = new SeekableRequestReadStream(
+	new Request( 'https://example.com/posts.zip' ),
+	array( 'client' => $client )
+);
+
+$response = $reader->await_response();
+if ( ! $response->ok() ) {
+	echo "HTTP " . $response->status_code . "\n";
+	$reader->close_reading(); // Release the reader on the failure path as well.
+	exit( 1 );                // Non-zero status so a calling script can detect the failure.
+}
+
+// $reader behaves like a seekable byte stream over the remote URL.
+$zip   = ZipFilesystem::create( $reader );
+$stage = InMemoryFilesystem::create();
+
+copy_between_filesystems( array(
+	'source_filesystem' => $zip,
+	'source_path'       => '/',
+	'target_filesystem' => $stage,
+	'target_path'       => '/',
+) );
+echo "imported " . count( $stage->ls( '/' ) ) . " top-level entries\n";
+
+// Clean up the temp-file cache the seekable reader created.
+$reader->close_reading();
+</script>
+</php-snippet>
+
+<p>That's the entire chapter-2 setup with a remote URL substituted for the local file. <code>SeekableRequestReadStream</code> downloads the response body once, lazily, into a temporary file as ZipFilesystem asks for bytes — so reads work the way they would on a local file (including the seeks that ZipFilesystem performs to find the central directory at the end of the archive). The temp file caches what's been seen, so seeking backwards doesn't re-fetch.</p>
+
+<aside class="callout note">
+	<strong>Note — when this is the right tool.</strong> <code>SeekableRequestReadStream</code> is the right wrapper when the consumer needs random-access reads on the response (a ZIP central directory, an offset table, a large binary index). For workflows that read the body straight through, <code>$client-&gt;fetch($req)-&gt;consume_all()</code> or the event-loop pattern from earlier in this chapter is simpler.
+</aside>
+
+<h2 id="end-to-end">End-to-end: the importer, finally complete</h2>
+
+<p>The importer now spans four chapters' worth of components. The full shape:</p>
+
+<ol>
+	<li>Open the input ZIP — locally with <code>ZipFilesystem</code>, or remotely with <code>SeekableRequestReadStream</code>.</li>
+	<li>Stage its contents in an <code>InMemoryFilesystem</code> with <code>copy_between_filesystems()</code>.</li>
+	<li>For each Markdown file in the stage, run <code>MarkdownConsumer</code>, then <code>clean_post_html()</code> on the produced block markup.</li>
+	<li>For each image URL referenced from the cleaned content, fetch it with HttpClient through a sliding-window concurrency loop and stage the bytes alongside the WXR.</li>
+	<li>Stream the whole thing into a WXR document with <code>WXRWriter</code>, with the cleaned post markup as <code>content</code> and rewritten image references pointing at the local paths under the staged uploads tree.</li>
+</ol>
+
+<p>The full importer is roughly a hundred lines of PHP. It depends on no extension beyond <code>json</code> and <code>mbstring</code>. It runs in browser-side WebAssembly, on PHP 7.2 through 8.3, and on every shared host that's kept up with PHP releases. That's the toolkit's whole pitch — pure-PHP libraries that handle the work the platform usually outsources to extensions.</p>
+
+<h2 id="recap">Recap</h2>
+
+<p>You can now:</p>
+
+<ul>
+	<li>Fetch a URL with <code>Client::fetch()</code> and read the body either whole (<code>consume_all()</code>) or in chunks (<code>pull()</code>/<code>consume()</code>).</li>
+	<li>Drive the event loop with <code>enqueue()</code> + <code>await_next_event()</code> for progress reporting and per-chunk processing.</li>
+	<li>Maintain a sliding window of N concurrent requests by tracking active and pending sets.</li>
+	<li>Resume a partial download with the <code>Range</code> header, and fall back to a full download when the server doesn't honor it.</li>
+	<li>Mount a remote ZIP through <code>SeekableRequestReadStream</code> so <code>ZipFilesystem</code> can seek over the response — bytes are downloaded lazily into a temp-file cache as they're read.</li>
+</ul>
+
+<nav class="chapter-nav">
+	<a class="prev" href="03-importing-content.html">← Previous: Markdown to WXR</a>
+	<a class="next" href="recap.html">Next: Recap →</a>
+</nav>
+
+<p class="next-preview">The recap page summarizes what the four chapters built, what's still in the toolkit beyond what we used, and where to look in the reference for the components we didn't visit (Git for snapshots, Merge for sync, HttpServer for OAuth callbacks, Blueprints for site setup).</p>
+
+</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/learn/index.html b/docs/learn/index.html
new file mode 100644
index 000000000..c5f07f4fa
--- /dev/null
+++ b/docs/learn/index.html
@@ -0,0 +1,101 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Learn — PHP Toolkit</title>
+<meta name="description" content="A four-chapter tutorial that builds a real WordPress content importer using HTML, ZIP, Markdown, DataLiberation, and HttpClient. Most code blocks run in the browser.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="./">Learn</a>
+		<a href="../reference/">Reference</a>
+		<a class="github" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<main class="learn-landing">
+
+<h1>Learn the toolkit by building a content importer</h1>
+
+<p class="lede">Across four chapters and roughly forty-five minutes, you'll build a small WordPress content importer in pure PHP. It reads a folder of Markdown posts, rewrites the HTML inside them, packages everything as a ZIP-backed staging filesystem, and finally emits a WXR file ready to feed to WordPress's importer. Almost every snippet runs in your browser; the chapter 4 examples that need the open internet are meant to be run locally. You finish with code you can keep.</p>
+
+<section class="prereqs">
+	<h2>Before you start</h2>
+	<p>You should be comfortable reading and writing PHP. You don't need to know WordPress internals — we'll explain the WordPress-specific bits as they come up. You don't need anything installed locally; the runnable snippets execute via WordPress Playground in the page.</p>
+	<p>If you want to run the same code on your own machine afterwards, every example works under PHP 7.2 or newer with <code>composer require wp-php-toolkit/&lt;component&gt;</code>.</p>
+</section>
+
+<section class="path">
+	<h2>The path</h2>
+
+	<ol class="chapters">
+		<li>
+			<a href="quickstart.html">
+				<strong>Quickstart</strong>
+				<span>Five minutes from zero to a runnable HTML rewrite. The shape of every later chapter, in miniature.</span>
+			</a>
+		</li>
+		<li>
+			<a href="01-rewriting-html.html">
+				<strong>Chapter 1 — Rewriting HTML safely</strong>
+				<span>Add <code>loading="lazy"</code> to images, rewrite relative links, strip script tags. Meet the cursor model that underlies every later chapter.</span>
+			</a>
+		</li>
+		<li>
+			<a href="02-streaming-archives.html">
+				<strong>Chapter 2 — Streaming archives</strong>
+				<span>Read your importer's input from a ZIP without buffering it in memory. Compose a ZIP-backed filesystem with a memory-backed staging filesystem.</span>
+			</a>
+		</li>
+		<li>
+			<a href="03-importing-content.html">
+				<strong>Chapter 3 — Markdown to blocks to WXR</strong>
+				<span>Turn each Markdown file into block markup, then assemble those blocks into a WordPress eXtended RSS export.</span>
+			</a>
+		</li>
+		<li>
+			<a href="04-talking-to-the-network.html">
+				<strong>Chapter 4 — Talking to the network</strong>
+				<span>Frontload the images referenced from the imported posts using HttpClient with progress reporting, a sliding window of concurrent requests, and resumable downloads.</span>
+			</a>
+		</li>
+		<li>
+			<a href="recap.html">
+				<strong>Recap</strong>
+				<span>What you can now do, and where the rest of the toolkit lives.</span>
+			</a>
+		</li>
+	</ol>
+</section>
+
+<section class="canonical-artifact">
+	<h2>What you're building</h2>
+
+	<p>By the end of chapter 4, you'll have a small command — call it <code>importer.php</code> — that takes a ZIP file of Markdown posts and produces a WordPress WXR file:</p>
+
+<pre><code>$ php importer.php posts.zip > export.xml
+parsed 12 posts, 8 images
+rewrote 47 inline links
+fetched 8 image attachments (2.3 MB)
+wrote export.xml (94 KB, valid WXR 1.2)</code></pre>
+
+	<p>It's a real tool — the WordPress importer plugin will accept the output. You'll write it in pieces, one component per chapter, and the canonical example file grows with each chapter. By chapter 4 it's a hundred lines of pure PHP that depends on no extension beyond <code>json</code> and <code>mbstring</code>.</p>
+
+	<p>The actual content — twelve Markdown posts about cooking, with embedded images and frontmatter — is part of the tutorial's example data and ships pre-loaded into every snippet. You'll see it in chapter 1.</p>
+</section>
+
+<section class="next">
+	<a class="cta primary" href="quickstart.html">Start the quickstart →</a>
+</section>
+
+</main>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/learn/quickstart.html b/docs/learn/quickstart.html
new file mode 100644
index 000000000..9ef1dfdcd
--- /dev/null
+++ b/docs/learn/quickstart.html
@@ -0,0 +1,129 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Quickstart — PHP Toolkit</title>
+<meta name="description" content="Five minutes from zero to a runnable HTML rewrite using PHP Toolkit's HTML component.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="./">Learn</a>
+		<a href="../reference/">Reference</a>
+		<a class="github" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+
+<aside class="sidebar" aria-label="Tutorial navigation">
+	<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+	<nav class="toc" aria-label="Table of contents"></nav>
+	<details class="components-nav" open>
+		<summary>The path</summary>
+		<ol>
+			<li class="current"><a href="quickstart.html">Quickstart</a></li>
+			<li><a href="01-rewriting-html.html">1. Rewriting HTML</a></li>
+			<li><a href="02-streaming-archives.html">2. Streaming archives</a></li>
+			<li><a href="03-importing-content.html">3. Markdown to WXR</a></li>
+			<li><a href="04-talking-to-the-network.html">4. Talking to the network</a></li>
+			<li><a href="recap.html">Recap</a></li>
+		</ol>
+	</details>
+</aside>
+
+<article class="content">
+
+<h1>Quickstart</h1>
+
+<p class="lede">By the end of this page you will have rewritten an HTML attribute in five lines of PHP, in a runtime that lives inside this browser tab. You'll see the shape every chapter of the tutorial follows: a problem in plain English, a small chunk of code, and a paragraph that points at what to look at.</p>
+
+<h2 id="install">Install</h2>
+
+<p>You don't need to install anything to follow the tutorial — the snippets on this site run in your browser. If you want to run the same code in your own project later, this is the line you'll copy:</p>
+
+<pre><code>composer require wp-php-toolkit/html</code></pre>
+
+<p>Each component installs separately; you only pull in what you use. The HTML component depends on nothing except PHP itself.</p>
+
+<h2 id="rewrite">Rewrite an attribute</h2>
+
+<p>Here's the smallest useful thing the toolkit does. The example feeds a snippet of HTML into <code>WP_HTML_Tag_Processor</code>, finds every <code>&lt;img&gt;</code> tag, and adds <code>loading="lazy"</code> if the author didn't already set <code>loading</code> themselves.</p>
+
+<p>Click <em>Run</em>. The first run on this page boots a PHP runtime in WebAssembly and unzips the toolkit into it; later runs reuse the same runtime, so they're instant.</p>
+
+<php-snippet blueprint="toolkit-setup" name="quickstart.php">
+<script type="application/x-php">
+<?php
+// Quickstart: give every <img> a loading="lazy" attribute unless it already sets `loading`.
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+// Sample input: the first image has no `loading` attribute, the second already sets one.
+$html = '<article>
+	<img src="hero.jpg" alt="Hero shot">
+	<p>Welcome to the site.</p>
+	<img src="diagram.png" alt="" loading="eager">
+</article>';
+
+// Visit each <img> tag in turn.
+$tags = new WP_HTML_Tag_Processor( $html );
+while ( $tags->next_tag( 'img' ) ) {
+	// Only add the attribute when it is absent, so a value the author chose is never overwritten.
+	if ( null === $tags->get_attribute( 'loading' ) ) {
+		$tags->set_attribute( 'loading', 'lazy' );
+	}
+}
+
+// Print the HTML with the edits applied.
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<article>
+	<img src="hero.jpg" alt="Hero shot" loading="lazy">
+	<p>Welcome to the site.</p>
+	<img src="diagram.png" alt="" loading="eager">
+</article>
+</script>
+</php-snippet>
+
+<p>Look at the output. The first <code>&lt;img&gt;</code> gained <code>loading="lazy"</code>. The second one — which had <code>loading="eager"</code> already — was left alone. The whitespace, the <code>&lt;p&gt;</code> tag, the <code>&lt;article&gt;</code> wrapper, every byte we didn't ask the processor to touch came through unchanged. That property is the entire reason this component exists: rewriting HTML byte-for-byte without re-serializing it.</p>
+
+<aside class="callout try">
+	<strong>Try this:</strong> change <code>'lazy'</code> to <code>'eager'</code>, click <em>Run</em>, and see that only the first image flips. Then add a third <code>&lt;img&gt;</code> tag inside the <code>&lt;p&gt;</code> and run again — the processor finds it without you touching the loop.
+</aside>
+
+<h2 id="why-cursor">Why a cursor, not a DOM</h2>
+
+<p>The traditional PHP move here is <code>DOMDocument::loadHTML</code>. That works, but loading 50 KB of post content into a libxml DOM, mutating it, and serializing it back gives you a string that's <em>nearly</em> the same as the input — different whitespace, normalized attribute quoting, occasionally a self-closing tag where there wasn't one before. For email templates and feed readers that compare strings byte-for-byte, that's a bug.</p>
+
+<p>The Tag Processor walks the HTML linearly, records edits as a small list of byte-range replacements, and applies them only when you call <code>get_updated_html()</code>. The HTML you didn't edit comes through bit-identical. The HTML you edited contains exactly your edits, and nothing else.</p>
+
+<p>That model — small, linear, byte-honest — is the toolkit's whole sensibility. Every other component that follows uses some version of it.</p>
+
+<h2 id="recap">Recap</h2>
+
+<p>You can now:</p>
+
+<ul>
+	<li>Run a PHP Toolkit snippet in the browser without installing anything.</li>
+	<li>Read an HTML string with <code>WP_HTML_Tag_Processor</code> and walk every tag of a given name.</li>
+	<li>Add or replace an attribute with <code>set_attribute()</code> and read the modified HTML with <code>get_updated_html()</code>.</li>
+</ul>
+
+<p>That's the whole shape of the tutorial. Each chapter takes one component, shows you the smallest useful thing it does, and folds the result into a content importer that grows page by page.</p>
+
+<nav class="chapter-nav">
+	<a class="next" href="01-rewriting-html.html">Next: Chapter 1 — Rewriting HTML safely →</a>
+</nav>
+
+<p class="next-preview">In chapter 1 you'll meet the canonical importer's first input — a folder of Markdown posts whose embedded HTML needs cleaning before it ever sees a WordPress database. We'll add lazy loading, rewrite relative URLs, and strip event handlers in a single linear pass.</p>
+
+</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/learn/recap.html b/docs/learn/recap.html
new file mode 100644
index 000000000..0b5ae055b
--- /dev/null
+++ b/docs/learn/recap.html
@@ -0,0 +1,95 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Recap — PHP Toolkit</title>
+<meta name="description" content="Where to go after the four-chapter tutorial — what the importer used, what the toolkit covers beyond it.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="./">Learn</a>
+		<a href="../reference/">Reference</a>
+		<a class="github" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<main class="learn-landing">
+
+<h1>Recap and where to go next</h1>
+
+<p class="lede">Across four chapters you built a working content importer. It reads a ZIP of Markdown posts, cleans the HTML inside each one, frontloads referenced images over HTTP, and streams a WXR file the WordPress importer plugin will accept. None of it required curl, libzip, libxml2, or DOMDocument; all of it runs on PHP 7.2 through 8.3 and inside a browser via WordPress Playground.</p>
+
+<section class="what-you-built">
+	<h2>What you built</h2>
+
+	<table class="proof-table">
+	<tr><td>Chapter 1</td><td>→</td><td><code>clean_post_html()</code> using <code>WP_HTML_Tag_Processor</code>: lazy-load images, rewrite URLs, strip scripts, all in one pass.</td></tr>
+	<tr><td>Chapter 2</td><td>→</td><td>Read the input ZIP through <code>ZipFilesystem</code>, stage it in <code>InMemoryFilesystem</code>, defend against zip-slip with <code>ZipDecoder::sanitize_path()</code>.</td></tr>
+	<tr><td>Chapter 3</td><td>→</td><td>Convert each post with <code>MarkdownConsumer</code>, audit the output with <code>WP_Block_Parser</code>, stream the WXR with <code>WXRWriter</code>.</td></tr>
+	<tr><td>Chapter 4</td><td>→</td><td>Frontload images with <code>HttpClient</code> through a sliding-window event loop; mount remote archives with <code>SeekableRequestReadStream</code>.</td></tr>
+	</table>
+</section>
+
+<section class="not-covered">
+	<h2>What the toolkit does that the tutorial didn't touch</h2>
+
+	<p>The importer used eight components. The toolkit ships eighteen. Here's what's left, with the use case each one shows up in:</p>
+
+	<ul class="component-summary">
+		<li><strong>Git</strong> — snapshot your importer's runs into a pure-PHP Git repository for revision history. Useful for "what changed between last week's import and this week's." <a href="../reference/git.html">Reference →</a></li>
+		<li><strong>Merge</strong> — three-way diff and merge for content sync. If posts are edited on both the source and the destination side, this is how you reconcile them. <a href="../reference/merge.html">Reference →</a></li>
+		<li><strong>HttpServer</strong> — a tiny local listening port for OAuth callbacks during a CLI workflow, fixture servers for HttpClient tests, or a status page during a long import. Not for production traffic. <a href="../reference/httpserver.html">Reference →</a></li>
+		<li><strong>CORSProxy</strong> — when you ship the importer as a browser tool, a server-side proxy to fetch URLs that don't send the right CORS headers. <a href="../reference/corsproxy.html">Reference →</a></li>
+		<li><strong>CLI</strong> — POSIX-style argument parser to wrap your importer as <code>importer.php --site-url=… --dry-run</code>. <a href="../reference/cli.html">Reference →</a></li>
+		<li><strong>Encoding</strong> — UTF-8 validation and scrubbing for inputs that may contain mixed encodings. Most importers eventually need it. <a href="../reference/encoding.html">Reference →</a></li>
+		<li><strong>XML</strong> — the cursor-based XML processor underneath DataLiberation; reach for it directly when you need to walk export-sized files. <a href="../reference/xml.html">Reference →</a></li>
+		<li><strong>Blueprints</strong> — declarative site setup. Spin up the destination WordPress with the right plugins and options before running the importer against it. <a href="../reference/blueprints.html">Reference →</a></li>
+		<li><strong>Polyfill</strong> — WordPress-shaped helpers (<code>esc_html</code>, <code>add_filter</code>, <code>__</code>) so toolkit code can run outside WordPress without ifdefs. <a href="../reference/polyfill.html">Reference →</a></li>
+		<li><strong>ToolkitCodingStandards</strong> — PHPCS sniffs encoding the project's review feedback as enforceable rules. Borrow if your project follows WordPress style. <a href="../reference/coding-standards.html">Reference →</a></li>
+	</ul>
+</section>
+
+<section class="patterns">
+	<h2>Patterns worth keeping</h2>
+
+	<p>Three shapes recurred across the tutorial. Watch for them in your own code:</p>
+
+	<h3>Cursor over a string</h3>
+	<p><code>WP_HTML_Tag_Processor</code> walks a string forward, records edits as a side-buffer of byte-range replacements, and emits the modified string only when you call <code>get_updated_html()</code>. The result is byte-honest — bytes you didn't edit come through bit-identical. When you need to make small changes to large markup, that property is gold. The XML component's <code>XMLProcessor</code> applies the same pattern to XML.</p>
+
+	<h3>Pull / consume streams</h3>
+	<p><code>ZipFilesystem::open_read_stream()</code>, <code>HttpClient</code> response bodies, <code>InflateReadStream</code>, and the rest all share the same shape: <code>pull(N)</code> reads up to <code>N</code> bytes from the underlying source into an internal buffer and returns how many ended up there; <code>consume(N)</code> reads <code>N</code> bytes from that buffer and advances past them. Memory used is bounded by the chunk size, never by the file size. Once you internalize this loop you can compose any byte source with any byte sink.</p>
+
+	<h3>One interface, multiple backends</h3>
+	<p>Code that takes a <code>Filesystem</code> rather than a path doesn't care if the filesystem is on disk, in memory, in a SQLite database, or inside a ZIP. That's how the importer's stage works for both production (memory) and debugging (local disk) without a code change. Same pattern shows up in HttpClient (curl vs sockets transport) and ByteStream (file, memory, deflate, hash all implementing the same byte-stream interface).</p>
+</section>
+
+<section class="next-actions">
+	<h2>Where to go from here</h2>
+
+	<p>Three honest paths:</p>
+
+	<ol>
+		<li><strong>Take the importer further.</strong> Add a <code>--dry-run</code> flag with the CLI component. Snapshot each run into a Git repository so you can diff between imports. Wrap it in a CORSProxy-fronted browser tool. Each of those is a one-component addition; the structure you have already accommodates them.</li>
+		<li><strong>Pick a single component and go deep.</strong> The reference pages all have refinements past the minimal example — bookmarks and breadcrumbs in HTML, three-way merges in Git, sliding windows and resumable downloads in HttpClient. The depth is there when the project asks for it.</li>
+		<li><strong>Read the source.</strong> Each component lives under <code>components/&lt;Name&gt;/</code>. <code>components/HTML/class-wp-html-tag-processor.php</code> is the same code WordPress core ships in <code>wp-includes/html-api/</code>; <code>components/Zip/class-zipdecoder.php</code> is a clean implementation of the parts of the ZIP spec that the toolkit actually uses. The code is written to be read.</li>
+	</ol>
+</section>
+
+<section class="cta-row" style="margin-top: 3rem;">
+	<a class="cta primary" href="../reference/">Browse all 18 components →</a>
+	<a class="cta" href="../">Back to landing</a>
+	<a class="cta" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+</section>
+
+</main>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/blockparser.html b/docs/reference/blockparser.html
new file mode 100644
index 000000000..d58906482
--- /dev/null
+++ b/docs/reference/blockparser.html
@@ -0,0 +1,330 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>BlockParser — PHP Toolkit reference</title>
+<meta name="description" content="WordPress core&#x27;s block parser, packaged as a standalone library. Turn block markup into a structured tree, lint posts for common authoring mistakes, and audit block usage — all without booting WordPress.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li class="current"><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>BlockParser</h1>
+
+<p class="lede">WordPress core's block parser, packaged as a standalone library. Turn block markup into a structured tree, lint posts for common authoring mistakes, and audit block usage — all without booting WordPress.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/blockparser</code></pre>
+
+<aside class="callout credit">
+	<strong>WordPress core, packaged standalone.</strong> <code>WP_Block_Parser</code> is WordPress core's block parser, packaged here so importers and linters can read <a href="https://developer.wordpress.org/block-editor/reference-guides/block-api/">block markup</a> without booting WordPress. Source: <a href="https://github.com/WordPress/wordpress-develop/blob/trunk/src/wp-includes/class-wp-block-parser.php">WordPress/wordpress-develop</a>.
+</aside>
+
+<p>Block markup is not plain HTML. A post can contain HTML comments that identify blocks, JSON attributes inside those comments, freeform HTML between blocks, and nested blocks whose rendered HTML is interleaved with parent markup.</p><p>This component packages WordPress core's block parser so importers, linters, migration tools, and static analyzers can understand block content without loading WordPress. It deliberately mirrors core behavior — same array shape, same <code>null</code> blocks for freeform HTML, same core block names such as <code>core/paragraph</code> — so code written against this parser keeps working when run inside WordPress, and vice versa.</p><p>Reach for it when you need answers about the block tree: which blocks a post uses, which attributes they carry, where nested blocks appear, or whether content violates a rule your project cares about.</p>
+
+<h2 id="what-you-get-back">What you get back</h2>
+
+<p><code>WP_Block_Parser::parse()</code> returns an array of blocks. Each block is an associative array with five keys: <code>blockName</code>, <code>attrs</code>, <code>innerBlocks</code>, <code>innerHTML</code>, and <code>innerContent</code>.</p><p><code>innerHTML</code> is the HTML inside the block <em>with inner blocks stripped out</em>. <code>innerContent</code> is the interleaved version: an array of HTML strings with <code>null</code> placeholders marking where each inner block belongs.</p><p>Most code starts by checking <code>blockName</code>, then reading <code>attrs</code> or <code>innerHTML</code>. When a post has container blocks such as Group, Columns, or Navigation, look inside <code>innerBlocks</code> too.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p>The simplest possible use. Pass a string, get back a tree.</p>
+
+<php-snippet blueprint="toolkit-setup" name="parse.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+// Two serialized blocks, a heading and a paragraph, separated by a blank line.
+$document = "<!-- wp:heading {\"level\":2} -->\n<h2>Welcome</h2>\n<!-- /wp:heading -->\n\n"
+	. "<!-- wp:paragraph -->\n<p>Hello from the block editor.</p>\n<!-- /wp:paragraph -->";
+
+$parser = new WP_Block_Parser();
+
+// Print one "name: text" line for every named block.
+foreach ( $parser->parse( $document ) as $parsed_block ) {
+	$block_name = $parsed_block['blockName'];
+
+	// Freeform HTML between blocks is reported with a null name; leave it out.
+	if ( null !== $block_name ) {
+		$plain_text = trim( strip_tags( $parsed_block['innerHTML'] ) );
+		echo $block_name . ': ' . $plain_text . "\n";
+	}
+}
+</script>
+<script type="text/expected-output">
+core/heading: Welcome
+core/paragraph: Hello from the block editor.
+</script>
+</php-snippet>
+
+<h2 id="refinement-count-every-block-type-in-a-post">Refinement: count every block type in a post</h2>
+
+<p>A common audit task: "How many Paragraph, Image, and Gallery blocks does this post use?" A small queue keeps the example readable while still visiting nested blocks.</p>
+
+<php-snippet blueprint="toolkit-setup" name="count-blocks.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$document = "<!-- wp:group --><div class=\"wp-block-group\">"
+	. "<!-- wp:heading --><h2>Title</h2><!-- /wp:heading -->"
+	. "<!-- wp:paragraph --><p>One.</p><!-- /wp:paragraph -->"
+	. "<!-- wp:paragraph --><p>Two.</p><!-- /wp:paragraph -->"
+	. "<!-- wp:image {\"id\":1} --><figure><img src=\"a.jpg\"/></figure><!-- /wp:image -->"
+	. "</div><!-- /wp:group -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+
+// Tally how often each block name occurs, visiting nested blocks through a queue.
+$counts = array();
+$queue  = $blocks;
+
+while ( ! empty( $queue ) ) {
+	$block = array_shift( $queue );
+
+	// Freeform HTML has a null name and is not counted.
+	if ( null !== $block['blockName'] ) {
+		$name            = $block['blockName'];
+		$counts[ $name ] = isset( $counts[ $name ] ) ? $counts[ $name ] + 1 : 1;
+	}
+
+	// Queue the children so blocks inside containers are counted too.
+	foreach ( $block['innerBlocks'] as $inner_block ) {
+		$queue[] = $inner_block;
+	}
+}
+
+// Most-used blocks first. Ties are broken by name so the order is the same on
+// every PHP version; plain arsort() only keeps tied entries in place on PHP 8.0+.
+$names = array_keys( $counts );
+usort(
+	$names,
+	function ( $a, $b ) use ( $counts ) {
+		if ( $counts[ $a ] !== $counts[ $b ] ) {
+			return $counts[ $b ] - $counts[ $a ];
+		}
+		return strcmp( $a, $b );
+	}
+);
+
+foreach ( $names as $name ) {
+	echo str_pad( (string) $counts[ $name ], 4, ' ', STR_PAD_LEFT ) . '  ' . $name . "\n";
+}
+</script>
+<script type="text/expected-output">
+   2  core/paragraph
+   1  core/group
+   1  core/heading
+   1  core/image
+</script>
+</php-snippet>
+
+<h2 id="refinement-check-whether-a-post-uses-a-block">Refinement: check whether a post uses a block</h2>
+
+<p>Useful for templates, audits, and migrations: answer one yes/no question without caring where the block appears in the tree.</p>
+
+<php-snippet blueprint="toolkit-setup" name="has-block.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$document = "<!-- wp:group --><div class=\"wp-block-group\">"
+	. "<!-- wp:buttons --><div class=\"wp-block-buttons\">"
+	. "<!-- wp:button --><div class=\"wp-block-button\"><a>Buy now</a></div><!-- /wp:button -->"
+	. "</div><!-- /wp:buttons -->"
+	. "</div><!-- /wp:group -->";
+
+$tree = ( new WP_Block_Parser() )->parse( $document );
+
+/**
+ * Reports whether a block with the given name appears anywhere in the tree.
+ *
+ * @param array  $blocks Parsed blocks, as returned by WP_Block_Parser::parse().
+ * @param string $name   Block name to look for, e.g. 'core/button'.
+ * @return bool True when the block is found at any depth, false otherwise.
+ */
+function post_has_block( $blocks, $name ) {
+	foreach ( $blocks as $candidate ) {
+		// Match this block, or search the blocks nested inside it.
+		if ( $name === $candidate['blockName'] || post_has_block( $candidate['innerBlocks'], $name ) ) {
+			return true;
+		}
+	}
+
+	return false;
+}
+
+if ( post_has_block( $tree, 'core/button' ) ) {
+	echo "has button\n";
+} else {
+	echo "missing button\n";
+}
+
+if ( post_has_block( $tree, 'core/gallery' ) ) {
+	echo "has gallery\n";
+} else {
+	echo "missing gallery\n";
+}
+</script>
+<script type="text/expected-output">
+has button
+missing gallery
+</script>
+</php-snippet>
+
+<h2 id="refinement-lint-headings-for-hierarchy-mistakes">Refinement: lint headings for hierarchy mistakes</h2>
+
+<p>"Don't skip from H2 to H4" is a real accessibility rule. The helper below keeps headings in document order, including headings nested inside Group, Column, and Cover blocks.</p>
+
+<php-snippet blueprint="toolkit-setup" name="lint-headings.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$document = "<!-- wp:heading -->\n<h2>Intro</h2>\n<!-- /wp:heading -->"
+	. "<!-- wp:heading {\"level\":4} -->\n<h4>Subsection</h4>\n<!-- /wp:heading -->"
+	. "<!-- wp:heading {\"level\":3} -->\n<h3>Body</h3>\n<!-- /wp:heading -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+
+/**
+ * Appends every heading in the tree to $headings, in document order.
+ *
+ * @param array $blocks   Parsed blocks to scan, including their inner blocks.
+ * @param array $headings Collected headings; each entry has 'level' and 'text'.
+ */
+function collect_headings( $blocks, &$headings ) {
+	foreach ( $blocks as $node ) {
+		if ( 'core/heading' === $node['blockName'] ) {
+			// A heading block without a `level` attribute is treated as an H2.
+			$depth = 2;
+			if ( isset( $node['attrs']['level'] ) ) {
+				$depth = (int) $node['attrs']['level'];
+			}
+
+			$headings[] = array(
+				'level' => $depth,
+				'text'  => trim( strip_tags( $node['innerHTML'] ) ),
+			);
+		}
+
+		// Descend after recording the block itself so the order follows the document.
+		collect_headings( $node['innerBlocks'], $headings );
+	}
+}
+
+$headings = array();
+collect_headings( $blocks, $headings );
+
+// Start from level 1 so that an opening H2 passes and an opening H3 or deeper is flagged.
+$previous = 1;
+foreach ( $headings as $entry ) {
+	$current = $entry['level'];
+	$title   = $entry['text'];
+
+	// Going more than one level deeper than the previous heading is a skip.
+	$skipped = $current > $previous + 1;
+
+	echo $skipped
+		? "WARN {$title}: jumped from H{$previous} to H{$current}\n"
+		: "ok   {$title}: H{$current}\n";
+
+	$previous = $current;
+}
+</script>
+<script type="text/expected-output">
+ok   Intro: H2
+WARN Subsection: jumped from H2 to H4
+ok   Body: H3
+</script>
+</php-snippet>
+
+<h2 id="refinement-find-all-instances-of-a-custom-block">Refinement: find all instances of a custom block</h2>
+
+<p>When auditing an export for a block your plugin owns, collect every match and print the fields a human cares about.</p>
+
+<php-snippet blueprint="toolkit-setup" name="find-custom-block.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$document = "<!-- wp:paragraph --><p>Reviews</p><!-- /wp:paragraph -->"
+	. "<!-- wp:my-plugin/testimonial {\"author\":\"Jane\",\"rating\":5} -->"
+	. "<blockquote>Loved it.</blockquote>"
+	. "<!-- /wp:my-plugin/testimonial -->"
+	. "<!-- wp:my-plugin/testimonial {\"author\":\"Joe\",\"rating\":4} -->"
+	. "<blockquote>Pretty good.</blockquote>"
+	. "<!-- /wp:my-plugin/testimonial -->";
+
+$blocks = ( new WP_Block_Parser() )->parse( $document );
+
+/**
+ * Appends every block with the given name to $matches, in document order.
+ *
+ * @param array  $blocks  Parsed blocks to scan, including their inner blocks.
+ * @param string $name    Block name to match, e.g. 'my-plugin/testimonial'.
+ * @param array  $matches Collected matching blocks.
+ */
+function find_blocks_by_name( $blocks, $name, &$matches ) {
+	foreach ( $blocks as $block ) {
+		if ( $name === $block['blockName'] ) {
+			$matches[] = $block;
+		}
+
+		find_blocks_by_name( $block['innerBlocks'], $name, $matches );
+	}
+}
+
+$testimonials = array();
+find_blocks_by_name( $blocks, 'my-plugin/testimonial', $testimonials );
+
+foreach ( $testimonials as $i => $b ) {
+	// Exported content may omit attributes; use placeholders instead of
+	// triggering undefined-index warnings in the middle of the report.
+	$author = isset( $b['attrs']['author'] ) ? $b['attrs']['author'] : '(no author)';
+	$rating = isset( $b['attrs']['rating'] ) ? $b['attrs']['rating'] : '?';
+
+	echo ( $i + 1 ) . '. ' . $author . ' (' . $rating . '/5): '
+		. trim( strip_tags( $b['innerHTML'] ) ) . "\n";
+}
+</script>
+<script type="text/expected-output">
+1. Jane (5/5): Loved it.
+2. Joe (4/5): Pretty good.
+</script>
+</php-snippet>
+
+<h2 id="refinement-detect-blocks-with-stale-embed-urls">Refinement: detect blocks with stale embed URLs</h2>
+
+<p>A real-world content audit: find every <code>core/embed</code> whose URL points at a domain you have retired.</p>
+
+<php-snippet blueprint="toolkit-setup" name="audit-embeds.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$document = '<!-- wp:embed {"url":"https://twitter.com/wordpress/status/1","providerNameSlug":"twitter"} /-->'
+	. '<!-- wp:embed {"url":"https://youtube.com/watch?v=abc","providerNameSlug":"youtube"} /-->'
+	. '<!-- wp:embed {"url":"https://vine.co/v/xyz","providerNameSlug":"vine"} /-->';
+
+// Retired hosts, written in lowercase: hosts are lowercased before they are compared.
+$retired = array( 'vine.co', 'plus.google.com' );
+
+// Walk the whole tree rather than only the top level, so an embed placed
+// inside a container block such as Group or Columns is audited too.
+$queue = ( new WP_Block_Parser() )->parse( $document );
+
+while ( ! empty( $queue ) ) {
+	$b = array_shift( $queue );
+
+	// Put inner blocks at the front of the queue so results stay in document order.
+	$queue = array_merge( $b['innerBlocks'], $queue );
+
+	if ( 'core/embed' !== $b['blockName'] ) {
+		continue;
+	}
+
+	$url  = isset( $b['attrs']['url'] ) ? $b['attrs']['url'] : '';
+	$host = parse_url( $url, PHP_URL_HOST );
+
+	// Host names are case-insensitive, so compare in lowercase.
+	$bad = $host && in_array( strtolower( $host ), $retired, true );
+	echo ( $bad ? 'STALE  ' : 'ok     ' ) . $url . "\n";
+}
+</script>
+<script type="text/expected-output">
+ok     https://twitter.com/wordpress/status/1
+ok     https://youtube.com/watch?v=abc
+STALE  https://vine.co/v/xyz
+</script>
+</php-snippet>
+
+<h2 id="pitfalls">Pitfalls</h2>
+
+<aside class="callout pitfall">Freeform HTML between blocks shows up as a block with <code>blockName === null</code>. Always skip that case before comparing names.</aside>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="html.html"><strong>HTML</strong></a><span>Inspect or rewrite the HTML carried by parsed blocks.</span></li>
+	<li><a href="markdown.html"><strong>Markdown</strong></a><span>Move between author-friendly Markdown and serialized block markup.</span></li>
+	<li><a href="dataliberation.html"><strong>DataLiberation</strong></a><span>Audit and transform blocks while migrating content.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/blueprints.html b/docs/reference/blueprints.html
new file mode 100644
index 000000000..2c69e22bb
--- /dev/null
+++ b/docs/reference/blueprints.html
@@ -0,0 +1,228 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Blueprints — PHP Toolkit reference</title>
+<meta name="description" content="Declarative WordPress site provisioning. Write a JSON description of plugins, options, and content; let the runner execute it.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li class="current"><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>Blueprints</h1>
+
+<p class="lede">Declarative WordPress site provisioning. Write a JSON description of plugins, options, and content; let the runner execute it.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/blueprints</code></pre>
+
+<p>A WordPress environment is more than a database dump. It can require a specific core version, plugins, themes, site options, uploaded files, content, and setup steps. Rebuilding that by hand makes demos, tests, bug reports, workshops, and CI fixtures drift over time.</p><p>The Blueprints component treats site setup as data. A blueprint JSON document describes the desired steps, and the runner applies them to either a new WordPress install or an existing one. The validator exists because user-authored JSON needs clear, path-specific errors rather than generic schema failures.</p><p><code>RunnerConfiguration</code> separates the web root from the WordPress core directory, since real hosts often put them in different places. Both paths are explicit on the runner, never inferred.</p><p>Blueprints can <em>create</em> a new WordPress install (download core, set up the database, apply steps) or <em>apply to an existing</em> site. Creating a fresh install needs filesystem access this in-browser runtime doesn't have, so the runnable snippets focus on <code>APPLY_TO_EXISTING_SITE</code>.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p><code>RunnerConfiguration</code> is a fluent builder. The minimum: target site root, target site URL, execution mode.</p>
+
+<php-snippet blueprint="toolkit-setup" name="configure.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Blueprints\Runner;
+use WordPress\Blueprints\RunnerConfiguration;
+
+$config = ( new RunnerConfiguration() )
+	->set_execution_mode( Runner::EXECUTION_MODE_APPLY_TO_EXISTING_SITE )
+	->set_target_site_root( '/wordpress' )
+	->set_target_site_url( 'http://playground.test/' );
+
+echo "mode: " . $config->get_execution_mode() . "\n";
+echo "root: " . $config->get_target_site_root() . "\n";
+echo "url:  " . $config->get_target_site_url() . "\n";
+</script>
+<script type="text/expected-output">
+mode: apply-to-existing-site
+root: /wordpress
+url:  http://playground.test/
+</script>
+</php-snippet>
+
+<h2 id="refinement-generate-blueprint-json-from-php">Refinement: generate blueprint JSON from PHP</h2>
+
+<p>CI jobs and tests stay clearer when PHP builds the blueprint from data instead of hand-writing JSON. Keep the structure plain: <code>version</code>, then a list of step arrays.</p>
+
+<php-snippet blueprint="toolkit-setup" name="build-json.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$site_name = 'Demo Site';
+$plugins   = array( 'gutenberg', 'classic-editor' );
+
+$blueprint = array(
+	'version' => 2,
+	'steps'   => array(
+		array(
+			'step'    => 'setSiteOptions',
+			'options' => array(
+				'blogname'              => $site_name,
+				'permalink_structure'   => '/%postname%/',
+				'show_on_front'         => 'page',
+			),
+		),
+	),
+);
+
+foreach ( $plugins as $slug ) {
+	$blueprint['steps'][] = array(
+		'step'       => 'installPlugin',
+		'pluginData' => "https://downloads.wordpress.org/plugin/{$slug}.zip",
+	);
+	$blueprint['steps'][] = array(
+		'step'   => 'activatePlugin',
+		'plugin' => "{$slug}/{$slug}.php",
+	);
+}
+
+echo json_encode( $blueprint, JSON_PRETTY_PRINT | JSON_UNESCAPED_SLASHES ) . "\n";
+</script>
+<script type="text/expected-output">
+{
+    "version": 2,
+    "steps": [
+        {
+            "step": "setSiteOptions",
+            "options": {
+                "blogname": "Demo Site",
+                "permalink_structure": "/%postname%/",
+                "show_on_front": "page"
+            }
+        },
+        {
+            "step": "installPlugin",
+            "pluginData": "https://downloads.wordpress.org/plugin/gutenberg.zip"
+        },
+        {
+            "step": "activatePlugin",
+            "plugin": "gutenberg/gutenberg.php"
+        },
+        {
+            "step": "installPlugin",
+            "pluginData": "https://downloads.wordpress.org/plugin/classic-editor.zip"
+        },
+        {
+            "step": "activatePlugin",
+            "plugin": "classic-editor/classic-editor.php"
+        }
+    ]
+}
+</script>
+</php-snippet>
+
+<h2 id="refinement-validate-before-running">Refinement: validate before running</h2>
+
+<p>The schema validator returns a human-readable <code>ValidationError</code> instead of a generic "does not match schema" failure. Use it before handing user-authored JSON to a runner.</p>
+
+<php-snippet blueprint="toolkit-setup" name="validate.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Blueprints\Validator\HumanFriendlySchemaValidator;
+
+$schema = array(
+	'type'       => 'object',
+	'required'   => array( 'version', 'steps' ),
+	'properties' => array(
+		'version' => array( 'type' => 'integer' ),
+		'steps'   => array(
+			'type'  => 'array',
+			'items' => array(
+				'type'       => 'object',
+				'required'   => array( 'step' ),
+				'properties' => array(
+					'step' => array( 'type' => 'string' ),
+				),
+			),
+		),
+	),
+);
+
+$blueprint = array(
+	'version' => 2,
+	'steps'   => array(
+		array( 'pluginData' => 'https://downloads.wordpress.org/plugin/gutenberg.zip' ),
+	),
+);
+
+$error = ( new HumanFriendlySchemaValidator( $schema ) )->validate( $blueprint );
+if ( null === $error ) {
+	echo "valid\n";
+} else {
+	echo $error->get_pretty_path() . ": " . $error->message . "\n";
+}
+</script>
+<script type="text/expected-output">
+Blueprint root["steps"][0]: Missing required field: step.
+</script>
+</php-snippet>
+
+<h2 id="the-blueprint-json-shape">The Blueprint JSON shape</h2>
+
+<p>A blueprint is a JSON document with a <code>version</code> field and a <code>steps</code> array. Each step has a <code>"step"</code> discriminator and step-specific fields. This is the same shape used by <a href="https://playground.wordpress.net/">WordPress Playground</a>.</p>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="filesystem.html"><strong>Filesystem</strong></a><span>Prepare files and fixtures before applying site setup steps.</span></li>
+	<li><a href="httpclient.html"><strong>HttpClient</strong></a><span>Download packages or source data as part of provisioning workflows.</span></li>
+	<li><a href="cli.html"><strong>CLI</strong></a><span>Wrap repeatable blueprint operations in a small command.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/bytestream.html b/docs/reference/bytestream.html
new file mode 100644
index 000000000..eed37bf85
--- /dev/null
+++ b/docs/reference/bytestream.html
@@ -0,0 +1,244 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>ByteStream — PHP Toolkit reference</title>
+<meta name="description" content="Composable streaming primitives for reading, writing, transforming, hashing, and compressing byte data. Pull/peek/consume semantics let parsers backtrack without copying, and deflate, inflate, and checksum filters snap together like Lego.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li class="current"><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>ByteStream</h1>
+
+<p class="lede">Composable streaming primitives for reading, writing, transforming, hashing, and compressing byte data. Pull/peek/consume semantics let parsers backtrack without copying, and deflate, inflate, and checksum filters snap together like Lego.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/bytestream</code></pre>
+
+<p>PHP's native streams are powerful but inconsistent. <code>fread</code> on a socket may return short reads with no warning; <code>stream_filter_append</code> is awkward to compose; gzip helpers and file handles expose different APIs. The ByteStream component normalizes these behind one small interface — <code>pull / peek / consume</code> — so a parser, a hash function, and a deflate filter all see the same shape.</p><p>The split between <em>pull</em> (buffer up to N bytes) and <em>consume</em> (advance past N bytes) is the secret. Parsers can <code>peek</code> ahead to detect a record boundary and decide whether to <code>consume</code>, without copying or allocating.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p>The canonical loop. <code>pull(N)</code> reads up to <code>N</code> bytes from the underlying source into an internal buffer and returns how many ended up there; <code>consume(N)</code> reads <code>N</code> bytes from that buffer and advances past them. The buffer never grows beyond the chunk size you ask for.</p>
+
+<php-snippet blueprint="toolkit-setup" name="teaser-read.php">
+<script type="application/x-php">
+<?php
+/**
+ * Reads a temporary file through FileReadStream in 256-byte chunks and
+ * reports how many bytes were consumed in total.
+ */
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\ReadStream\FileReadStream;
+
+// Fixture: 200 lines of 9 bytes each, 1800 bytes in total.
+$path = tempnam( sys_get_temp_dir(), 'demo' );
+file_put_contents( $path, str_repeat( "log line\n", 200 ) );
+
+$reader = FileReadStream::from_path( $path );
+$total  = 0;
+while ( ! $reader->reached_end_of_data() ) {
+	// pull() buffers up to 256 bytes and returns how many are available.
+	$n = $reader->pull( 256 );
+	if ( 0 === $n ) {
+		break;
+	}
+	// consume() hands back the buffered bytes and advances past them.
+	$total += strlen( $reader->consume( $n ) );
+}
+$reader->close_reading();
+
+// tempnam() creates a real file on disk; remove it so the example leaves nothing behind.
+unlink( $path );
+
+echo "Read {$total} bytes in 256-byte chunks.\n";
+</script>
+<script type="text/expected-output">
+Read 1800 bytes in 256-byte chunks.
+</script>
+</php-snippet>
+
+<h2 id="refinement-memorypipe-as-write-then-read-buffer">Refinement: MemoryPipe as write-then-read buffer</h2>
+
+<p><code>MemoryPipe</code> is bidirectional: you <code>append_bytes()</code> as a writer and <code>pull/consume</code> as a reader. Easiest way to wire one component's output into another's input.</p>
+
+<php-snippet blueprint="toolkit-setup" name="memory-pipe.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+
+$pipe = new MemoryPipe();
+$pipe->append_bytes( "first chunk\n" );
+$pipe->append_bytes( "second chunk\n" );
+$pipe->append_bytes( "third chunk\n" );
+$pipe->close_writing();
+
+while ( ! $pipe->reached_end_of_data() ) {
+	$n = $pipe->pull( 1024 );
+	if ( 0 === $n ) break;
+	echo "got: " . $pipe->consume( $n );
+}
+</script>
+<script type="text/expected-output">
+got: first chunk
+second chunk
+third chunk
+</script>
+</php-snippet>
+
+<h2 id="refinement-compress-on-the-way-in-decompress-on-the-way-out">Refinement: compress on the way in, decompress on the way out</h2>
+
+<p>Wrap a stream in <code>DeflateReadStream</code> to get compressed bytes out; wrap it in <code>InflateReadStream</code> to get decompressed bytes out. Both are full <code>ByteReadStream</code> implementations, so they nest into anything else that takes a stream.</p>
+
+<php-snippet blueprint="toolkit-setup" name="deflate-roundtrip.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\DeflateReadStream;
+use WordPress\ByteStream\ReadStream\InflateReadStream;
+
+$original = str_repeat( "the quick brown fox. ", 50 );
+
+$src        = new MemoryPipe( $original );
+$src->close_writing();
+$deflated   = new DeflateReadStream( $src, ZLIB_ENCODING_DEFLATE );
+$compressed = $deflated->consume_all();
+
+$src2     = new MemoryPipe( $compressed );
+$src2->close_writing();
+$inflated = new InflateReadStream( $src2, ZLIB_ENCODING_DEFLATE );
+$round    = $inflated->consume_all();
+
+printf( "original  : %d bytes\n", strlen( $original ) );
+printf( "deflated  : %d bytes (%.1f%%)\n", strlen( $compressed ), 100 * strlen( $compressed ) / strlen( $original ) );
+printf( "round-trip: %s\n", $round === $original ? 'OK' : 'BROKEN' );
+</script>
+<script type="text/expected-output">
+original  : 1050 bytes
+deflated  : 45 bytes (4.3%)
+round-trip: OK
+</script>
+</php-snippet>
+
+<h2 id="refinement-line-by-line-reads-from-a-chunked-source">Refinement: line-by-line reads from a chunked source</h2>
+
+<p>Reading text by line means handling chunk boundaries that fall mid-line. Keep the trailing partial line and prepend it to the next pull. The rest of the loop pretends the data was always whole.</p>
+
+<php-snippet blueprint="toolkit-setup" name="lines.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+
+$pipe = new MemoryPipe();
+$pipe->append_bytes( "alpha\nbravo\ncharl" );
+$pipe->append_bytes( "ie\ndelta\necho\n" );
+$pipe->close_writing();
+
+$tail = '';
+$count = 0;
+while ( ! $pipe->reached_end_of_data() ) {
+	$n = $pipe->pull( 8 );
+	if ( 0 === $n ) break;
+	$buf   = $tail . $pipe->consume( $n );
+	$lines = explode( "\n", $buf );
+	$tail  = array_pop( $lines );
+	foreach ( $lines as $line ) {
+		printf( "[%d] %s\n", ++$count, $line );
+	}
+}
+if ( '' !== $tail ) {
+	printf( "[%d] %s\n", ++$count, $tail );
+}
+</script>
+<script type="text/expected-output">
+[1] alpha
+[2] bravo
+[3] charlie
+[4] delta
+[5] echo
+</script>
+</php-snippet>
+
+<h2 id="refinement-limit-a-stream-to-a-fixed-window">Refinement: limit a stream to a fixed window</h2>
+
+<p><code>LimitedByteReadStream</code> exposes only the next N bytes of an underlying stream as if those were the entire stream. This is how the ZIP decoder hands you the body of one entry without letting you read into the next.</p>
+
+<php-snippet blueprint="toolkit-setup" name="limited.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\LimitedByteReadStream;
+
+$source = new MemoryPipe( "HEADER:42|BODY:hello there|FOOTER:done" );
+$source->close_writing();
+
+$source->pull( 10 );
+$source->consume( 10 );
+
+$body = new LimitedByteReadStream( $source, 16 );
+echo "body sees: " . $body->consume_all() . "\n";
+echo "remaining in source: " . $source->consume_all() . "\n";
+</script>
+<script type="text/expected-output">
+body sees: BODY:hello there
+remaining in source: |FOOTER:done
+</script>
+</php-snippet>
+
+<h2 id="pitfalls">Pitfalls</h2>
+
+<aside class="callout pitfall">A producer must call <code>close_writing()</code> when done — otherwise the consumer eventually throws <code>NotEnoughDataException</code> instead of seeing EOF.</aside>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="filesystem.html"><strong>Filesystem</strong></a><span>Back file reads and writes with the same stream primitives.</span></li>
+	<li><a href="zip.html"><strong>Zip</strong></a><span>Read and write archive entries one stream at a time.</span></li>
+	<li><a href="httpclient.html"><strong>HttpClient</strong></a><span>Process request and response bodies incrementally.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/cli.html b/docs/reference/cli.html
new file mode 100644
index 000000000..a42c80a04
--- /dev/null
+++ b/docs/reference/cli.html
@@ -0,0 +1,273 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>CLI — PHP Toolkit reference</title>
+<meta name="description" content="POSIX-style argument parser. Long options, short bundles, inline values, positional args — one static call.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li class="current"><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>CLI</h1>
+
+<p class="lede">POSIX-style argument parser. Long options, short bundles, inline values, positional args — one static call.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/cli</code></pre>
+
+<p>Real CLI tools in PHP usually mean either pulling in <code>symfony/console</code> (and the transitive dependencies that come with it) or hand-rolling argv parsing that breaks the first time someone writes <code>-vvv</code> or <code>--port=8080</code>. The toolkit's <code>CLI</code> class is one static method, no dependencies, and handles the POSIX shapes you actually see.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p>The smallest useful invocation: one boolean flag, one positional. Each option is a four-tuple of <code>[ short, has_value, default, description ]</code>.</p>
+
+<php-snippet blueprint="toolkit-setup" name="parse-flag.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\CLI\CLI;
+
+$option_defs = array(
+	'verbose' => array( 'v', false, false, 'Enable verbose output' ),
+);
+
+list( $positionals, $options ) = CLI::parse_command_args_and_options(
+	array( '-v', 'input.txt' ),
+	$option_defs
+);
+
+echo "verbose: " . ( $options['verbose'] ? 'yes' : 'no' ) . "\n";
+echo "input:   " . $positionals[0] . "\n";
+</script>
+<script type="text/expected-output">
+verbose: yes
+input:   input.txt
+</script>
+</php-snippet>
+
+<h2 id="refinement-mix-values-flags-and-bundles">Refinement: mix values, flags, and bundles</h2>
+
+<p>The parser accepts <code>--port 8080</code>, <code>--port=8080</code>, <code>-p 8080</code>, and <code>-p=8080</code>. It also expands bundled boolean shorts such as <code>-afv</code>.</p>
+
+<php-snippet blueprint="toolkit-setup" name="mix-shapes.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\CLI\CLI;
+
+$option_defs = array(
+	'all'     => array( 'a', false, false, 'Process everything' ),
+	'force'   => array( 'f', false, false, 'Overwrite existing files' ),
+	'verbose' => array( 'v', false, false, 'Verbose output' ),
+	'output'  => array( 'o', true,  null,  'Output path' ),
+	'port'    => array( 'p', true,  '3000', 'Server port' ),
+);
+
+$argv = array( '-afv', '--port=8080', '-o', '/tmp/result.txt', 'input.json' );
+list( $positionals, $options ) = CLI::parse_command_args_and_options( $argv, $option_defs );
+
+echo "input:   " . $positionals[0] . "\n";
+echo "flags:   " . implode( ', ', array_keys( array_filter( array(
+	'all'     => $options['all'],
+	'force'   => $options['force'],
+	'verbose' => $options['verbose'],
+) ) ) ) . "\n";
+echo "output:  " . $options['output'] . "\n";
+echo "port:    " . $options['port'] . "\n";
+</script>
+<script type="text/expected-output">
+input:   input.json
+flags:   all, force, verbose
+output:  /tmp/result.txt
+port:    8080
+</script>
+</php-snippet>
+
+<h2 id="refinement-validate-required-options">Refinement: validate required options</h2>
+
+<p>The parser fills in defaults but never enforces "required". Check for <code>null</code> after parsing, which leaves you in full control of the error message.</p>
+
+<php-snippet blueprint="toolkit-setup" name="require-options.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\CLI\CLI;
+
+$option_defs = array(
+	'site-url'  => array( 'u', true, null, 'Public site URL (required)' ),
+	'site-path' => array( null, true, null, 'Target directory (required)' ),
+);
+
+$argv = array( '--site-url', 'https://mysite.test' );
+
+try {
+	list( , $options ) = CLI::parse_command_args_and_options( $argv, $option_defs );
+	foreach ( array( 'site-url', 'site-path' ) as $name ) {
+		if ( null === $options[ $name ] ) {
+			throw new RuntimeException( "Missing required option --{$name}" );
+		}
+	}
+	echo "All good.\n";
+} catch ( Exception $e ) {
+	echo "error: " . $e->getMessage() . "\n";
+}
+</script>
+<script type="text/expected-output">
+error: Missing required option --site-path
+</script>
+</php-snippet>
+
+<h2 id="refinement-generate---help-from-definitions">Refinement: generate --help from definitions</h2>
+
+<p>Because each option carries its own description, you can render help text by walking the same definitions you parse with. No second source of truth.</p>
+
+<php-snippet blueprint="toolkit-setup" name="help-text.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\CLI\CLI;
+
+$option_defs = array(
+	'output'  => array( 'o', true,  null,  'Write result to FILE' ),
+	'force'   => array( 'f', false, false, 'Overwrite existing files' ),
+	'verbose' => array( 'v', false, false, 'Verbose output' ),
+	'help'    => array( 'h', false, false, 'Show this help and exit' ),
+);
+
+/**
+ * Prints a usage banner followed by one aligned line per option.
+ *
+ * @param array $defs Option definitions keyed by long name. Each value is a
+ *                    [ short, has_value, default, description ] tuple, the
+ *                    same shape passed to the argument parser.
+ */
+function render_help( array $defs ) {
+	echo "Usage: mytool [options] <input>\n\nOptions:\n";
+	foreach ( $defs as $long => $def ) {
+		// The default (third element) is not shown in the help text, so skip it.
+		list( $short, $has_value, , $desc ) = $def;
+		// Options without a short alias get four spaces so the long names line up.
+		$flag = ( $short ? "-{$short}, " : '    ' ) . "--{$long}";
+		if ( $has_value ) {
+			$flag .= '=VALUE';
+		}
+		printf( "  %-28s %s\n", $flag, $desc );
+	}
+}
+
+list( , $options ) = CLI::parse_command_args_and_options( array( '-h' ), $option_defs );
+if ( $options['help'] ) render_help( $option_defs );
+</script>
+<script type="text/expected-output">
+Usage: mytool [options] <input>
+
+Options:
+  -o, --output=VALUE           Write result to FILE
+  -f, --force                  Overwrite existing files
+  -v, --verbose                Verbose output
+  -h, --help                   Show this help and exit
+</script>
+</php-snippet>
+
+<h2 id="refinement-git-style-subcommands">Refinement: git-style subcommands</h2>
+
+<p>To build a tool with subcommands like <code>mytool deploy</code>, peel the first positional off <code>argv</code>, dispatch, and parse the rest with a per-command option set.</p>
+
+<php-snippet blueprint="toolkit-setup" name="subcommands.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\CLI\CLI;
+
+$commands = array(
+	'deploy' => array(
+		'env'     => array( 'e', true, 'staging', 'Target environment' ),
+		'dry-run' => array( 'n', false, false, 'Preview without applying' ),
+	),
+	'rollback' => array(
+		'to' => array( 't', true, null, 'Revision to roll back to' ),
+	),
+);
+
+function run( array $argv, array $commands ) {
+	if ( empty( $argv ) ) {
+		echo "Usage: mytool <command> [options]\nCommands: " . implode( ', ', array_keys( $commands ) ) . "\n";
+		return;
+	}
+	$command = array_shift( $argv );
+	if ( ! isset( $commands[ $command ] ) ) {
+		echo "Unknown command: {$command}\n";
+		return;
+	}
+	list( $positionals, $options ) = CLI::parse_command_args_and_options( $argv, $commands[ $command ] );
+	echo "command={$command}\n";
+	echo "options: " . json_encode( $options ) . "\n";
+	echo "positionals: " . json_encode( $positionals ) . "\n";
+}
+
+run( array( 'deploy', '--env=production', '-n', 'web-01', 'web-02' ), $commands );
+echo "---\n";
+run( array( 'rollback', '-t', 'abc123' ), $commands );
+</script>
+<script type="text/expected-output">
+command=deploy
+options: {"env":"production","dry-run":true}
+positionals: ["web-01","web-02"]
+---
+command=rollback
+options: {"to":"abc123"}
+positionals: []
+</script>
+</php-snippet>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="filesystem.html"><strong>Filesystem</strong></a><span>Keep command behavior testable with in-memory storage.</span></li>
+	<li><a href="blueprints.html"><strong>Blueprints</strong></a><span>Build repeatable site setup commands around parsed options.</span></li>
+	<li><a href="httpserver.html"><strong>HttpServer</strong></a><span>Add a local web UI to a CLI workflow.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/coding-standards.html b/docs/reference/coding-standards.html
new file mode 100644
index 000000000..228ac0bdb
--- /dev/null
+++ b/docs/reference/coding-standards.html
@@ -0,0 +1,90 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>ToolkitCodingStandards — PHP Toolkit reference</title>
+<meta name="description" content="PHP_CodeSniffer sniffs used by this project: enforce Yoda comparisons and ban the short ternary where it hides falsy-value bugs.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li class="current"><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>ToolkitCodingStandards</h1>
+
+<p class="lede">PHP_CodeSniffer sniffs used by this project: enforce Yoda comparisons and ban the short ternary where it hides falsy-value bugs.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/toolkit-coding-standards</code></pre>
+
+<p>This package is not a general-purpose style guide. It holds project-specific PHP_CodeSniffer rules for review comments the toolkit wants automated: comparisons should follow the WordPress Yoda style, and short ternaries should not hide whether a fallback is meant for <code>null</code> only or for all falsy values.</p><p>Use it in this monorepo, or in a project that intentionally wants the same review tradeoffs. If your project does not follow WordPress-style comparisons, the Yoda sniff is probably the wrong rule for you.</p>
+
+<h2 id="reference-the-standard-from-your-phpcsxml">Reference the standard from your phpcs.xml</h2>
+
+<p>The component is a PHPCS ruleset, so the useful examples are configuration and before/after code rather than runtime snippets. Activate both sniffs at once by referencing <code>WordPressToolkitCodingStandards</code> from a <code>&lt;rule ref="WordPressToolkitCodingStandards"/&gt;</code> element in your ruleset.</p><p>Then run <code>phpcs</code> and <code>phpcbf</code> the usual way.</p>
+
+<h2 id="enforceyodacomparison-catches-accidental-assignment">EnforceYodaComparison: catches accidental assignment</h2>
+
+<p>Yoda comparisons (<code>true === $x</code>) make typo-induced assignments easier to catch and match the WordPress style used throughout the toolkit:</p><p>The sniff covers <code>===</code>, <code>!==</code>, <code>==</code>, and <code>!=</code>, and stays quiet when both sides are dynamic.</p>
+
+<h2 id="why-ban-the-short-ternary">Why ban the short ternary</h2>
+
+<p>Developers confuse the short ternary (<code>$a ?: $b</code>) with the null-coalescing operator (<code>$a ?? $b</code>). They differ on falsy-but-not-null values: <code>0 ?: 'fallback'</code> returns <code>'fallback'</code>, but <code>0 ?? 'fallback'</code> returns <code>0</code>. The sniff bans <code>?:</code> entirely so reviewers don't have to relitigate this on every PR.</p>
+
+<h2 id="review-friendly-replacements">Review-friendly replacements</h2>
+
+<p>When the fallback should apply only to <code>null</code>, use <code>??</code>. When the fallback should apply to every falsy value, write the full ternary so the intent is visible in review.</p>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="polyfill.html"><strong>Polyfill</strong></a><span>Share WordPress-style compatibility expectations across standalone packages.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/corsproxy.html b/docs/reference/corsproxy.html
new file mode 100644
index 000000000..517404723
--- /dev/null
+++ b/docs/reference/corsproxy.html
@@ -0,0 +1,160 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>CORSProxy — PHP Toolkit reference</title>
+<meta name="description" content="A small PHP CORS proxy intended for browser-side code that needs to reach servers without CORS headers.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li class="current"><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>CORSProxy</h1>
+
+<p class="lede">A small PHP CORS proxy intended for browser-side code that needs to reach servers without CORS headers.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/corsproxy</code></pre>
+
+<p>A Playground-style browser tool reads <code>https://api.github.com/repos/WordPress/php-toolkit</code>, a plugin ZIP from <code>downloads.wordpress.org</code>, or a raw fixture from GitHub. The browser blocks the response when the upstream server does not send the required CORS headers, even though PHP can fetch the same public URL server-side.</p><p>The CORSProxy component is that server-side bridge. It accepts a target URL, fetches it from PHP, and returns a browser-readable response. Because an open proxy is a security and abuse risk, real deployments should add host allowlists, rate limits, header controls, and private-network protections appropriate to their environment.</p>
+
+<h2 id="run-the-proxy-locally">Run the proxy locally</h2>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p>Drop a <code>cors-proxy-config.php</code> next to <code>cors-proxy.php</code>. If that file defines a <code>playground_cors_proxy_maybe_rate_limit()</code> function, the proxy calls it before forwarding any request — your one chance to reject early. Without the file, the proxy applies its default rate limiter, which is fine for development but should be replaced for any deployment that gets real traffic.</p><p>This example keeps a per-IP sliding-window log of request timestamps on disk. Replace it with Redis or memcached for multi-host deployments.</p>
+
+<php-snippet blueprint="toolkit-setup" name="cors-proxy-config.php" runnable="false">
+<script type="application/x-php">
+<?php
+// cors-proxy-config.php — placed next to cors-proxy.php.
+
+/**
+ * Rejects the request with HTTP 429 once a client exceeds its request quota.
+ *
+ * Keeps a sliding-window log per client IP: a JSON file in the system temp
+ * directory lists the timestamps of that client's requests from the last
+ * $window seconds. The file stays exclusively locked for the whole
+ * read-modify-write cycle so parallel requests from one client cannot
+ * overwrite each other's entries and slip past the limit.
+ */
+function playground_cors_proxy_maybe_rate_limit() {
+	$ip      = isset( $_SERVER['REMOTE_ADDR'] ) ? $_SERVER['REMOTE_ADDR'] : '0.0.0.0';
+	$bucket  = sys_get_temp_dir() . '/cors-rl-' . md5( $ip );
+	$now     = time();
+	$window  = 60;
+	$max_req = 30;
+
+	// 'c+' opens for reading and writing and creates the file when missing,
+	// without truncating it before the lock is held.
+	$handle = fopen( $bucket, 'c+' );
+	if ( false === $handle ) {
+		// Storage is unavailable: let the request through instead of blocking everyone.
+		return;
+	}
+	if ( ! flock( $handle, LOCK_EX ) ) {
+		fclose( $handle );
+		return;
+	}
+
+	$hits = json_decode( (string) stream_get_contents( $handle ), true );
+	if ( ! is_array( $hits ) ) {
+		// Empty or corrupt log: start over.
+		$hits = array();
+	}
+
+	// Keep only the requests that still fall inside the window.
+	$hits = array_filter(
+		$hits,
+		function ( $t ) use ( $now, $window ) {
+			return $t > $now - $window;
+		}
+	);
+
+	$limited = count( $hits ) >= $max_req;
+	if ( ! $limited ) {
+		$hits[] = $now;
+		rewind( $handle );
+		ftruncate( $handle, 0 );
+		fwrite( $handle, json_encode( array_values( $hits ) ) );
+	}
+
+	flock( $handle, LOCK_UN );
+	fclose( $handle );
+
+	if ( $limited ) {
+		header( 'Retry-After: ' . $window );
+		http_response_code( 429 );
+		echo 'Rate limit exceeded';
+		exit;
+	}
+}
+
+echo "Config loaded — rate limiter armed.\n";
+</script>
+</php-snippet>
+
+<h2 id="refinement-allowlist-upstream-hosts">Refinement: allowlist upstream hosts</h2>
+
+<p>Out of the box the proxy will fetch any public URL. Most real deployments want a fixed list of upstreams — GitHub, Packagist, wp.org. Both the rate-limit logic and the allowlist live in the same hook, since <code>cors-proxy.php</code> only calls <code>playground_cors_proxy_maybe_rate_limit()</code> once. The example below shows just the allowlist concern; in practice you stack both in one function inside <code>cors-proxy-config.php</code>.</p>
+
+<php-snippet blueprint="toolkit-setup" name="cors-proxy-config-allowlist.php" runnable="false">
+<script type="application/x-php">
+<?php
+// cors-proxy-config.php — combine with the rate-limit example above.
+
+/**
+ * Rejects requests whose upstream host is not on the allowlist.
+ *
+ * Reads the target URL from PATH_INFO, falling back to the query string,
+ * and answers 403 unless the URL's host matches one of the listed hosts.
+ */
+function playground_cors_proxy_maybe_rate_limit() {
+	$allowed_hosts = array(
+		'api.github.com',
+		'raw.githubusercontent.com',
+		'codeload.github.com',
+		'repo.packagist.org',
+		'downloads.wordpress.org',
+		'api.wordpress.org',
+	);
+
+	if ( isset( $_SERVER['PATH_INFO'] ) ) {
+		$requested = $_SERVER['PATH_INFO'];
+	} elseif ( isset( $_SERVER['QUERY_STRING'] ) ) {
+		$requested = '/' . $_SERVER['QUERY_STRING'];
+	} else {
+		$requested = '/';
+	}
+
+	// Strip the leading slash(es) so what remains parses as the upstream URL.
+	$upstream_host = parse_url( ltrim( $requested, '/' ), PHP_URL_HOST );
+
+	if ( $upstream_host && in_array( strtolower( $upstream_host ), $allowed_hosts, true ) ) {
+		return;
+	}
+
+	http_response_code( 403 );
+	header( 'Content-Type: text/plain' );
+	echo "Upstream not allowed: " . ( $upstream_host ? $upstream_host : '(none)' );
+	exit;
+}
+
+echo "Allowlist config active.\n";
+</script>
+</php-snippet>
+
+<h2 id="browser-side-fetch-through-the-proxy">Browser-side fetch through the proxy</h2>
+
+<p>Once deployed, the client side is just <code>fetch()</code> with the proxy URL. Drop this into any HTML page.</p>
+
+<h2 id="deploy-behind-nginx">Deploy behind nginx</h2>
+
+<p>The proxy is a single PHP script — any SAPI works. nginx + php-fpm is a common production setup. <code>PATH_INFO</code> is what the proxy reads to learn the target URL.</p>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="httpclient.html"><strong>HttpClient</strong></a><span>Fetch upstream responses from PHP when browser CORS blocks direct access.</span></li>
+	<li><a href="httpserver.html"><strong>HttpServer</strong></a><span>Understand the local-server shape before deploying a proxy endpoint.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/dataliberation.html b/docs/reference/dataliberation.html
new file mode 100644
index 000000000..70c0ee2b6
--- /dev/null
+++ b/docs/reference/dataliberation.html
@@ -0,0 +1,316 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>DataLiberation — PHP Toolkit reference</title>
+<meta name="description" content="Streaming WordPress import/export. WXR, SQL, block markup — without loading whole datasets into memory.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li class="current"><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>DataLiberation</h1>
+
+<p class="lede">Streaming WordPress import/export. WXR, SQL, block markup — without loading whole datasets into memory.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/data-liberation</code></pre>
+
+<p>WordPress content should be portable, but real migrations cross several formats. A site export might arrive as WXR, a Markdown folder, or entities from another CMS. URLs can hide in block attributes, HTML, CSS, feeds, GUIDs, and post meta. Importers must also resume after a failed media download or upload.</p><p>The DataLiberation component streams WordPress-shaped data through readers, transformers, and writers. It models posts, terms, comments, attachments, and metadata as <code>ImportEntity</code> objects, then lets a pipeline rewrite each entity without loading the full export into memory.</p><p>The API reflects specific migration bugs: relative URLs in known block attributes, URLs inside inline CSS, self-closing block comments that must keep their shape, and origin-only URLs whose trailing slash style should not change during a rewrite.</p><p>Reach for it when the job combines formats: build WXR from another CMS, rewrite a staging export for production, frontload remote assets, or compose Markdown, XML, HTML, CSS, and URL rewriting into one pipeline.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p>Stream a single post into a WXR document via <code>WXRWriter</code>. The writer holds no buffer beyond what is needed to close currently-open tags, so memory stays flat regardless of input size.</p>
+
+<php-snippet blueprint="toolkit-setup" name="wxr-quickstart.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\DataLiberation\EntityWriter\WXRWriter;
+use WordPress\DataLiberation\ImportEntity;
+
+// The writer streams WXR into an in-memory pipe that is read back at the end.
+$output     = new MemoryPipe();
+$wxr_writer = new WXRWriter( $output );
+
+$post = new ImportEntity(
+	'post',
+	array(
+		'post_title' => 'Hello',
+		'content'    => 'World.',
+		'post_id'    => '1',
+		'status'     => 'publish',
+	)
+);
+$wxr_writer->append_entity( $post );
+
+// Finish the document, then close both ends before reading the result.
+$wxr_writer->finalize();
+$wxr_writer->close_writing();
+$output->close_writing();
+$document = $output->consume_all();
+
+$has_title  = false !== strpos( $document, '<title>Hello</title>' );
+$has_status = false !== strpos( $document, '<wp:status>publish</wp:status>' );
+
+printf( "bytes: %d\n", strlen( $document ) );
+echo $has_title ? "title exported\n" : "title missing\n";
+echo $has_status ? "status exported\n" : "status missing\n";
+</script>
+<script type="text/expected-output">
+bytes: 475
+title exported
+status exported
+</script>
+</php-snippet>
+
+<h2 id="refinement-build-a-wxr-programmatically-from-any-source">Refinement: build a WXR programmatically from any source</h2>
+
+<p>The writer doesn't care where entities come from. Loop over rows from a CMS, a CSV, or a Notion API dump and emit posts plus their meta and comments.</p>
+
+<php-snippet blueprint="toolkit-setup" name="build-wxr.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\DataLiberation\EntityWriter\WXRWriter;
+use WordPress\DataLiberation\ImportEntity;
+
+// Stand-in for rows pulled from another CMS, a CSV file, or an API dump.
+$source_rows = array(
+	array( 'id' => 10, 'title' => 'About', 'body' => '<p>About us.</p>', 'tags' => array( 'company' ) ),
+	array( 'id' => 11, 'title' => 'Blog',  'body' => '<p>Hello world.</p>', 'tags' => array( 'news', 'launch' ) ),
+);
+
+$output     = new MemoryPipe();
+$wxr_writer = new WXRWriter( $output );
+
+foreach ( $source_rows as $source_row ) {
+	$post = new ImportEntity(
+		'post',
+		array(
+			'post_id'    => (string) $source_row['id'],
+			'post_title' => $source_row['title'],
+			'content'    => $source_row['body'],
+			'status'     => 'publish',
+			'post_type'  => 'post',
+		)
+	);
+	$wxr_writer->append_entity( $post );
+
+	// Term IDs are derived from the post ID and the tag's position in the row.
+	$first_term_id = $source_row['id'] * 100;
+	foreach ( $source_row['tags'] as $position => $slug ) {
+		$term = new ImportEntity(
+			'term',
+			array(
+				'term_id'  => (string) ( $first_term_id + $position ),
+				'taxonomy' => 'post_tag',
+				'slug'     => $slug,
+				'parent'   => '0',
+			)
+		);
+		$wxr_writer->append_entity( $term );
+	}
+}
+
+$wxr_writer->finalize();
+$wxr_writer->close_writing();
+$output->close_writing();
+
+$document = $output->consume_all();
+$has_blog = false !== strpos( $document, '<title>Blog</title>' );
+
+printf( "items: %d\n", substr_count( $document, '<item>' ) );
+printf( "terms: %d\n", substr_count( $document, '<wp:term>' ) );
+echo $has_blog ? "Blog post exported\n" : "Blog post missing\n";
+</script>
+<script type="text/expected-output">
+items: 2
+terms: 3
+Blog post exported
+</script>
+</php-snippet>
+
+<h2 id="refinement-read-entities-from-a-wxr-file-with-constant-memory">Refinement: read entities from a WXR file with constant memory</h2>
+
+<p><code>WXREntityReader</code> emits one entity at a time. A 10 GB WXR uses the same memory as a 10 KB one.</p>
+
+<php-snippet blueprint="toolkit-setup" name="wxr-read.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\DataLiberation\EntityReader\WXREntityReader;
+
+// A tiny WXR document: a channel title plus two posts.
+$document = <<<XML
+<?xml version="1.0" encoding="UTF-8" ?>
+<rss version="2.0" xmlns:wp="http://wordpress.org/export/1.2/" xmlns:content="http://purl.org/rss/1.0/modules/content/">
+<channel>
+<title>Demo</title>
+<item><title>First</title><wp:post_id>1</wp:post_id><wp:post_type>post</wp:post_type><content:encoded>Body 1</content:encoded></item>
+<item><title>Second</title><wp:post_id>2</wp:post_id><wp:post_type>post</wp:post_type><content:encoded>Body 2</content:encoded></item>
+</channel>
+</rss>
+XML;
+
+// Feed the bytes in, then signal that no more input will arrive.
+$entity_reader = WXREntityReader::create();
+$entity_reader->append_bytes( $document );
+$entity_reader->input_finished();
+
+// Print each entity as "<type>: <data as JSON>".
+while ( $entity_reader->next_entity() ) {
+	$current = $entity_reader->get_entity();
+	$type    = $current->get_type();
+	$payload = json_encode( $current->get_data() );
+	echo $type . ': ' . $payload . "\n";
+}
+</script>
+<script type="text/expected-output">
+site_option: {"option_name":"blogname","option_value":"Demo"}
+post: {"post_title":"First","post_id":"1","post_type":"post","post_content":"Body 1"}
+post: {"post_title":"Second","post_id":"2","post_type":"post","post_content":"Body 2"}
+</script>
+</php-snippet>
+
+<h2 id="refinement-streaming-transform-rewrite-urls-while-copying-wxr">Refinement: streaming transform: rewrite URLs while copying WXR</h2>
+
+<p>Wire reader to writer to rewrite a WXR file on the fly. This pattern is how you migrate a staging export to production: swap <code>staging.example.com</code> for <code>example.com</code> without ever loading the file into memory.</p>
+
+<php-snippet blueprint="toolkit-setup" name="rewrite-urls.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\DataLiberation\EntityReader\WXREntityReader;
+use WordPress\DataLiberation\EntityWriter\WXRWriter;
+use WordPress\DataLiberation\ImportEntity;
+
+// A staging export whose post body links to the staging host.
+$staging_export = <<<XML
+<?xml version="1.0" encoding="UTF-8" ?>
+<rss version="2.0" xmlns:wp="http://wordpress.org/export/1.2/" xmlns:content="http://purl.org/rss/1.0/modules/content/">
+<channel>
+<item><title>Hello</title><wp:post_id>1</wp:post_id><wp:post_type>post</wp:post_type>
+<content:encoded>Visit https://staging.example.com/about for more.</content:encoded></item>
+</channel>
+</rss>
+XML;
+
+$entity_reader = WXREntityReader::create();
+$entity_reader->append_bytes( $staging_export );
+$entity_reader->input_finished();
+
+$production_pipe = new MemoryPipe();
+$wxr_writer      = new WXRWriter( $production_pipe );
+
+// Entity fields that may carry URLs pointing at the staging host.
+$url_fields = array( 'post_content', 'content', 'description' );
+
+while ( $entity_reader->next_entity() ) {
+	$current = $entity_reader->get_entity();
+	$type    = $current->get_type();
+	$fields  = $current->get_data();
+
+	foreach ( $url_fields as $name ) {
+		if ( ! isset( $fields[ $name ] ) ) {
+			continue;
+		}
+		$fields[ $name ] = str_replace( 'staging.example.com', 'example.com', $fields[ $name ] );
+	}
+
+	// Posts are written from the 'content' key: copy 'post_content' into it,
+	// and default it to an empty string when neither key is set.
+	if ( 'post' === $type ) {
+		if ( isset( $fields['post_content'] ) ) {
+			$fields['content'] = $fields['post_content'];
+		} elseif ( ! isset( $fields['content'] ) ) {
+			$fields['content'] = '';
+		}
+	}
+
+	$wxr_writer->append_entity( new ImportEntity( $type, $fields ) );
+}
+
+$wxr_writer->finalize();
+$wxr_writer->close_writing();
+$production_pipe->close_writing();
+
+$rewritten   = $production_pipe->consume_all();
+$has_new_url = false !== strpos( $rewritten, 'https://example.com/about' );
+$has_old_url = false !== strpos( $rewritten, 'staging.example.com' );
+
+echo $has_new_url ? "new URL present\n" : "new URL missing\n";
+echo $has_old_url ? "old URL still present\n" : "old URL removed\n";
+</script>
+<script type="text/expected-output">
+new URL present
+old URL removed
+</script>
+</php-snippet>
+
+<h2 id="refinement-render-markdown-into-a-wxr-import-in-one-pipeline">Refinement: render Markdown into a WXR import in one pipeline</h2>
+
+<p>Compose <code>MarkdownConsumer</code> with <code>WXRWriter</code> to publish a folder of Markdown directly as a WordPress import file.</p>
+
+<php-snippet blueprint="toolkit-setup" name="md-to-wxr.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\DataLiberation\EntityWriter\WXRWriter;
+use WordPress\DataLiberation\ImportEntity;
+use WordPress\Markdown\MarkdownConsumer;
+
+// Create two Markdown source files with a frontmatter title each.
+if ( ! is_dir( '/tmp/md-src' ) ) {
+	mkdir( '/tmp/md-src', 0777, true );
+}
+file_put_contents( '/tmp/md-src/hello.md',  "---\ntitle: Hello\n---\n\n# Hello\n\nFirst post." );
+file_put_contents( '/tmp/md-src/second.md', "---\ntitle: Second\n---\n\nMore text **here**." );
+
+$pipe   = new MemoryPipe();
+$writer = new WXRWriter( $pipe );
+
+$id = 1;
+foreach ( glob( '/tmp/md-src/*.md' ) as $path ) {
+	$consumer = new MarkdownConsumer( file_get_contents( $path ) );
+	$consumer->consume();
+
+	// Fall back to the file name for any falsy title. The full ternary is
+	// used instead of `?:` so the "every falsy value" intent stays explicit.
+	$slug  = basename( $path, '.md' );
+	$title = $consumer->get_meta_value( 'title' );
+
+	$writer->append_entity( new ImportEntity( 'post', array(
+		'post_id'    => (string) $id++,
+		'post_title' => $title ? $title : $slug,
+		'content'    => $consumer->get_block_markup(),
+		'status'     => 'publish',
+		'post_type'  => 'post',
+		'post_name'  => $slug,
+	) ) );
+}
+
+$writer->finalize();
+$writer->close_writing();
+$pipe->close_writing();
+
+$wxr = $pipe->consume_all();
+echo "posts: " . substr_count( $wxr, '<item>' ) . "\n";
+// Block markup is entity-escaped in this snippet's source, hence `&lt;`.
+echo false !== strpos( $wxr, '&lt;!-- wp:heading' ) ? "block markup exported\n" : "block markup missing\n";
+echo false !== strpos( $wxr, '<title>Second</title>' ) ? "frontmatter title exported\n" : "frontmatter title missing\n";
+</script>
+<script type="text/expected-output">
+posts: 2
+block markup exported
+frontmatter title exported
+</script>
+</php-snippet>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="markdown.html"><strong>Markdown</strong></a><span>Use Markdown as a source or destination format.</span></li>
+	<li><a href="blockparser.html"><strong>BlockParser</strong></a><span>Analyze serialized blocks inside post content.</span></li>
+	<li><a href="httpclient.html"><strong>HttpClient</strong></a><span>Download media and remote source data while importing.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/encoding.html b/docs/reference/encoding.html
new file mode 100644
index 000000000..aaea5042e
--- /dev/null
+++ b/docs/reference/encoding.html
@@ -0,0 +1,233 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Encoding — PHP Toolkit reference</title>
+<meta name="description" content="UTF-8 validation and scrubbing with a pure-PHP fallback when mbstring is unavailable. Detects malformed bytes and replaces them per the Unicode maximal-subpart algorithm.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li class="current"><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>Encoding</h1>
+
+<p class="lede">UTF-8 validation and scrubbing with a pure-PHP fallback when <code>mbstring</code> is unavailable. Detects malformed bytes and replaces them per the Unicode maximal-subpart algorithm.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/encoding</code></pre>
+
+<p>Every parser in this toolkit eventually has to decide what to do with text bytes. XML rejects malformed UTF-8. JSON and databases can fail late. CSS, HTML, WXR, and Blueprint validation all need consistent answers about whether a string is well-formed Unicode.</p><p>The Encoding component provides the small UTF-8 primitives the rest of the toolkit can share: validate bytes, scrub invalid sequences, scan code points, and detect Unicode noncharacters. When <code>mbstring</code> is available it can delegate to it; when it is not, the component uses its own byte scanner so behavior stays available in restricted PHP environments.</p><p>Historically, this became the common foundation for Blueprint validation and CSS/XML processing, replacing ad hoc Unicode helpers with the WordPress core UTF-8 routines used here.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p><code>wp_is_valid_utf8()</code> rejects overlong sequences, surrogate halves, and stray ISO-8859-1 bytes. Use it as a guard in front of any code path that assumes UTF-8 (database, JSON, XML).</p>
+
+<php-snippet blueprint="toolkit-setup" name="validate.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Encoding\wp_is_valid_utf8;
+
+// Byte strings covering plain ASCII, valid multi-byte UTF-8, and three
+// kinds of ill-formed input.
+$samples = array(
+	'ASCII'          => 'just a test',
+	'UTF-8 pencil'   => "\xE2\x9C\x8F",
+	'latin-1 byte'   => "B\xFCch",
+	// "/" is U+002F; its overlong two-byte form is C0 AF.
+	'overlong slash' => "\xC0\xAF",
+	'surrogate half' => "\xED\xB0\x80",
+);
+
+foreach ( $samples as $label => $bytes ) {
+	echo sprintf( "%-14s %s\n", $label . ':', wp_is_valid_utf8( $bytes ) ? 'valid' : 'invalid' );
+}
+</script>
+<script type="text/expected-output">
+ASCII:         valid
+UTF-8 pencil:  valid
+latin-1 byte:  invalid
+overlong slash: invalid
+surrogate half: invalid
+</script>
+</php-snippet>
+
+<h2 id="refinement-scrubbing-invalid-bytes-with-ufffd">Refinement: scrubbing invalid bytes with U+FFFD</h2>
+
+<p>Replace each ill-formed sequence with the Unicode replacement character. Useful right before serializing to XML, JSON, or sending to an LLM that will choke on broken bytes.</p>
+
+<php-snippet blueprint="toolkit-setup" name="scrub.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Encoding\wp_scrub_utf8;
+
+// Inputs containing bytes that do not form complete UTF-8 sequences.
+$broken_inputs = array(
+	"the byte \xC0 should not be here.",
+	".\xE2\x8C\xE2\x8C.",
+);
+
+foreach ( $broken_inputs as $broken_input ) {
+	echo wp_scrub_utf8( $broken_input ), "\n";
+}
+</script>
+<script type="text/expected-output">
+the byte � should not be here.
+.��.
+</script>
+</php-snippet>
+
+<h2 id="refinement-detecting-noncharacters-mysqlutf8mb4-will-reject">Refinement: detecting noncharacters MySQL/utf8mb4 will reject</h2>
+
+<p>Code points like U+FFFE, U+FFFF, and the U+FDD0–U+FDEF block are valid Unicode but forbidden or discouraged in XML and rejected by some databases. Check before inserting user-submitted content into a strict <code>utf8mb4</code> column.</p>
+
+<php-snippet blueprint="toolkit-setup" name="noncharacters.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Encoding\wp_has_noncharacters;
+
+// One clean string and two strings that each embed a Unicode noncharacter.
+$candidates = array(
+	'normal text' => 'normal text',
+	'U+FFFE'      => "oops \u{FFFE}",
+	'U+FDD0'      => "hi \u{FDD0} bye",
+);
+
+foreach ( $candidates as $name => $candidate ) {
+	$verdict = wp_has_noncharacters( $candidate ) ? 'reject' : 'ok';
+	printf( "%-12s %s\n", $name . ':', $verdict );
+}
+</script>
+<script type="text/expected-output">
+normal text: ok
+U+FFFE:      reject
+U+FDD0:      reject
+</script>
+</php-snippet>
+
+<h2 id="refinement-three-way-pipeline-validate-scrub-then-check-noncharacters">Refinement: three-way pipeline: validate, scrub, then check noncharacters</h2>
+
+<p>Real-world inputs are messy: an old WXR export, a CSV with mixed encodings, a paste from Word. Combining validation, scrubbing, and a noncharacter check covers the three classes of breakage that bite later.</p>
+
+<php-snippet blueprint="toolkit-setup" name="pipeline.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Encoding\wp_is_valid_utf8;
+use function WordPress\Encoding\wp_scrub_utf8;
+use function WordPress\Encoding\wp_has_noncharacters;
+
+// One well-formed string plus one example of each class of breakage.
+$cases = array(
+	'good'      => 'Café',
+	'latin1'    => "caf\xE9",
+	'overlong'  => "x\xC1\xBFy",
+	'noncharac' => "hi \u{FFFE} there",
+);
+
+foreach ( $cases as $name => $raw ) {
+	// Validate the raw bytes, then scrub, then inspect the scrubbed text.
+	$valid_flag   = wp_is_valid_utf8( $raw ) ? 'Y' : 'N';
+	$scrubbed     = wp_scrub_utf8( $raw );
+	$nonchar_flag = wp_has_noncharacters( $scrubbed ) ? 'Y' : 'N';
+
+	printf( "%-10s valid=%s noncharacter=%s -> %s\n", $name, $valid_flag, $nonchar_flag, $scrubbed );
+}
+</script>
+<script type="text/expected-output">
+good       valid=Y noncharacter=N -> Café
+latin1     valid=N noncharacter=N -> caf�
+overlong   valid=N noncharacter=N -> x��y
+noncharac  valid=Y noncharacter=Y -> hi ￾ there
+</script>
+</php-snippet>
+
+<h2 id="refinement-salvaging-a-legacy-iso-8859-1-column-inside-a-utf-8-corpus">Refinement: salvaging a legacy ISO-8859-1 column inside a UTF-8 corpus</h2>
+
+<p>Old WordPress databases sometimes mix encodings: most rows are UTF-8 but a few were stored as latin-1. Detect the bad rows with <code>wp_is_valid_utf8()</code> and only re-encode those.</p>
+
+<php-snippet blueprint="toolkit-setup" name="mixed-encoding.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Encoding\wp_is_valid_utf8;
+use function WordPress\Encoding\wp_scrub_utf8;
+
+// Rows keyed by ID: two are valid UTF-8, two contain bytes that are not.
+$rows = array(
+	1 => 'Plain ASCII',
+	2 => 'Café',
+	3 => "caf\xE9",
+	4 => "weird \xC0 byte",
+);
+
+foreach ( $rows as $id => $value ) {
+	if ( ! wp_is_valid_utf8( $value ) ) {
+		// Reinterpret the bytes as ISO-8859-1; scrub only if that fails
+		// or still does not produce valid UTF-8.
+		$converted = @iconv( 'ISO-8859-1', 'UTF-8', $value );
+		if ( false === $converted || ! wp_is_valid_utf8( $converted ) ) {
+			echo "#$id unrecoverable, scrubbing: " . wp_scrub_utf8( $value ) . "\n";
+		} else {
+			echo "#$id recovered as latin1: $converted\n";
+		}
+		continue;
+	}
+
+	echo "#$id ok: $value\n";
+}
+</script>
+<script type="text/expected-output">
+#1 ok: Plain ASCII
+#2 ok: Café
+#3 recovered as latin1: café
+#4 recovered as latin1: weird À byte
+</script>
+</php-snippet>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="html.html"><strong>HTML</strong></a><span>Normalize incoming text before HTML tokenization.</span></li>
+	<li><a href="xml.html"><strong>XML</strong></a><span>Keep invalid bytes out of XML streams.</span></li>
+	<li><a href="dataliberation.html"><strong>DataLiberation</strong></a><span>Clean content before importing it into WordPress.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/filesystem.html b/docs/reference/filesystem.html
new file mode 100644
index 000000000..22ae72421
--- /dev/null
+++ b/docs/reference/filesystem.html
@@ -0,0 +1,291 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Filesystem — PHP Toolkit reference</title>
+<meta name="description" content="One Filesystem interface across local disk, in-memory trees, SQLite databases, and ZIP archives. Forward-slash paths everywhere — even on Windows — so the same code runs in tests, in production, and inside read-only ZIPs.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li class="current"><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>Filesystem</h1>
+
+<p class="lede">One <code>Filesystem</code> interface across local disk, in-memory trees, SQLite databases, and ZIP archives. Forward-slash paths everywhere — even on Windows — so the same code runs in tests, in production, and inside read-only ZIPs.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/filesystem</code></pre>
+
+<p>Code that touches the filesystem is hard to test, hard to port to Windows, and impossible to point at non-disk storage without rewriting it. Swap <code>LocalFilesystem</code> for <code>InMemoryFilesystem</code> in tests and your suite stops touching <code>/tmp</code>; swap it for <code>SQLiteFilesystem</code> and your "files" become rows in a portable database; swap it for <code>ZipFilesystem</code> and you can read inside an archive with the same calls.</p><p>Every backend uses forward slashes regardless of host OS. No <code>DIRECTORY_SEPARATOR</code> juggling, no Windows-only test failures, no surprises when a path moves between backends.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p><code>InMemoryFilesystem</code> is the fastest backend: no disk I/O, no cleanup, no test-isolation problems.</p>
+
+<php-snippet blueprint="toolkit-setup" name="teaser-memory.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+
+$fs = InMemoryFilesystem::create();
+$fs->put_contents( '/hello.txt', 'Hello, world!' );
+echo $fs->get_contents( '/hello.txt' );
+</script>
+<script type="text/expected-output">
+Hello, world!
+</script>
+</php-snippet>
+
+<h2 id="refinement-test-code-without-touching-disk">Refinement: test code without touching disk</h2>
+
+<p>Code that takes a <code>Filesystem</code> parameter, instead of calling <code>file_get_contents()</code> directly, can be tested against an <code>InMemoryFilesystem</code>. The test sets up files in memory, exercises the function, and asserts on what got written — no temp directories, no cleanup.</p>
+
+<php-snippet blueprint="toolkit-setup" name="test-without-disk.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\Filesystem;
+use WordPress\Filesystem\InMemoryFilesystem;
+
+function bump_version( Filesystem $fs, $path ) { // Reads the JSON file at $path, adds 1 to the third part of its 'version' string, and writes the JSON back.
+	$json = json_decode( $fs->get_contents( $path ), true ); // true: decode JSON objects as associative arrays.
+	list( $maj, $min, $patch ) = explode( '.', $json['version'] ); // Takes the first three dot-separated parts.
+	$json['version'] = $maj . '.' . $min . '.' . ( (int) $patch + 1 ); // Only the third part is incremented.
+	$fs->put_contents( $path, json_encode( $json ) ); // Overwrites the same path through the injected filesystem.
+}
+
+$fs = InMemoryFilesystem::create();
+$fs->put_contents( '/package.json', '{"version":"1.2.3"}' );
+bump_version( $fs, '/package.json' );
+
+echo $fs->get_contents( '/package.json' ) . "\n";
+</script>
+<script type="text/expected-output">
+{"version":"1.2.4"}
+</script>
+</php-snippet>
+
+<h2 id="refinement-local-disk-with-a-chrooted-root">Refinement: local disk with a chrooted root</h2>
+
+<p><code>LocalFilesystem::create($root)</code> is implicitly chrooted: every path resolves relative to <code>$root</code> and a <code>../</code> cannot escape. Reach for it when a request path or CLI argument names a file inside one project directory.</p>
+
+<php-snippet blueprint="toolkit-setup" name="local-chroot.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\LocalFilesystem;
+
+$root = sys_get_temp_dir() . '/toolkit-' . uniqid();
+$fs   = LocalFilesystem::create( $root );
+
+$fs->mkdir( '/uploads', array( 'recursive' => true ) );
+$fs->put_contents( '/uploads/note.txt', 'Hi from local disk.' );
+
+echo $fs->get_contents( '/uploads/../uploads/note.txt' ) . "\n";
+
+$fs->rmdir( '/', array( 'recursive' => true ) );
+echo "exists after cleanup? " . ( is_dir( $root ) ? 'yes' : 'no' ) . "\n";
+</script>
+<script type="text/expected-output">
+Hi from local disk.
+exists after cleanup? no
+</script>
+</php-snippet>
+
+<h2 id="refinement-sqlite-as-a-portable-file-store">Refinement: SQLite as a portable file store</h2>
+
+<p>The whole tree lives in one SQLite database file. Use it for self-contained scratch storage that survives process boundaries without leaving loose files behind.</p>
+
+<php-snippet blueprint="toolkit-setup" name="sqlite.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\SQLiteFilesystem;
+
+$fs = SQLiteFilesystem::create( ':memory:' );
+$fs->mkdir( '/posts', array( 'recursive' => true ) );
+for ( $i = 1; $i <= 3; $i++ ) {
+	$fs->put_contents( "/posts/post-{$i}.md", "# Post {$i}\n\nBody {$i}." );
+}
+
+foreach ( $fs->ls( '/posts' ) as $name ) {
+	$first = strtok( $fs->get_contents( '/posts/' . $name ), "\n" );
+	echo "{$name}: {$first}\n";
+}
+</script>
+<script type="text/expected-output">
+post-1.md: # Post 1
+post-2.md: # Post 2
+post-3.md: # Post 3
+</script>
+</php-snippet>
+
+<h2 id="refinement-copy-a-tree-across-backends">Refinement: copy a tree across backends</h2>
+
+<p>The killer composability move: <code>copy_between_filesystems()</code> streams files chunk-by-chunk from any source to any target. Pull a ZIP into SQLite, snapshot SQLite to disk, mirror disk into RAM — all the same call.</p>
+
+<php-snippet blueprint="toolkit-setup" name="cross-backend-copy.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Filesystem\LocalFilesystem;
+use WordPress\Filesystem\SQLiteFilesystem;
+use function WordPress\Filesystem\copy_between_filesystems;
+
+$root  = sys_get_temp_dir() . '/copytree-' . uniqid();
+$local = LocalFilesystem::create( $root );
+$local->mkdir( '/site/posts', array( 'recursive' => true ) );
+$local->put_contents( '/site/posts/2024-01.md', '# Hello 2024' );
+$local->put_contents( '/site/index.html', '<h1>Home</h1>' );
+
+$sqlite = SQLiteFilesystem::create( ':memory:' );
+copy_between_filesystems( array(
+	'source_filesystem' => $local,
+	'source_path'       => '/site',
+	'target_filesystem' => $sqlite,
+	'target_path'       => '/snapshot',
+) );
+
+$mem = InMemoryFilesystem::create();
+copy_between_filesystems( array(
+	'source_filesystem' => $sqlite,
+	'source_path'       => '/snapshot',
+	'target_filesystem' => $mem,
+	'target_path'       => '/copy',
+) );
+
+echo "in memory after two copies:\n";
+echo "  posts: " . implode( ', ', $mem->ls( '/copy/posts' ) ) . "\n";
+echo "  index: " . $mem->get_contents( '/copy/index.html' ) . "\n";
+
+$local->rmdir( '/', array( 'recursive' => true ) );
+</script>
+<script type="text/expected-output">
+in memory after two copies:
+  posts: 2024-01.md
+  index: <h1>Home</h1>
+</script>
+</php-snippet>
+
+<h2 id="refinement-atomic-write-via-tempfile-rename">Refinement: atomic write via tempfile rename</h2>
+
+<p>Write to a sibling tempfile, then rename — that's how you avoid leaving a half-written file on crash. <code>rename()</code> is atomic within a single filesystem.</p>
+
+<php-snippet blueprint="toolkit-setup" name="atomic-write.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\Filesystem;
+use WordPress\Filesystem\LocalFilesystem;
+
+function atomic_put_contents( Filesystem $fs, $path, $bytes ) { // Writes $bytes to a temp file named after $path, then renames it onto $path.
+	$tmp = $path . '.tmp.' . bin2hex( random_bytes( 4 ) ); // bin2hex of 4 random bytes gives an 8-character hex suffix.
+	$fs->put_contents( $tmp, $bytes ); // The full payload lands in the temp file first.
+	$fs->rename( $tmp, $path ); // The target path is only touched by this final rename.
+}
+
+$root = sys_get_temp_dir() . '/atomic-' . uniqid();
+$fs   = LocalFilesystem::create( $root );
+
+$fs->put_contents( '/config.json', '{"v":1}' );
+atomic_put_contents( $fs, '/config.json', '{"v":2}' );
+
+echo "config: " . $fs->get_contents( '/config.json' ) . "\n";
+echo "no .tmp leftovers: " . count( $fs->ls( '/' ) ) . " entries in root\n";
+
+$fs->rmdir( '/', array( 'recursive' => true ) );
+</script>
+<script type="text/expected-output">
+config: {"v":2}
+no .tmp leftovers: 1 entries in root
+</script>
+</php-snippet>
+
+<h2 id="refinement-path-helpers-that-behave-the-same-on-windows">Refinement: path helpers that behave the same on Windows</h2>
+
+<p>Unix path semantics apply on every host OS. This matters for abstract paths such as a SQLite key or a ZIP entry name because those paths do not live on a real drive.</p>
+
+<php-snippet blueprint="toolkit-setup" name="path-helpers.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use function WordPress\Filesystem\wp_join_unix_paths;
+use function WordPress\Filesystem\wp_unix_dirname;
+use function WordPress\Filesystem\wp_unix_path_resolve_dots;
+
+echo wp_join_unix_paths( '/var/www', '/site/', '/index.php' ) . "\n";
+echo wp_unix_dirname( '/a/b/c/d.txt', 2 ) . "\n";
+echo wp_unix_path_resolve_dots( '/a/b/../c/./d/../e' ) . "\n";
+</script>
+<script type="text/expected-output">
+/var/www/site/index.php
+/a/b
+a/c/e
+</script>
+</php-snippet>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="bytestream.html"><strong>ByteStream</strong></a><span>Open files as readers and writers instead of loading full strings.</span></li>
+	<li><a href="zip.html"><strong>Zip</strong></a><span>Mount archives and copy data between archive-backed and normal filesystems.</span></li>
+	<li><a href="git.html"><strong>Git</strong></a><span>Expose repository trees through a filesystem-shaped API.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/git.html b/docs/reference/git.html
new file mode 100644
index 000000000..4508e7b05
--- /dev/null
+++ b/docs/reference/git.html
@@ -0,0 +1,304 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Git — PHP Toolkit reference</title>
+<meta name="description" content="A pure-PHP Git client and server. Commits, branches, diffs, HTTP push/pull — all without shelling out to git.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li class="current"><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>Git</h1>
+
+<p class="lede">A pure-PHP Git client and server. Commits, branches, diffs, HTTP push/pull — all without shelling out to <code>git</code>.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/git</code></pre>
+
+<p>Git is a useful storage model even when a server cannot run the <code>git</code> binary: snapshots, branches, object-addressed files, diffs, merges, and sync over HTTP. That matters for WordPress tools that want revision history for generated files, content snapshots, site state, or collaborative edits in constrained runtimes.</p><p>The Git component implements the core repository operations in PHP and stores objects through the toolkit <code>Filesystem</code> interface. That means the same repository can live on disk, in memory, or in another backend, and higher-level code can commit files without knowing where objects are stored.</p><p>The docs start with simple commits because that mental model scales: a repository is just objects plus refs. From there, branches, history walking, root commits, and merges become details you can reason about instead of magic shell behavior.</p><p>Choose it for tests, browser-like sandboxes, hosted WordPress environments, and applications that need Git behavior through PHP APIs instead of shell commands.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p>The simplest possible repository: an <code>InMemoryFilesystem</code> as object storage and one <code>commit()</code> call. Reach for this in tests, in WP-CLI snapshots, or any place you want versioning without touching disk.</p>
+
+<php-snippet blueprint="toolkit-setup" name="commit-in-memory.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitRepository;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+
+$oid = $repo->commit( array(
+	'updates' => array(
+		'README.md'           => "# My Project\n",
+		'src/hello-world.php' => '<?php echo "Hello!";',
+	),
+) );
+
+echo "commit: {$oid}\n";
+echo "HEAD:   " . $repo->get_branch_tip( 'HEAD' ) . "\n";
+echo "README: " . $repo->read_object_by_path( '/README.md' )->consume_all();
+</script>
+<script type="text/expected-output">
+commit: <oid>
+HEAD:   <oid>
+README: # My Project
+</script>
+</php-snippet>
+
+<h2 id="refinement-walk-the-commit-history">Refinement: walk the commit history</h2>
+
+<p>Follow the parent chain from <code>HEAD</code> backwards. This is a building block for a WP-CLI "post revisions" log or a "what changed since release X" report.</p>
+
+<php-snippet blueprint="toolkit-setup" name="walk-history.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitRepository;
+use WordPress\Git\Model\Commit;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+foreach ( array( 'add intro', 'fix typo', 'expand examples' ) as $i => $msg ) {
+	$repo->commit( array(
+		'updates' => array( 'post.md' => "# Draft {$i}" ),
+		'commit'  => array( 'message' => $msg ),
+	) );
+}
+
+$oid = $repo->get_branch_tip( 'HEAD' );
+while ( ! Commit::is_null_hash( $oid ) ) {
+	$c = $repo->read_object( $oid )->as_commit();
+	echo substr( $c->hash, 0, 7 ) . '  ' . trim( $c->message ) . "\n";
+	$oid = $c->get_first_parent_hash();
+	if ( ! $oid || ! $repo->has_object( $oid ) ) break;
+}
+</script>
+<script type="text/expected-output">
+<hash>  expand examples
+<hash>  fix typo
+<hash>  add intro
+</script>
+</php-snippet>
+
+<h2 id="refinement-treat-a-repository-like-a-filesystem">Refinement: treat a repository like a filesystem</h2>
+
+<p><code>GitFilesystem</code> wraps a repository in this toolkit's <code>Filesystem</code> interface. With the default options, each <code>put_contents()</code> records a new commit.</p>
+
+<php-snippet blueprint="toolkit-setup" name="git-filesystem.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitFilesystem;
+use WordPress\Git\GitRepository;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+$fs   = GitFilesystem::create( $repo );
+
+$fs->put_contents( '/posts/hello.md', "# Hello\nFirst draft." );
+$fs->put_contents( '/posts/about.md', "# About\nWho we are." );
+$fs->put_contents( '/posts/hello.md', "# Hello\nSecond draft." );
+
+echo "tree:\n";
+foreach ( $fs->ls( '/posts' ) as $name ) {
+	echo "  /posts/{$name}\n";
+}
+echo "\nhello.md now:\n" . $fs->get_contents( '/posts/hello.md' ) . "\n";
+</script>
+<script type="text/expected-output">
+tree:
+  /posts/about.md
+  /posts/hello.md
+
+hello.md now:
+# Hello
+Second draft.
+</script>
+</php-snippet>
+
+<h2 id="refinement-branch-edit-and-switch-back">Refinement: branch, edit, and switch back</h2>
+
+<p>Create a feature branch off the current commit, change files, flip <code>HEAD</code> back. Useful for experimental edits in collaborative tools.</p>
+
+<php-snippet blueprint="toolkit-setup" name="branches.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitRepository;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+$base = $repo->commit( array(
+	'updates' => array( 'config.json' => '{"flag":false}' ),
+	'commit'  => array( 'message' => 'baseline' ),
+) );
+
+$repo->create_branch( 'refs/heads/experiment', $base );
+$repo->checkout( 'refs/heads/experiment' );
+$repo->commit( array(
+	'updates' => array( 'config.json' => '{"flag":true}' ),
+	'commit'  => array( 'message' => 'flip the flag' ),
+) );
+
+echo "on experiment: " . $repo->read_object_by_path( '/config.json' )->consume_all() . "\n";
+
+$repo->checkout( 'refs/heads/trunk' );
+echo "on trunk:      " . $repo->read_object_by_path( '/config.json' )->consume_all() . "\n";
+</script>
+<script type="text/expected-output">
+on experiment: {"flag":true}
+on trunk:      {"flag":false}
+</script>
+</php-snippet>
+
+<h2 id="refinement-three-way-merge-two-branches">Refinement: three-way merge two branches</h2>
+
+<p>The classic Git workflow: branch off, edit on each side, merge. <code>$repo->merge()</code> finds the common ancestor, three-way-merges every file, and creates a merge commit.</p>
+
+<php-snippet blueprint="toolkit-setup" name="merge-branches.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitRepository;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+$base = $repo->commit( array( 'updates' => array(
+	'todo.txt' => "buy milk\nwalk dog\nread book\n",
+) ) );
+
+$repo->commit( array( 'updates' => array(
+	'todo.txt' => "buy oat milk\nwalk dog\nread book\n",
+) ) );
+
+$repo->create_branch( 'refs/heads/feature', $base );
+$repo->checkout( 'refs/heads/feature' );
+$repo->commit( array( 'updates' => array(
+	'todo.txt' => "buy milk\nwalk dog\nread book\nwrite blog post\n",
+) ) );
+
+$repo->checkout( 'refs/heads/trunk' );
+$result = $repo->merge( 'refs/heads/feature' );
+
+echo "merge head: {$result['new_head']}\n";
+echo "conflicts:  " . ( $result['conflicts'] ? implode( ',', $result['conflicts'] ) : 'none' ) . "\n";
+echo "result:\n" . $repo->read_object_by_path( '/todo.txt' )->consume_all();
+</script>
+<script type="text/expected-output">
+merge head: <oid>
+conflicts:  none
+result:
+buy oat milk
+walk dog
+read book
+write blog post
+</script>
+</php-snippet>
+
+<h2 id="refinement-snapshot-wordpress-options-into-a-repo">Refinement: snapshot WordPress options into a repo</h2>
+
+<p>Serialize a chunk of WP state (options, post meta, a theme config) on every save and commit it. You get free history, diffs between snapshots, and a "rollback to last week" button.</p>
+
+<php-snippet blueprint="toolkit-setup" name="options-snapshot.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Git\GitRepository;
+
+$repo = new GitRepository( InMemoryFilesystem::create() );
+
+$snapshots = array(
+	array( 'blogname' => 'My Site',  'posts_per_page' => 10, 'timezone_string' => 'UTC' ),
+	array( 'blogname' => 'My Site',  'posts_per_page' => 20, 'timezone_string' => 'UTC' ),
+	array( 'blogname' => 'New Name', 'posts_per_page' => 20, 'timezone_string' => 'Europe/Warsaw' ),
+);
+
+foreach ( $snapshots as $i => $options ) {
+	$repo->commit( array(
+		'updates' => array( 'options.json' => json_encode( $options, JSON_PRETTY_PRINT ) ),
+		'commit'  => array( 'message' => "snapshot #{$i}" ),
+	) );
+}
+
+$head    = $repo->get_branch_tip( 'HEAD' );
+$parent  = $repo->read_object( $head )->as_commit()->get_first_parent_hash();
+$diff    = $repo->diff_commits( $head, $parent );
+
+echo "Files changed in last snapshot:\n";
+foreach ( $diff as $name => $entry ) {
+	echo "  {$name}\n";
+}
+</script>
+<script type="text/expected-output">
+Files changed in last snapshot:
+  options.json
+</script>
+</php-snippet>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="filesystem.html"><strong>Filesystem</strong></a><span>Work with repository trees through a storage abstraction.</span></li>
+	<li><a href="merge.html"><strong>Merge</strong></a><span>Resolve divergent histories with explicit three-way merge logic.</span></li>
+	<li><a href="bytestream.html"><strong>ByteStream</strong></a><span>Read and write object data without accidental buffering.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/html.html b/docs/reference/html.html
new file mode 100644
index 000000000..77c86e8c3
--- /dev/null
+++ b/docs/reference/html.html
@@ -0,0 +1,284 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>HTML — PHP Toolkit reference</title>
+<meta name="description" content="WP_HTML_Tag_Processor and WP_HTML_Processor: a pure-PHP, browser-grade HTML5 parser and tag rewriter ported from WordPress core.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a class="github" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+
+<aside class="sidebar" aria-label="Reference navigation">
+	<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+	<nav class="toc" aria-label="Table of contents"></nav>
+	<details class="components-nav" open>
+		<summary>All components</summary>
+		<ol>
+			<li class="current"><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+		</ol>
+	</details>
+</aside>
+
+<article class="content">
+
+<h1>HTML</h1>
+
+<p class="lede">A browser-grade HTML5 parser and tag rewriter for PHP, ported from WordPress core. Walk HTML as a cursor, edit attributes byte-for-byte, query by ancestry — without <code>libxml2</code>, without re-serializing, and without losing the bytes you didn't ask to change.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/html</code></pre>
+
+<aside class="callout credit">
+	<strong>Ported from WordPress core.</strong> <a href="https://developer.wordpress.org/reference/classes/wp_html_tag_processor/"><code>WP_HTML_Tag_Processor</code></a> and <a href="https://developer.wordpress.org/reference/classes/wp_html_processor/"><code>WP_HTML_Processor</code></a> are the same classes WordPress core ships in <code>wp-includes/html-api/</code>. The official method-by-method reference lives on developer.wordpress.org; this page is just a few more examples in the toolkit's voice. Source: <a href="https://github.com/WordPress/wordpress-develop/tree/trunk/src/wp-includes/html-api">WordPress/wordpress-develop</a>. The toolkit version tracks core; bug fixes flow in both directions.
+</aside>
+
+<p>WordPress filters HTML constantly: post content, comments, excerpts, feeds, <a href="https://developer.wordpress.org/block-editor/reference-guides/block-api/">block markup</a>, imported documents. Those fragments often omit <code>&lt;html&gt;</code> and <code>&lt;body&gt;</code>, close tags implicitly, and contain markup browsers handle gracefully but <code>DOMDocument</code> chokes on. The HTML component matches what browsers do — without the extension.</p>
+
+<p>The component gives you two processors. <code>WP_HTML_Tag_Processor</code> is a forward-only cursor over tags and tokens; use it for attribute rewriting at scale. <code>WP_HTML_Processor</code> layers HTML5 tree construction on top so you can query by ancestry (breadcrumbs), serialize the parsed document, and trust that <code>&lt;p&gt;one&lt;p&gt;two</code> parses as two paragraphs the way a browser sees it.</p>
+
+<h2 id="minimal">A minimal example</h2>
+
+<p>Add <code>loading="lazy"</code> to every image in a fragment. The smallest demonstration of every property the component is built around: walk by tag name, conditional edits, byte-honest output.</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-html-minimal.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$html = '<article><img src="hero.jpg" alt="Hero"><p>Hi</p><img src="x.png" alt=""></article>';
+
+$tags = new WP_HTML_Tag_Processor( $html );
+while ( $tags->next_tag( 'img' ) ) {
+	if ( null === $tags->get_attribute( 'loading' ) ) {
+		$tags->set_attribute( 'loading', 'lazy' );
+	}
+}
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<article><img src="hero.jpg" alt="Hero" loading="lazy"><p>Hi</p><img src="x.png" alt="" loading="lazy"></article>
+</script>
+</php-snippet>
+
+<p>The Tag Processor is allocation-light by design: edits are recorded as byte-range replacements and applied lazily when you call <code>get_updated_html()</code>. The first time you read the modified HTML the cost is proportional to the number of edits, not to the size of the document.</p>
+
+<h2 id="absolute-urls">Refinement: rewrite relative URLs</h2>
+
+<p>Walk every <code>&lt;a&gt;</code> tag, classify the <code>href</code> as already-absolute or not, and prepend a base URL when needed. Same processor, different filter:</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-html-absolute.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$html = '<p><a href="/x">rel</a> <a href="https://other.test/y">abs</a> <a href="#frag">frag</a></p>';
+$base = 'https://example.com';
+
+$tags = new WP_HTML_Tag_Processor( $html );
+while ( $tags->next_tag( 'a' ) ) {
+	$href = $tags->get_attribute( 'href' );
+	if ( ! is_string( $href ) || '' === $href ) continue;
+	if ( preg_match( '#^[a-z][a-z0-9+.\-]*:#i', $href ) ) continue;
+	if ( 0 === strpos( $href, '//' ) || 0 === strpos( $href, '#' ) ) continue;
+	$tags->set_attribute( 'href', rtrim( $base, '/' ) . '/' . ltrim( $href, '/' ) );
+}
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<p><a href="https://example.com/x">rel</a> <a href="https://other.test/y">abs</a> <a href="#frag">frag</a></p>
+</script>
+</php-snippet>
+
+<h2 id="strip">Refinement: strip script tags and on* handlers</h2>
+
+<p>The cursor exposes one trick the others don't: <code>get_attribute_names_with_prefix()</code>. Combined with <code>set_modifiable_text('')</code> for raw-text elements, you can neutralize the most common pasted-HTML XSS vectors in one walk.</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-html-strip.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$html = '<p onclick="x()">hi</p><script>evil()</script><img src="x" onerror="boom()">';
+
+$tags = new WP_HTML_Tag_Processor( $html );
+while ( $tags->next_tag() ) {
+	if ( 'SCRIPT' === $tags->get_tag() && ! $tags->is_tag_closer() ) {
+		$tags->set_modifiable_text( '' );
+	}
+	foreach ( $tags->get_attribute_names_with_prefix( 'on' ) as $attr ) {
+		$tags->remove_attribute( $attr );
+	}
+}
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<p>hi</p><script></script><img src="x">
+</script>
+</php-snippet>
+
+<h2 id="csp">Refinement: stamp a CSP nonce</h2>
+
+<p>For Content Security Policy in <code>nonce-</code> mode, every inline <code>&lt;script&gt;</code> and <code>&lt;style&gt;</code> needs a matching nonce attribute. Tag-by-tag is exactly the right granularity:</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-html-nonce.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$nonce = bin2hex( random_bytes( 8 ) );
+$html  = '<style>body{font:16px sans-serif}</style><script>init()</script>';
+
+$tags = new WP_HTML_Tag_Processor( $html );
+while ( $tags->next_tag() ) {
+	$tag = $tags->get_tag();
+	if ( ( 'SCRIPT' === $tag || 'STYLE' === $tag ) && ! $tags->is_tag_closer() ) {
+		$tags->set_attribute( 'nonce', $nonce );
+	}
+}
+echo "nonce: $nonce\n" . $tags->get_updated_html();
+</script>
+</php-snippet>
+
+<h2 id="ancestry">Refinement: query by ancestry with WP_HTML_Processor</h2>
+
+<p>The Tag Processor walks tags as a flat sequence — fast and lean, but blind to context. When you need "every <code>&lt;img&gt;</code> directly inside a <code>&lt;figure&gt;</code>" or "the first <code>&lt;h1&gt;</code> outside any <code>&lt;blockquote&gt;</code>," reach for <code>WP_HTML_Processor</code>. It implements HTML5 tree construction, exposes <code>get_breadcrumbs()</code>, and accepts a <code>breadcrumbs</code> filter on <code>next_tag()</code>:</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-html-breadcrumbs.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$html = '<article>'
+	. '<figure><img src="hero.jpg" alt="Hero"></figure>'
+	. '<p>Body <img src="emoji.png" alt=""> mid-paragraph.</p>'
+	. '<figure><img src="diagram.png" alt="Diagram"></figure>'
+	. '</article>';
+
+$p = WP_HTML_Processor::create_fragment( $html );
+$figure_images = 0;
+while ( $p->next_tag( array( 'breadcrumbs' => array( 'FIGURE', 'IMG' ) ) ) ) {
+	$p->add_class( 'figure-image' );
+	$figure_images++;
+}
+echo "found $figure_images figure images\n" . $p->get_updated_html();
+</script>
+<script type="text/expected-output">
+found 2 figure images
+<article><figure><img src="hero.jpg" alt="Hero" class="figure-image"></figure><p>Body <img src="emoji.png" alt=""> mid-paragraph.</p><figure><img src="diagram.png" alt="Diagram" class="figure-image"></figure></article>
+</script>
+</php-snippet>
+
+<p>Notice that the <code>&lt;img&gt;</code> inside the <code>&lt;p&gt;</code> didn't get the class — its breadcrumbs end in <code>(ARTICLE, P, IMG)</code>, not in <code>(FIGURE, IMG)</code>. The full processor is the right tool whenever the question contains the word "inside."</p>
+
+<h2 id="bookmarks">Refinement: bookmarks for backward edits</h2>
+
+<p>The Tag Processor is forward-only, but bookmarks let you save a position, scan ahead, and seek back to rewrite an earlier tag based on what you found later:</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-html-bookmarks.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+$html = '<ul>'
+	. '<li><input type="checkbox" checked> Buy milk</li>'
+	. '<li><input type="checkbox"> Walk dog</li>'
+	. '<li><input type="checkbox" checked> Read book</li>'
+	. '</ul>';
+
+$tags = new WP_HTML_Tag_Processor( $html );
+$tags->next_tag( 'ul' );
+$tags->set_bookmark( 'list' );
+
+$total = 0; $done = 0;
+while ( $tags->next_tag( 'input' ) ) {
+	$total++;
+	if ( null !== $tags->get_attribute( 'checked' ) ) $done++;
+}
+
+$tags->seek( 'list' );
+$tags->set_attribute( 'data-progress', "$done/$total" );
+$tags->release_bookmark( 'list' );
+
+echo $tags->get_updated_html();
+</script>
+<script type="text/expected-output">
+<ul data-progress="2/3"><li><input type="checkbox" checked> Buy milk</li><li><input type="checkbox"> Walk dog</li><li><input type="checkbox" checked> Read book</li></ul></script>
+</php-snippet>
+
+<p>Bookmarks are explicitly released because each one pins a small amount of state in the processor. In a long document with many bookmarks, releasing them as soon as you're done keeps memory flat.</p>
+
+<h2 id="when">When to use which</h2>
+
+<table class="api-table">
+<tr><th>Use</th><th>For</th></tr>
+<tr><td><code>WP_HTML_Tag_Processor</code></td><td>Attribute rewriting, sanitization, finding tags by name. Forward-only walks. Anything where speed and byte-honesty matter more than context.</td></tr>
+<tr><td><code>WP_HTML_Processor::create_fragment()</code></td><td>Queries by ancestry (<code>breadcrumbs</code>), heading outline extraction, anything that needs to know "is this tag inside that one."</td></tr>
+<tr><td><code>WP_HTML_Decoder::decode_text_node()</code></td><td>Turning entity-encoded text (<code>AT&amp;amp;T</code>) back into raw text correctly. Implements the HTML5 entity algorithm — don't roll your own.</td></tr>
+<tr><td><code>WP_HTML_Decoder::attribute_starts_with()</code></td><td>Safe URL-prefix checks that respect encoded characters (<code>java&amp;#x09;script:</code>). The classic <code>strpos</code> approach misses these.</td></tr>
+</table>
+
+<h2 id="pitfalls">Pitfalls</h2>
+
+<aside class="callout pitfall">
+	<strong>Mutations are buffered.</strong> Edits don't appear in the source string until you call <code>get_updated_html()</code>. If you're hashing, logging, or pattern-matching the original string after edits, you'll see stale content. Read state from the processor (<code>get_attribute()</code>), not from the original string.
+</aside>
+
+<aside class="callout pitfall">
+	<strong>Tag closers are skipped by default.</strong> <code>next_tag()</code> stops only on opening tags unless you pass <code>array( 'tag_closers' =&gt; 'visit' )</code> in the query. When you do opt in, gate attribute edits with <code>! $tags-&gt;is_tag_closer()</code> so you don't try to set attributes on a <code>&lt;/script&gt;</code>.
+</aside>
+
+<aside class="callout pitfall">
+	<strong>Tag-name matches are uppercase.</strong> <code>get_tag()</code> always returns the tag name in uppercase (<code>'IMG'</code>, not <code>'img'</code>). Compare accordingly. The filter argument to <code>next_tag()</code> is case-insensitive in either direction.
+</aside>
+
+<aside class="callout pitfall">
+	<strong>Don't confuse <code>WP_HTML_Tag_Processor</code> with the full processor.</strong> The cursor is forward-only and ancestry-blind. It has no <code>get_breadcrumbs()</code> method and performs no HTML5 tree construction — implicit <code>&lt;tbody&gt;</code> insertion, automatic <code>&lt;p&gt;</code> closing, and the rest live only in <code>WP_HTML_Processor</code>.
+</aside>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="../learn/01-rewriting-html.html"><strong>Tutorial — Rewriting HTML safely</strong></a><span>The chapter that introduces the cursor model and the <code>clean_post_html()</code> function reused later in the importer.</span></li>
+	<li><a href="blockparser.html"><strong>BlockParser</strong></a><span>Parse block comments first, then rewrite the HTML inside each block with the cursor.</span></li>
+	<li><a href="markdown.html"><strong>Markdown</strong></a><span>Convert Markdown to block markup before polishing the HTML it generates.</span></li>
+	<li><a href="dataliberation.html"><strong>DataLiberation</strong></a><span>Rewrite URLs and media references across an entire export, not one fragment at a time.</span></li>
+</ul>
+
+</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/httpclient.html b/docs/reference/httpclient.html
new file mode 100644
index 000000000..782c4b0f9
--- /dev/null
+++ b/docs/reference/httpclient.html
@@ -0,0 +1,622 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>HttpClient — PHP Toolkit reference</title>
+<meta name="description" content="Async HTTP client without curl required. Uses sockets when curl is missing, supports concurrent requests and streaming responses.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li class="current"><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>HttpClient</h1>
+
+<p class="lede">Async HTTP client without <code>curl</code> required. Uses sockets when curl is missing, supports concurrent requests and streaming responses.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/http-client</code></pre>
+
+<p>A plugin installer starts with one request to download <code>plugin.zip</code>. A migration then adds progress reporting, a ten-request media window, resumable downloads, and a remote ZIP reader that feeds ZipFilesystem directly. Those workflows need the same request API from the first GET to the final streamed archive.</p><p>The HttpClient component gives the toolkit a small request/response model, middleware for redirects and caching, concurrent fetches, and response bodies exposed as byte streams. It runs through curl when PHP provides curl and through pure PHP sockets when it does not. Callers keep the same code path.</p><p>Use it to fetch plugin metadata, submit import callbacks, mirror a media library, read a WXR export, or pipe a remote archive into Zip and Filesystem code.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p>The smallest flow has three steps: create a request, wait until headers arrive, then consume the body stream. This is intentionally close to the Fetch API shape, but the body is a toolkit byte stream instead of a buffered string.</p>
+
+<php-snippet blueprint="toolkit-setup" name="get.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$client  = new Client();
+$stream  = $client->fetch( new Request( 'https://example.com/' ) );
+
+$response = $stream->await_response();
+echo "status: " . $response->status_code . "\n";
+echo "first 80 bytes: " . substr( $stream->consume_all(), 0, 80 ) . "\n";
+</script>
+</php-snippet>
+
+<h2 id="refinement-post-to-a-url">Refinement: POST to a URL</h2>
+
+<p>Uploads use the same shape. The only difference is that the request declares a method, request headers, and an upload body stream. Here the body is form-encoded text wrapped in <code>MemoryPipe</code>; a file upload could provide a file-backed read stream instead.</p>
+
+<php-snippet blueprint="toolkit-setup" name="post.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+use WordPress\ByteStream\MemoryPipe;
+
+$payload = http_build_query(
+	array(
+		'title' => 'Hello',
+		'tags'  => 'http,php',
+	),
+	'',
+	'&'
+);
+
+$client  = new Client();
+$request = new Request( 'https://httpbin.org/post', array(
+	'method'      => 'POST',
+	'headers'     => array(
+		'content-type'   => 'application/x-www-form-urlencoded',
+		'content-length' => (string) strlen( $payload ),
+	),
+	'body_stream' => new MemoryPipe( $payload ),
+) );
+
+$response = $client->fetch( $request )->json();
+echo "Server saw form title: " . $response['form']['title'] . "\n";
+</script>
+</php-snippet>
+
+<h2 id="refinement-build-a-json-request-object">Refinement: build a JSON request object</h2>
+
+<p>A <code>Request</code> is just data until a client enqueues it. That makes it easy to test request construction without network access. The constructor normalizes headers, calculates <code>content-length</code> when the body stream has a known length, and moves URL credentials into an Authorization header.</p>
+
+<php-snippet blueprint="toolkit-setup" name="request-object.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\HttpClient\Request;
+
+$body = new MemoryPipe( json_encode( array(
+	'title' => 'Hello',
+	'tags'  => array( 'docs', 'php' ),
+) ) );
+$body->close_writing();
+
+$request = new Request( 'https://user:secret@api.example.test/posts', array(
+	'method'      => 'POST',
+	'headers'     => array( 'content-type' => 'application/json' ),
+	'body_stream' => $body,
+) );
+
+echo $request->method . ' ' . $request->url . "\n";
+echo "content-type: " . $request->get_header( 'content-type' ) . "\n";
+echo "content-length: " . $request->get_header( 'content-length' ) . "\n";
+echo "authorization: " . substr( $request->get_header( 'authorization' ), 0, 10 ) . "...\n";
+</script>
+<script type="text/expected-output">
+POST https://api.example.test/posts
+content-type: application/json
+content-length: 39
+authorization: Basic dXNl...
+</script>
+</php-snippet>
+
+<h2 id="refinement-parse-response-headers">Refinement: parse response headers</h2>
+
+<p>Most applications receive <code>Response</code> objects from <code>await_response()</code>. Transports, middleware, and tests sometimes need the lower-level parser: <code>Response::from_http_headers()</code> turns raw HTTP header bytes into normalized status and case-insensitive headers.</p>
+
+<php-snippet blueprint="toolkit-setup" name="parse-response.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Request;
+use WordPress\HttpClient\Response;
+
+$request = new Request( 'https://api.example.test/posts/42' );
+$raw = "HTTP/1.1 201 Created\r\n"
+	. "Content-Type: application/json\r\n"
+	. "Location: /posts/42\r\n"
+	. "Content-Length: 27\r\n\r\n";
+
+$response = Response::from_http_headers( $raw, $request );
+
+echo "status: " . $response->status_code . ' ' . $response->get_reason_phrase() . "\n";
+echo "ok:     " . ( $response->ok() ? 'yes' : 'no' ) . "\n";
+echo "type:   " . $response->get_header( 'CONTENT-TYPE' ) . "\n";
+echo "size:   " . $response->total_bytes . " bytes\n";
+</script>
+<script type="text/expected-output">
+status: 201 Created
+ok:     yes
+type:   application/json
+size:   27 bytes
+</script>
+</php-snippet>
+
+<h2 id="pick-the-right-reading-style">Pick the right reading style</h2>
+
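+<p>There are three common ways to consume a response: buffer the whole body with <code>consume_all()</code> or <code>json()</code>, read it in chunks with <code>pull()</code> and <code>consume()</code>, or drive the event loop with <code>await_next_event()</code> and handle each body chunk as it arrives. Start simple, then move to the next style only when the workflow demands it.</p>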
+
+<h2 id="refinement-choose-a-transport">Refinement: choose a transport</h2>
+
+<p>The transport is the I/O backend. It should not change your request, response, redirect, cache, or stream code; it only changes how bytes move across the network.</p><p><code>concurrency</code>, <code>timeout_ms</code>, <code>cache_dir</code>, redirects, and response streaming sit above the transport, so the examples later on work with either backend.</p>
+
+<php-snippet blueprint="toolkit-setup" name="transports.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+
+$default = new Client(); // Same as array( 'transport' => 'auto' ).
+
+$portable = new Client( array(
+	'transport' => 'sockets',
+) );
+
+if ( extension_loaded( 'curl' ) ) {
+	$curl = new Client( array(
+		'transport' => 'curl',
+	) );
+}
+</script>
+</php-snippet>
+
+<h2 id="refinement-follow-redirects-and-inspect-the-final-request">Refinement: follow redirects and inspect the final request</h2>
+
+<p>Redirects are middleware, not transport behavior. The client follows up to five redirects by default. The original <code>Request</code> keeps a chain to the final request, so importers can log where a source URL actually landed.</p>
+
+<php-snippet blueprint="toolkit-setup" name="redirects.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$client   = new Client();
+$request  = new Request( 'https://httpbin.org/redirect-to?url=https://example.com/' );
+$stream   = $client->fetch( $request );
+$response = $stream->await_response();
+$stream->consume_all();
+
+$final = $request->latest_redirect();
+echo "original: " . $request->url . "\n";
+echo "final:    " . $final->url . "\n";
+echo "status:   " . $response->status_code . "\n";
+</script>
+</php-snippet>
+
+<h2 id="refinement-cache-repeatable-get-responses">Refinement: cache repeatable GET responses</h2>
+
+<p>Pass <code>cache_dir</code> to add disk caching for cacheable GET and HEAD responses. Fresh cached responses replay the same header/body events as a network response, so crawlers and importers do not need a separate cache code path. Non-GET requests invalidate matching cache entries instead of being cached.</p>
+
+<php-snippet blueprint="toolkit-setup" name="cache.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$cache_dir = sys_get_temp_dir() . '/http-cache-' . uniqid();
+mkdir( $cache_dir );
+
+$client = new Client( array( 'cache_dir' => $cache_dir ) );
+$url    = 'https://httpbin.org/cache/60';
+
+for ( $i = 1; $i <= 2; $i++ ) {
+	$stream   = $client->fetch( new Request( $url ) );
+	$response = $stream->await_response();
+	$body     = $stream->consume_all();
+	echo "request {$i}: HTTP " . $response->status_code . ', body=' . strlen( $body ) . " bytes\n";
+}
+
+echo "cache files: " . count( glob( $cache_dir . '/*' ) ) . "\n";
+</script>
+</php-snippet>
+
+<h2 id="refinement-handle-failures-without-losing-the-queue">Refinement: handle failures without losing the queue</h2>
+
+<p>Failures arrive as events. That lets a crawler, importer, package installer, or media frontloader log one bad URL and keep processing the rest of the queue. Treat failure handling as part of the event loop, not as one global try/catch around the whole batch.</p>
+
+<php-snippet blueprint="toolkit-setup" name="failures.php" runnable="false">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$client = new Client( array( 'timeout_ms' => 5000 ) );
+$client->enqueue( array(
+	new Request( 'https://example.com/', array( 'method' => 'HEAD' ) ),
+	new Request( 'https://example.invalid/missing' ),
+) );
+
+while ( $client->await_next_event() ) {
+	$request = $client->get_request();
+	$event   = $client->get_event();
+
+	if ( Client::EVENT_GOT_HEADERS === $event ) {
+		echo "ok: " . $request->url . " HTTP " . $request->response->status_code . "\n";
+	} elseif ( Client::EVENT_FAILED === $event ) {
+		echo "failed: " . $request->url . "\n";
+	} elseif ( Client::EVENT_FINISHED === $event ) {
+		echo "finished: " . $request->url . "\n";
+	}
+}
+</script>
+</php-snippet>
+
+<h2 id="refinement-monitor-download-progress">Refinement: monitor download progress</h2>
+
+<p>When you care about progress, use the event loop directly. Count bytes from each <code>EVENT_BODY_CHUNK_AVAILABLE</code> event and compare them with <code>Content-Length</code> when the server provides one.</p>
+
+<php-snippet blueprint="toolkit-setup" name="progress.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$url  = 'https://raw.githubusercontent.com/WordPress/php-toolkit/trunk/components/Zip/Tests/fixtures/childrens-literature.zip';
+$dest = sys_get_temp_dir() . '/progress-' . uniqid() . '.zip';
+
+$client  = new Client();
+$request = new Request( $url );
+$client->enqueue( array( $request ) );
+
+$downloaded = 0;
+$last_step  = -1;
+@unlink( $dest );
+
+while ( $client->await_next_event() ) {
+	$event   = $client->get_event();
+	$request = $client->get_request();
+
+	if ( Client::EVENT_GOT_HEADERS === $event ) {
+		echo "status: " . $request->response->status_code . "\n";
+		continue;
+	}
+
+	if ( Client::EVENT_BODY_CHUNK_AVAILABLE === $event ) {
+		$chunk       = $client->get_response_body_chunk();
+		$downloaded += strlen( $chunk );
+		file_put_contents( $dest, $chunk, FILE_APPEND );
+
+		$total = $request->response->total_bytes;
+		if ( $total ) {
+			$step = min( 100, (int) floor( $downloaded / $total * 100 ) );
+			if ( $step >= $last_step + 25 || 100 === $step ) {
+				echo "progress: {$step}% ({$downloaded}/{$total} bytes)\n";
+				$last_step = $step;
+			}
+		} else {
+			echo "downloaded: {$downloaded} bytes\n";
+		}
+		continue;
+	}
+
+	if ( Client::EVENT_FINISHED === $event ) {
+		echo "saved: {$dest}\n";
+	} elseif ( Client::EVENT_FAILED === $event ) {
+		echo "failed: " . $request->error->message . "\n";
+	}
+}
+</script>
+</php-snippet>
+
+<h2 id="refinement-keep-a-sliding-window-of-10-requests">Refinement: keep a sliding window of 10 requests</h2>
+
+<p>For large queues, do not enqueue everything at once. Keep at most ten active requests, enqueue another as each one finishes, and let the client multiplex only that window.</p>
+
+<php-snippet blueprint="toolkit-setup" name="sliding-window.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$urls = array();
+for ( $i = 1; $i <= 25; $i++ ) {
+	$urls[] = 'https://example.com/?request=' . $i;
+}
+
+$client  = new Client( array( 'concurrency' => 10 ) );
+$pending = $urls;
+$active  = array();
+$done    = 0;
+
+$enqueue_next = function () use ( &$pending, &$active, $client ) {
+	if ( ! $pending ) {
+		return;
+	}
+	$url     = array_shift( $pending );
+	$request = new Request( $url, array( 'method' => 'HEAD' ) );
+	$active[ $request->id ] = $request;
+	$client->enqueue( array( $request ) );
+};
+
+for ( $i = 0; $i < 10; $i++ ) {
+	$enqueue_next();
+}
+
+while ( $active && $client->await_next_event() ) {
+	$request = $client->get_request();
+	$event   = $client->get_event();
+
+	if ( Client::EVENT_GOT_HEADERS === $event ) {
+		echo "headers {$request->id}: " . $request->response->status_code . "\n";
+		continue;
+	}
+
+	if ( Client::EVENT_FINISHED === $event || Client::EVENT_FAILED === $event ) {
+		unset( $active[ $request->id ] );
+		$done++;
+		echo "finished {$done}/25, active=" . count( $active ) . "\n";
+		$enqueue_next();
+	}
+}
+</script>
+</php-snippet>
+
+<h2 id="refinement-resume-a-partial-download">Refinement: resume a partial download</h2>
+
+<p>Resuming is an HTTP contract between you and the server. Save what you already have, send a <code>Range</code> request for the remaining bytes, and append only if the server returns <code>206 Partial Content</code>.</p>
+
+<php-snippet blueprint="toolkit-setup" name="resume-download.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$url  = 'https://raw.githubusercontent.com/WordPress/php-toolkit/trunk/components/Zip/Tests/fixtures/childrens-literature.zip';
+$dest = sys_get_temp_dir() . '/resume-' . uniqid() . '.zip';
+
+$client = new Client();
+
+// Simulate an interrupted first attempt by downloading only the first 32 KB.
+$first = new Request( $url, array(
+	'headers' => array( 'range' => 'bytes=0-32767' ),
+) );
+$stream   = $client->fetch( $first );
+$response = $stream->await_response();
+
+// Check the status before reading the body or touching the disk. Without a
+// 206 the body is either the whole file or an error page, and saving it as
+// the "partial" file would leave a misleading temp file behind.
+if ( 206 !== $response->status_code ) {
+	echo "Server did not honor Range; start over with a full download.\n";
+	exit;
+}
+
+file_put_contents( $dest, $stream->consume_all() );
+
+// The size of the partial file is the offset of the first byte still missing.
+$downloaded = filesize( $dest );
+echo "partial file: {$downloaded} bytes\n";
+
+// Ask for everything from that offset to the end of the resource.
+$resume = new Request( $url, array(
+	'headers' => array( 'range' => 'bytes=' . $downloaded . '-' ),
+) );
+$stream   = $client->fetch( $resume );
+$response = $stream->await_response();
+
+// Only a 206 response carries the requested tail; appending anything else
+// would corrupt the file.
+if ( 206 !== $response->status_code ) {
+	echo "Server did not resume; discard partial file and retry from byte 0.\n";
+	exit;
+}
+
+// Append the remainder chunk by chunk. pull() reports how many bytes are
+// ready to consume; a result of 0 ends the loop.
+while ( ! $stream->reached_end_of_data() ) {
+	$n = $stream->pull( 8192 );
+	if ( 0 === $n ) {
+		break;
+	}
+	file_put_contents( $dest, $stream->consume( $n ), FILE_APPEND );
+}
+
+echo "complete file: " . filesize( $dest ) . " bytes\n";
+echo "saved: {$dest}\n";
+</script>
+</php-snippet>
+
+<h2 id="refinement-stream-unzip-a-remote-archive">Refinement: stream-unzip a remote archive</h2>
+
+<p>Mount the remote archive with <code>ZipFilesystem</code>, then copy it into any writable filesystem. <code>SeekableRequestReadStream</code> caches received bytes to a temporary file so <code>ZipFilesystem</code> can read the central directory and seek to entries without first writing the ZIP yourself.</p>
+
+<php-snippet blueprint="toolkit-setup" name="stream-unzip.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\ByteStream\SeekableRequestReadStream;
+use WordPress\HttpClient\Request;
+use WordPress\Filesystem\LocalFilesystem;
+use WordPress\Zip\ZipFilesystem;
+use function WordPress\Filesystem\copy_between_filesystems;
+use function WordPress\Filesystem\ls_recursive;
+
+// Remote archive to read, and a fresh scratch directory to extract into.
+$url  = 'https://raw.githubusercontent.com/WordPress/php-toolkit/trunk/components/Zip/Tests/fixtures/childrens-literature.zip';
+$root = sys_get_temp_dir() . '/remote-zip-' . uniqid();
+mkdir( $root );
+
+// Wrap the request in a seekable read stream so the ZIP reader can seek
+// within the response.
+$client = new Client();
+$reader = new SeekableRequestReadStream(
+	new Request( $url ),
+	array( 'client' => $client )
+);
+
+// Stop early when the response is not ok(), before treating it as a ZIP.
+$response = $reader->await_response();
+if ( ! $response->ok() ) {
+	echo "HTTP " . $response->status_code . "\n";
+	exit;
+}
+
+// Expose the archive and the scratch directory as two filesystems.
+$zip   = ZipFilesystem::create( $reader );
+$local = LocalFilesystem::create( $root );
+
+// Copy everything from the archive root into the scratch directory root.
+copy_between_filesystems( array(
+	'source_filesystem' => $zip,
+	'source_path'       => '/',
+	'target_filesystem' => $local,
+	'target_path'       => '/',
+) );
+
+// Count every entry in the nested listing whose 'type' is 'file'.
+$tree  = ls_recursive( $local, '/' );
+$files = 0;
+array_walk_recursive( $tree, function ( $value, $key ) use ( &$files ) {
+	if ( 'type' === $key && 'file' === $value ) {
+		$files++;
+	}
+} );
+
+echo "extracted {$files} files\n";
+echo "root: {$root}\n";
+</script>
+</php-snippet>
+
+<h2 id="refinement-parallel-fan-out-fetch-many-urls-at-once">Refinement: parallel fan-out: fetch many URLs at once</h2>
+
+<p>Enqueue a batch of requests and react to events as they fire. The client multiplexes them — total wall time is roughly the slowest request, not the sum.</p>
+
+<php-snippet blueprint="toolkit-setup" name="fan-out.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$urls = array(
+	'https://wordpress.org/',
+	'https://make.wordpress.org/',
+	'https://developer.wordpress.org/',
+);
+
+$client = new Client();
+
+// Build one HEAD request per URL and hand the whole batch to the client.
+$requests = array();
+foreach ( $urls as $url ) {
+	$requests[] = new Request( $url, array( 'method' => 'HEAD' ) );
+}
+$client->enqueue( $requests );
+
+// Record a status code, or an error message, per request URL.
+$results = array();
+while ( $client->await_next_event() ) {
+	$request = $client->get_request();
+
+	switch ( $client->get_event() ) {
+		case Client::EVENT_GOT_HEADERS:
+			$results[ $request->url ] = $request->response->status_code;
+			break;
+		case Client::EVENT_FAILED:
+			$results[ $request->url ] = 'ERR ' . $request->error->message;
+			break;
+	}
+}
+
+foreach ( $results as $url => $status ) {
+	printf( "%-40s %s\n", $url, $status );
+}
+</script>
+</php-snippet>
+
+<h2 id="refinement-stream-a-download-to-disk-without-oom">Refinement: stream a download to disk without OOM</h2>
+
+<p>Process the body chunk-by-chunk via the event loop. Memory stays flat regardless of file size.</p>
+
+<php-snippet blueprint="toolkit-setup" name="stream-to-disk.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpClient\Client;
+use WordPress\HttpClient\Request;
+
+$dest   = sys_get_temp_dir() . '/wp-readme.html';
+$client = new Client();
+$client->enqueue( array( new Request( 'https://wordpress.org/' ) ) );
+
+// Open the destination once. Mode 'wb' truncates any leftover file from a
+// previous run, and a single handle avoids reopening the file per chunk.
+$file = fopen( $dest, 'wb' );
+if ( false === $file ) {
+	echo "Could not open {$dest} for writing\n";
+	exit;
+}
+
+$bytes = 0;
+
+while ( $client->await_next_event() ) {
+	switch ( $client->get_event() ) {
+		case Client::EVENT_BODY_CHUNK_AVAILABLE:
+			// Write each chunk as it arrives instead of accumulating the body.
+			$chunk  = $client->get_response_body_chunk();
+			$bytes += strlen( $chunk );
+			fwrite( $file, $chunk );
+			break;
+		case Client::EVENT_FINISHED:
+			echo "Wrote {$bytes} bytes to {$dest}\n";
+			break;
+		case Client::EVENT_FAILED:
+			// Report the failure instead of ending silently with a partial file.
+			echo "failed: " . $client->get_request()->error->message . "\n";
+			break;
+	}
+}
+
+fclose( $file );
+
+echo "Peak memory: " . round( memory_get_peak_usage( true ) / 1024 / 1024, 2 ) . " MB\n";
+</script>
+</php-snippet>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="bytestream.html"><strong>ByteStream</strong></a><span>Stream request and response bodies.</span></li>
+	<li><a href="filesystem.html"><strong>Filesystem</strong></a><span>Persist large downloads without buffering them in memory.</span></li>
+	<li><a href="corsproxy.html"><strong>CORSProxy</strong></a><span>Bridge browser-side tools to servers without CORS headers.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/httpserver.html b/docs/reference/httpserver.html
new file mode 100644
index 000000000..66c499ece
--- /dev/null
+++ b/docs/reference/httpserver.html
@@ -0,0 +1,185 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>HttpServer — PHP Toolkit reference</title>
+<meta name="description" content="A minimal blocking TCP HTTP server in pure PHP. For CLI tools and tests, not for production traffic.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li class="current"><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>HttpServer</h1>
+
+<p class="lede">A minimal blocking TCP HTTP server in pure PHP. For CLI tools and tests, not for production traffic.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/http-server</code></pre>
+
+<p>Sometimes a PHP tool needs a tiny local HTTP surface: a test fixture server, a webhook receiver during development, a CLI tool with a browser UI, or a demo endpoint for another component. Pulling in a production web framework would obscure the example and add dependencies the toolkit avoids.</p><p>The HttpServer component is intentionally small: a blocking TCP server, incoming request objects, and response writers. It is useful for local tools and tests. It is not a replacement for nginx, Apache, php-fpm, RoadRunner, Swoole, or a production application server.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<php-snippet blueprint="toolkit-setup" name="hello-server.php" runnable="false">
+<script type="application/x-php">
+<?php
+require __DIR__ . '/vendor/autoload.php';
+
+use WordPress\HttpServer\TcpServer;
+use WordPress\HttpServer\IncomingRequest;
+use WordPress\HttpServer\Response\ResponseWriteStream;
+
+// Request handler: replies with a plain-text greeting naming the method and URL.
+$handler = function ( IncomingRequest $request, ResponseWriteStream $response ) {
+	$greeting = "Hello from " . $request->method . " " . $request->url . "\n";
+
+	$response->send_http_code( 200 );
+	$response->send_header( 'Content-Type', 'text/plain' );
+	$response->append_bytes( $greeting );
+};
+
+// Callback given to serve(); it receives the host and port and prints the URL.
+$on_listening = function ( $host, $port ) {
+	echo "Listening on http://{$host}:{$port}\n";
+};
+
+$server = new TcpServer( '127.0.0.1', 8080 );
+$server->set_handler( $handler );
+$server->serve( $on_listening );
+</script>
+</php-snippet>
+
+<h2 id="refinement-a-tiny-json-router">Refinement: a tiny JSON router</h2>
+
+<p>Build a CLI tool with a web UI by switching on the parsed path and method.</p>
+
+<php-snippet blueprint="toolkit-setup" name="mini-router.php" runnable="false">
+<script type="application/x-php">
+<?php
+require __DIR__ . '/vendor/autoload.php';
+
+use WordPress\HttpServer\TcpServer;
+use WordPress\HttpServer\IncomingRequest;
+use WordPress\HttpServer\Response\ResponseWriteStream;
+
+$server = new TcpServer( '127.0.0.1', 8080 );
+
+// Route on the URL path (and, for /api/echo, the method). Anything that
+// matches no route gets a plain-text 404.
+$server->set_handler( function ( IncomingRequest $request, ResponseWriteStream $response ) {
+	$path = $request->get_parsed_url()->pathname;
+
+	if ( '/api/status' === $path ) {
+		$response->send_http_code( 200 );
+		$response->send_header( 'Content-Type', 'application/json' );
+		$response->append_bytes( json_encode( array(
+			'ok'     => true,
+			'pid'    => getmypid(),
+			'memory' => memory_get_usage( true ),
+		) ) );
+		return;
+	}
+
+	if ( '/api/echo' === $path && 'POST' === $request->method ) {
+		// Drain the request body in pulls of 4096 bytes.
+		$body = '';
+		while ( ! $request->body_stream->reached_end_of_data() ) {
+			$n = $request->body_stream->pull( 4096 );
+			if ( $n <= 0 ) {
+				// Nothing was pulled: stop rather than spin on a stalled stream.
+				break;
+			}
+			$body .= $request->body_stream->consume( $n );
+		}
+		$response->send_http_code( 200 );
+		$response->send_header( 'Content-Type', 'text/plain' );
+		$response->append_bytes( $body );
+		return;
+	}
+
+	// Label the fallback body like every other branch does.
+	$response->send_http_code( 404 );
+	$response->send_header( 'Content-Type', 'text/plain' );
+	$response->append_bytes( "Not found\n" );
+} );
+
+$server->serve();
+</script>
+</php-snippet>
+
+<h2 id="refinement-buffered-response-with-auto-content-length">Refinement: buffered response with auto Content-Length</h2>
+
+<p>Use <code>BufferingResponseWriter</code> when you want the framework to compute <code>Content-Length</code> for you, or when the runtime is CGI-shaped and expects the full body up front. This one runs anywhere — no socket required.</p>
+
+<php-snippet blueprint="toolkit-setup" name="buffered-writer.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\HttpServer\Response\BufferingResponseWriter;
+
+// Set a status code and a header, then append the body in two pieces.
+$writer = new BufferingResponseWriter();
+$writer->send_http_code( 200 );
+$writer->send_header( 'Content-Type', 'text/html' );
+$writer->append_bytes( '<!doctype html><title>Hi</title><h1>Hello</h1>' );
+$writer->append_bytes( '<p>Buffered body, sent at the end.</p>' );
+
+// Capture whatever close_writing() prints so it can be shown under the
+// "body:" label below instead of at this point in the output.
+ob_start();
+$writer->close_writing();
+$response_body = ob_get_clean();
+
+// List the headers the writer holds, one "Name: value" pair per line.
+echo "headers before send:\n";
+foreach ( $writer->get_buffered_headers() as $name => $value ) {
+	echo "{$name}: {$value}\n";
+}
+echo "\nbody:\n" . $response_body;
+</script>
+<script type="text/expected-output">
+headers before send:
+Content-Type: text/html
+
+body:
+<!doctype html><title>Hi</title><h1>Hello</h1><p>Buffered body, sent at the end.</p>
+</script>
+</php-snippet>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="cli.html"><strong>CLI</strong></a><span>Expose a local browser UI from a command-line tool.</span></li>
+	<li><a href="httpclient.html"><strong>HttpClient</strong></a><span>Test client code against a small local fixture server.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/index.html b/docs/reference/index.html
new file mode 100644
index 000000000..5330e5107
--- /dev/null
+++ b/docs/reference/index.html
@@ -0,0 +1,74 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Reference — PHP Toolkit</title>
+<meta name="description" content="Per-component reference pages for PHP Toolkit. Each page has a one-line definition, a minimal runnable example, refinements, and pitfalls.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a class="github" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<main class="reference-landing">
+
+<h1>Reference</h1>
+
+<p class="lede">One concept guide per component. Each page assumes you know what HTML is, what a ZIP file is, what a stream is — and explains how this particular component models that thing in pure PHP. If a concept appears for the first time in <a href="../learn/">the tutorial</a>, the reference page links back.</p>
+
+<section class="ref-group">
+	<h2>Content and migration</h2>
+	<ul class="ref-grid">
+		<li><a href="html.html"><strong>HTML</strong><span>Browser-grade HTML5 parser and tag rewriter. Cursor model, byte-for-byte edits, breadcrumb queries.</span></a></li>
+		<li><a href="blockparser.html"><strong>BlockParser</strong><span>Parse WordPress block markup into the array shape WordPress core returns. No <code>block.json</code>, no rendering.</span></a></li>
+		<li><a href="markdown.html"><strong>Markdown</strong><span>Convert between Markdown and WordPress block markup, with frontmatter for metadata.</span></a></li>
+		<li><a href="xml.html"><strong>XML</strong><span>A cursor-based XML processor that reads, edits, and emits export-sized files without building a tree.</span></a></li>
+		<li><a href="encoding.html"><strong>Encoding</strong><span>Validate, classify, and repair UTF-8 bytes before they reach a strict parser.</span></a></li>
+		<li><a href="dataliberation.html"><strong>DataLiberation</strong><span>Stream WordPress-shaped entities between sites. URL rewriting, attachment frontloading, resumable migration.</span></a></li>
+	</ul>
+</section>
+
+<section class="ref-group">
+	<h2>Streams and storage</h2>
+	<ul class="ref-grid">
+		<li><a href="bytestream.html"><strong>ByteStream</strong><span>Pull / peek / consume read streams and chunked write streams. Composable filters: gzip, hash, limit, window.</span></a></li>
+		<li><a href="filesystem.html"><strong>Filesystem</strong><span>One filesystem interface, multiple backends: local disk, memory, SQLite, ZIP-backed.</span></a></li>
+		<li><a href="zip.html"><strong>Zip</strong><span>Read and write ZIP archives one entry at a time, in pure PHP. EPUB, .docx, plugin bundles.</span></a></li>
+		<li><a href="git.html"><strong>Git</strong><span>Read and write Git objects, refs, and trees in memory. Mount a commit as a filesystem.</span></a></li>
+		<li><a href="merge.html"><strong>Merge</strong><span>Three-way diffs and merges with explicit conflict records.</span></a></li>
+	</ul>
+</section>
+
+<section class="ref-group">
+	<h2>Networked tools</h2>
+	<ul class="ref-grid">
+		<li><a href="httpclient.html"><strong>HttpClient</strong><span>HTTP requests with redirects, ranged resumable downloads, an event loop for progress, and pluggable transports.</span></a></li>
+		<li><a href="httpserver.html"><strong>HttpServer</strong><span>A minimal blocking HTTP server: bind to a local port and answer requests. OAuth callbacks, fixture servers, status pages.</span></a></li>
+		<li><a href="corsproxy.html"><strong>CORSProxy</strong><span>Server-side fetch for browser apps that can't bypass the same-origin policy.</span></a></li>
+		<li><a href="cli.html"><strong>CLI</strong><span>Parse <code>argv</code> against a declared command-line contract. No console framework.</span></a></li>
+	</ul>
+</section>
+
+<section class="ref-group">
+	<h2>WordPress runtime support</h2>
+	<ul class="ref-grid">
+		<li><a href="polyfill.html"><strong>Polyfill</strong><span>WordPress-shaped helpers (<code>esc_html</code>, filters, translation stubs) for code that runs outside WordPress.</span></a></li>
+		<li><a href="blueprints.html"><strong>Blueprints</strong><span>Versioned recipes for spinning up a WordPress site with a known plugin set, content, and config.</span></a></li>
+		<li><a href="coding-standards.html"><strong>ToolkitCodingStandards</strong><span>PHPCS sniffs that encode the project's review feedback as enforceable rules.</span></a></li>
+	</ul>
+</section>
+
+</main>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/markdown.html b/docs/reference/markdown.html
new file mode 100644
index 000000000..227aebbe1
--- /dev/null
+++ b/docs/reference/markdown.html
@@ -0,0 +1,263 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Markdown — PHP Toolkit reference</title>
+<meta name="description" content="Bidirectional converter between Markdown and WordPress block markup. Useful for moving content between Markdown files and WordPress while preserving the structures both formats can express.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li class="current"><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>Markdown</h1>
+
+<p class="lede">Bidirectional converter between Markdown and WordPress block markup. Useful for moving content between Markdown files and WordPress while preserving the structures both formats can express.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/markdown</code></pre>
+
+<aside class="callout credit">
+	<strong>Built on league/commonmark.</strong> Markdown parsing is delegated to <a href="https://commonmark.thephpleague.com/"><code>league/commonmark</code></a>; YAML frontmatter is handled by <a href="https://github.com/webuni/front-matter"><code>webuni/front-matter</code></a>. The toolkit's own work is the bridge between CommonMark's AST and <a href="https://developer.wordpress.org/block-editor/reference-guides/block-api/">WordPress block markup</a>, in both directions.
+</aside>
+
+<p>Many publishing workflows start in Markdown: documentation sites, static-site generators, Git-backed editorial workflows, Obsidian vaults, and developer notes. WordPress stores editor content as block markup. Moving between those worlds by string replacement loses metadata and quickly breaks on lists, tables, code blocks, and frontmatter.</p><p>The Markdown component provides a structured bridge. <code>MarkdownConsumer</code> turns Markdown plus frontmatter into block markup and metadata; <code>MarkdownProducer</code> turns supported block markup back into Markdown. The conversion is meant for practical content workflows, not byte-identical round-tripping of every custom block attribute.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p>Feed Markdown into <code>MarkdownConsumer</code>, get block markup back. The result is a <code>BlocksWithMetadata</code> object that holds both the rendered blocks and any frontmatter parsed from the document.</p>
+
+<php-snippet blueprint="toolkit-setup" name="quickstart.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+
+// Convert a Markdown string and print the resulting block markup.
+$markdown = "# Hello\n\nWelcome to **WordPress**.";
+$consumer = new MarkdownConsumer( $markdown );
+$result   = $consumer->consume();
+
+echo $result->get_block_markup();
+</script>
+<script type="text/expected-output">
+<!-- wp:heading {"level":1} -->
+<h1 class="wp-block-heading" id="hello">Hello</h1>
+<!-- /wp:heading -->
+
+<!-- wp:paragraph -->
+<p>Welcome to <b>WordPress</b>.</p>
+<!-- /wp:paragraph -->
+</script>
+</php-snippet>
+
+<h2 id="refinement-round-trip-blocks-back-to-markdown">Refinement: round-trip: blocks back to Markdown</h2>
+
+<p>Pair <code>MarkdownProducer</code> with <code>MarkdownConsumer</code> to convert in either direction. Round-tripping is lossy for block attributes that have no Markdown representation (custom classes, alignment), so do not expect byte-perfect equality.</p>
+
+<php-snippet blueprint="toolkit-setup" name="roundtrip.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+use WordPress\Markdown\MarkdownProducer;
+
+$md = "## Round trip\n\n- one\n- two\n- three\n";
+
+// Markdown to blocks.
+$consumer = new MarkdownConsumer( $md );
+$blocks   = $consumer->consume();
+
+// Blocks back to Markdown.
+$producer = new MarkdownProducer( $blocks );
+
+echo $producer->produce();
+</script>
+<script type="text/expected-output">
+## Round trip
+
+- one
+- two
+- three
+</script>
+</php-snippet>
+
+<h2 id="refinement-reading-yaml-frontmatter-as-post-meta">Refinement: reading YAML frontmatter as post meta</h2>
+
+<p>Each frontmatter key maps to an array of values, so a single key can hold multiple values. Use <code>get_meta_value()</code> when you only want the first scalar.</p>
+
+<php-snippet blueprint="toolkit-setup" name="frontmatter.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+
+$md = <<<MD
+---
+post_title: "The Name of the Wind"
+post_status: publish
+tags: [fantasy, kingkiller]
+---
+
+Once upon a time...
+MD;
+
+$consumer = new MarkdownConsumer( $md );
+$consumer->consume();
+
+// Single-valued keys: read them through get_meta_value().
+$title  = $consumer->get_meta_value( 'post_title' );
+$status = $consumer->get_meta_value( 'post_status' );
+
+// The tag list sits at index 0 of the 'tags' entry in the full metadata.
+$metadata = $consumer->get_all_metadata();
+$tags     = $metadata['tags'][0];
+
+echo 'Title: ' . $title . "\n";
+echo 'Status: ' . $status . "\n";
+echo 'Tags: ' . implode( ', ', $tags ) . "\n";
+</script>
+<script type="text/expected-output">
+Title: The Name of the Wind
+Status: publish
+Tags: fantasy, kingkiller
+</script>
+</php-snippet>
+
+<h2 id="refinement-migrating-an-obsidian-or-hugo-folder-of-markdown">Refinement: migrating an Obsidian or Hugo folder of Markdown</h2>
+
+<p>Walk a directory of <code>.md</code> files (Obsidian vault, Hugo <code>content/</code>, Jekyll <code>_posts</code>) and emit one block-markup record per file.</p>
+
+<php-snippet blueprint="toolkit-setup" name="migrate-folder.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+
+// Seed a throwaway vault: one note with frontmatter, one without.
+@mkdir( '/tmp/vault', 0777, true );
+file_put_contents( '/tmp/vault/welcome.md', "---\ntitle: Welcome\n---\n\nHello world." );
+file_put_contents( '/tmp/vault/roadmap.md', "# Roadmap\n\n1. Ship\n2. Iterate" );
+
+$paths = glob( '/tmp/vault/*.md' );
+
+foreach ( $paths as $path ) {
+	$source   = file_get_contents( $path );
+	$consumer = new MarkdownConsumer( $source );
+	$consumer->consume();
+
+	// Fall back to the file name when the frontmatter has no title.
+	$title = $consumer->get_meta_value( 'title' );
+	if ( ! $title ) {
+		$title = basename( $path, '.md' );
+	}
+
+	// Show only the first 120 bytes of the generated markup.
+	$preview = substr( $consumer->get_block_markup(), 0, 120 );
+
+	echo "=== $title ($path) ===\n";
+	echo $preview . "...\n\n";
+}
+</script>
+<script type="text/expected-output">
+=== roadmap (/tmp/<tempfile>/roadmap.md) ===
+<!-- wp:heading {"level":1} -->
+<h1 class="wp-block-heading" id="roadmap">Roadmap</h1>
+<!-- /wp:heading -->
+
+<!-- wp:lis...
+
+=== Welcome (/tmp/<tempfile>/welcome.md) ===
+<!-- wp:paragraph -->
+<p>Hello world.</p>
+<!-- /wp:paragraph -->
+
+...
+</script>
+</php-snippet>
+
+<h2 id="refinement-counting-blocks-produced-by-a-markdown-document">Refinement: counting blocks produced by a Markdown document</h2>
+
+<p>After conversion, the block markup is plain WordPress block markup, so <code>parse_blocks()</code> works on it directly. This is the standard way to introspect what the converter emitted before saving it to the database.</p>
+
+<php-snippet blueprint="toolkit-setup" name="count-blocks.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Markdown\MarkdownConsumer;
+
+$md = <<<MD
+# Title
+
+A paragraph with **bold** and *italics*.
+
+| Col A | Col B |
+|-------|-------|
+| 1     | 2     |
+
+```php
+echo 'hi';
+```
+
+> A quote.
+MD;
+
+$consumer = new MarkdownConsumer( $md );
+$markup   = $consumer->consume()->get_block_markup();
+
+// Walk the parsed blocks breadth-first, tallying each named block.
+$counts  = array();
+$pending = parse_blocks( $markup );
+
+while ( $pending ) {
+	$block      = array_shift( $pending );
+	$block_name = $block['blockName'];
+
+	// Entries whose blockName is null are not counted.
+	if ( null !== $block_name ) {
+		if ( ! isset( $counts[ $block_name ] ) ) {
+			$counts[ $block_name ] = 0;
+		}
+		$counts[ $block_name ]++;
+	}
+
+	// Queue nested blocks behind the ones already waiting.
+	$pending = array_merge( $pending, $block['innerBlocks'] );
+}
+
+foreach ( $counts as $name => $count ) {
+	echo "{$name}: {$count}\n";
+}
+</script>
+<script type="text/expected-output">
+core/heading: 1
+core/paragraph: 2
+core/table: 1
+core/code: 1
+core/quote: 1
+</script>
+</php-snippet>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="blockparser.html"><strong>BlockParser</strong></a><span>Understand the block tree created from Markdown output.</span></li>
+	<li><a href="html.html"><strong>HTML</strong></a><span>Rewrite rendered HTML fragments without using DOMDocument.</span></li>
+	<li><a href="dataliberation.html"><strong>DataLiberation</strong></a><span>Turn Markdown folders into import/export streams.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/merge.html b/docs/reference/merge.html
new file mode 100644
index 000000000..7ced9da74
--- /dev/null
+++ b/docs/reference/merge.html
@@ -0,0 +1,283 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Merge — PHP Toolkit reference</title>
+<meta name="description" content="Three-way merge and diff. Pluggable differ + merger + optional validator.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li class="current"><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>Merge</h1>
+
+<p class="lede">Three-way merge and diff. Pluggable differ + merger + optional validator.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/merge</code></pre>
+
+<p>Content synchronization needs more than "last write wins." A Markdown file changes in Git while the same post changes in WordPress. A generated config changes through both a CLI tool and a UI. In those cases you need a common ancestor, two edited versions, and a way to explain conflicts to a human.</p><p>The Merge component provides the diff and three-way merge primitives used by those workflows. The default examples are line-oriented because that is the most familiar shape, but the strategy is intentionally pluggable: choose the differ, choose the merger, and optionally validate the merged result before accepting it.</p><p>Use the merge result to auto-accept independent edits and to show structured conflicts when a person must decide.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p>Feed two strings to <code>LineDiffer</code> and inspect the operations. Every <code>get_changes()</code> entry is a <code>[op, text]</code> pair.</p>
+
+<php-snippet blueprint="toolkit-setup" name="line-diff.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Merge\Diff\Diff;
+use WordPress\Merge\Diff\LineDiffer;
+
+$diff = ( new LineDiffer() )->diff(
+	"alpha\nbeta\ngamma\n", // Old text.
+	"alpha\nBETA\ngamma\ndelta\n" // New text: line 2 changed, one line appended.
+);
+
+$labels = array( Diff::DIFF_EQUAL => '=', Diff::DIFF_DELETE => '-', Diff::DIFF_INSERT => '+' ); // Op constant => display marker.
+foreach ( $diff->get_changes() as $change ) { // Each change is an [op, text] pair.
+	echo $labels[ $change[0] ] . ' ' . rtrim( $change[1] ) . "\n"; // rtrim() strips the chunk's trailing whitespace before printing.
+}
+</script>
+<script type="text/expected-output">
+= alpha
+- beta
++ BETA
+= gamma
++ delta
+=
+</script>
+</php-snippet>
+
+<h2 id="refinement-render-a-unified-patch">Refinement: render a unified patch</h2>
+
+<p><code>format_as_git_patch()</code> produces output that mirrors <code>git diff</code>, including hunk headers — handy for emails, CI annotations, or a "what changed?" panel.</p>
+
+<php-snippet blueprint="toolkit-setup" name="git-patch.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Merge\Diff\LineDiffer;
+
+$old = "title: Hello\nauthor: Alice\nstatus: draft\n";
+$new = "title: Hello, world\nauthor: Alice\nstatus: published\ntags: greeting\n";
+
+$diff = ( new LineDiffer() )->diff( $old, $new ); // Diff the two versions.
+echo $diff->format_as_git_patch( array(
+	'a_source' => 'a/post.yml', // Appears on the "---" line of the expected output.
+	'b_source' => 'b/post.yml', // Appears on the "+++" line of the expected output.
+) );
+</script>
+<script type="text/expected-output">
+diff --git a/post.yml b/post.yml
+--- a/post.yml
++++ b/post.yml
+@@ -1,4 +1,5 @@- title: Hello
++ title: Hello, world
+  author: Alice
+- status: draft
++ status: published
++ tags: greeting
+</script>
+</php-snippet>
+
+<h2 id="refinement-three-way-merge-with-no-conflicts">Refinement: three-way merge with no conflicts</h2>
+
+<p>The classic case: each branch changes a different region. Pass the common ancestor plus both edits to <code>MergeStrategy::merge()</code> and read the merged result.</p>
+
+<php-snippet blueprint="toolkit-setup" name="three-way.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Merge\Diff\LineDiffer;
+use WordPress\Merge\Merge\LineMerger;
+use WordPress\Merge\MergeStrategy;
+
+$strategy = new MergeStrategy( new LineDiffer(), new LineMerger() ); // Differ and merger are passed in explicitly.
+
+$result = $strategy->merge(
+	"intro\nbody\noutro\n", // Common ancestor.
+	"intro updated\nbody\noutro\n", // First edit: changes the first line.
+	"intro\nbody\noutro\nappendix\n" // Second edit: appends a line.
+);
+
+echo $result->has_conflicts() ? "conflicts!\n" : "clean merge:\n"; // Status line first, merged text after.
+echo $result->get_merged_content();
+</script>
+<script type="text/expected-output">
+clean merge:
+intro updated
+body
+outro
+appendix
+</script>
+</php-snippet>
+
+<h2 id="refinement-inspect-and-surface-conflicts">Refinement: inspect and surface conflicts</h2>
+
+<p>When both sides edit the same region, the merger produces a <code>MergeConflict</code>. The merged content carries Git-style markers, but the structured <code>get_conflicts()</code> output is what you want for a UI that lets the user pick a side.</p>
+
+<php-snippet blueprint="toolkit-setup" name="conflicts.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Merge\Diff\LineDiffer;
+use WordPress\Merge\Merge\LineMerger;
+use WordPress\Merge\MergeStrategy;
+
+$strategy = new MergeStrategy( new LineDiffer(), new LineMerger() );
+$result = $strategy->merge(
+	"line 1\nline 2\n", // Common ancestor.
+	"line 1\nline 2 from Alice\n", // Reported as "ours" in the expected output.
+	"line 1\nline 2 from Bob\n" // Reported as "theirs" in the expected output.
+);
+
+if ( $result->has_conflicts() ) {
+	foreach ( $result->get_conflicts() as $c ) { // Each conflict exposes both competing versions.
+		echo "ours:   " . trim( $c->ours ) . "\n";
+		echo "theirs: " . trim( $c->theirs ) . "\n";
+	}
+}
+echo "\n--- merged content with markers ---\n";
+echo $result->get_merged_content(); // Printed whether or not conflicts were found.
+</script>
+<script type="text/expected-output">
+ours:   line 2 from Alice
+theirs: line 2 from Bob
+
+--- merged content with markers ---
+line 1
+
+<<<<<<< HEAD
+line 2 from Alice
+
+=======
+line 2 from Bob
+
+>>>>>>> incoming
+</script>
+</php-snippet>
+
+<h2 id="refinement-sync-a-markdown-folder-against-an-edited-db-copy">Refinement: sync a Markdown folder against an edited DB copy</h2>
+
+<p>A real-world scenario: posts live both in a Git-tracked Markdown folder and in WordPress, and someone edits each. Three-way-merge each post against its common ancestor.</p>
+
+<php-snippet blueprint="toolkit-setup" name="sync-folder-vs-db.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Merge\Diff\LineDiffer;
+use WordPress\Merge\Merge\LineMerger;
+use WordPress\Merge\MergeStrategy;
+
+$strategy = new MergeStrategy( new LineDiffer(), new LineMerger() );
+
+$posts = array( // File name => the three versions of that post.
+	'hello.md' => array( // Disk rewrites line 2; the DB copy appends a line.
+		'base' => "# Hello\nDraft body.\n",
+		'disk' => "# Hello\nDraft body, expanded on disk.\n",
+		'db'   => "# Hello\nDraft body.\nNew section from the editor.\n",
+	),
+	'about.md' => array( // Both sides rewrite the same line.
+		'base' => "# About\nWho we are.\n",
+		'disk' => "# About\nWho *they* are.\n",
+		'db'   => "# About\nWho we really are.\n",
+	),
+);
+
+foreach ( $posts as $name => $sides ) {
+	$result = $strategy->merge( $sides['base'], $sides['disk'], $sides['db'] ); // Order: ancestor, disk version, DB version.
+	echo "=== {$name} ===\n";
+	echo $result->has_conflicts() ? "(conflict — needs review)\n" : "(auto-merged)\n";
+	echo $result->get_merged_content() . "\n"; // Extra newline separates the posts in the output.
+}
+</script>
+<script type="text/expected-output">
+=== hello.md ===
+(conflict — needs review)
+# Hello
+
+<<<<<<< HEAD
+Draft body, expanded on disk.
+
+=======
+New section from the editor.
+
+>>>>>>> incoming 
+
+
+=== about.md ===
+(conflict — needs review)
+# About
+
+<<<<<<< HEAD
+Who *they* are.
+
+=======
+Who we really are.
+
+>>>>>>> incoming
+</script>
+</php-snippet>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="git.html"><strong>Git</strong></a><span>Merge file contents discovered through repository history.</span></li>
+	<li><a href="markdown.html"><strong>Markdown</strong></a><span>Resolve file-based editorial workflows before converting to blocks.</span></li>
+	<li><a href="dataliberation.html"><strong>DataLiberation</strong></a><span>Make content synchronization conflicts visible.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/polyfill.html b/docs/reference/polyfill.html
new file mode 100644
index 000000000..258fbe9c5
--- /dev/null
+++ b/docs/reference/polyfill.html
@@ -0,0 +1,215 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Polyfill — PHP Toolkit reference</title>
+<meta name="description" content="PHP 8 string functions on PHP 7.2+, WordPress hook stubs, and translation/escaping passthroughs so toolkit code runs without WordPress.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li class="current"><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>Polyfill</h1>
+
+<p class="lede">PHP 8 string functions on PHP 7.2+, WordPress hook stubs, and translation/escaping passthroughs so toolkit code runs without WordPress.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/polyfill</code></pre>
+
+<aside class="callout credit">
+	<strong>WordPress-shaped behavior.</strong> When WordPress is loaded, every function in this component defers to WordPress. The standalone implementations of <code>esc_html()</code>, <code>add_filter()</code>, <code>__()</code>, and friends match WordPress core's behavior so the same code runs inside and outside the platform.
+</aside>
+
+<p>A lot of WordPress-adjacent code wants to call <code>esc_html()</code>, <code>__()</code>, or <code>apply_filters()</code> without booting WordPress. The polyfill component provides minimal but real implementations so that code runs unchanged outside WordPress, and stays out of the way when WordPress is loaded (every function uses <code>function_exists()</code> guards).</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p>The polyfills define <code>str_contains</code>, <code>str_starts_with</code>, <code>str_ends_with</code>, and <code>array_key_first</code> only when missing.</p>
+
+<php-snippet blueprint="toolkit-setup" name="php8-strings.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+var_dump( str_starts_with( '/var/www/html', '/var' ) ); // Prefix check.
+var_dump( str_ends_with( 'image.png', '.png' ) ); // Suffix check.
+var_dump( str_contains( 'WordPress Toolkit', 'Toolkit' ) ); // Substring check.
+
+$first_key = array_key_first( array( 'alpha' => 1, 'beta' => 2 ) ); // Key of the array's first element.
+echo "first key: {$first_key}\n";
+</script>
+<script type="text/expected-output">
+bool(true)
+bool(true)
+bool(true)
+first key: alpha
+</script>
+</php-snippet>
+
+<h2 id="refinement-escaping-and-translation-stubs">Refinement: escaping and translation stubs</h2>
+
+<p>Pass-through implementations let you write code that looks WordPressy and runs anywhere.</p>
+
+<php-snippet blueprint="toolkit-setup" name="wp-stubs.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+echo __( 'Hello, world' ) . "\n"; // Comes back unchanged in the expected output.
+echo esc_html( '<script>alert("xss")<\/script>' ) . "\n";
+echo esc_attr( 'a "quoted" value' ) . "\n"; // Double quotes become &quot; in the expected output.
+echo esc_url( 'https://example.com/?a=1&b=2' ) . "\n"; // The ampersand becomes &amp; in the expected output.
+</script>
+<script type="text/expected-output">
+Hello, world
+&lt;script&gt;alert(&quot;xss&quot;)&lt;/script&gt;
+a &quot;quoted&quot; value
+https://example.com/?a=1&amp;b=2
+</script>
+</php-snippet>
+
+<h2 id="refinement-a-simple-filter-chain">Refinement: a simple filter chain</h2>
+
+<p>The hook system is a real implementation of the WordPress filter API: registered callbacks get applied in priority order, and each one transforms the running value.</p>
+
+<php-snippet blueprint="toolkit-setup" name="filter-chain.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+add_filter( 'sanitize_title', 'trim' ); // No explicit priority is passed for any of the three callbacks.
+add_filter( 'sanitize_title', 'strtolower' );
+add_filter( 'sanitize_title', function ( $title ) {
+	return preg_replace( '/\s+/', '-', $title ); // Replace each whitespace run with a single hyphen.
+} );
+
+echo apply_filters( 'sanitize_title', '  My Post Title  ' ) . "\n"; // Runs the value through the registered callbacks.
+</script>
+<script type="text/expected-output">
+my-post-title
+</script>
+</php-snippet>
+
+<h2 id="refinement-priority-ordering-and-multi-arg-passing">Refinement: priority ordering and multi-arg passing</h2>
+
+<p>Lower priority numbers run first. The fourth argument to <code>add_filter</code> sets how many arguments the callback receives: the filtered value plus any extra context values passed to <code>apply_filters</code>.</p>
+
+<php-snippet blueprint="toolkit-setup" name="priority-args.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+add_filter( 'render_price', function ( $html, $price, $currency ) { // Priority 30: runs last.
+	return $html . " ({$currency} markup)";
+}, 30, 3 );
+
+add_filter( 'render_price', function ( $html, $price ) { // Priority 10: runs first; accepts only two arguments.
+	return "<strong>{$html}</strong>";
+}, 10, 2 );
+
+add_filter( 'render_price', function ( $html, $price, $currency ) {
+	// Priority 20: runs second and appends the currency code.
+	return $html . " {$currency}";
+}, 20, 3 );
+
+echo apply_filters( 'render_price', '19.99', 19.99, 'EUR' ) . "\n"; // Filtered value first, then two context values.
+</script>
+<script type="text/expected-output">
+<strong>19.99</strong> EUR (EUR markup)
+</script>
+</php-snippet>
+
+<h2 id="refinement-hook-based-extension-points-in-standalone-libraries">Refinement: hook-based extension points in standalone libraries</h2>
+
+<p>Use <code>do_action</code> and <code>apply_filters</code> as cheap extension points in your own code, without depending on WordPress.</p>
+
+<php-snippet blueprint="toolkit-setup" name="library-hooks.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+class ImportPipeline { // Example library class that exposes two hook points.
+	public function process( array $row ) {
+		$row = apply_filters( 'import_pipeline_normalize', $row ); // Let registered filters rewrite the row.
+		do_action( 'import_pipeline_row_processed', $row ); // Notify listeners; no return value is used.
+		return $row;
+	}
+}
+
+add_filter( 'import_pipeline_normalize', function ( $row ) {
+	$row['email'] = strtolower( trim( $row['email'] ) ); // Trim surrounding whitespace, then lowercase.
+	return $row;
+} );
+
+$log = array();
+add_action( 'import_pipeline_row_processed', function ( $row ) use ( &$log ) { // $log is captured by reference so the closure can append to it.
+	$log[] = $row['email'];
+} );
+
+$pipeline = new ImportPipeline();
+$pipeline->process( array( 'email' => '  USER@EXAMPLE.COM  ' ) );
+$pipeline->process( array( 'email' => 'OTHER@example.com' ) );
+
+echo implode( "\n", $log ) . "\n"; // One logged email per line.
+</script>
+<script type="text/expected-output">
+user@example.com
+other@example.com
+</script>
+</php-snippet>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="html.html"><strong>HTML</strong></a><span>Run WordPress-shaped escaping and translation helpers beside HTML processors.</span></li>
+	<li><a href="blockparser.html"><strong>BlockParser</strong></a><span>Keep standalone block tooling familiar outside WordPress.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/xml.html b/docs/reference/xml.html
new file mode 100644
index 000000000..89a3bdfeb
--- /dev/null
+++ b/docs/reference/xml.html
@@ -0,0 +1,230 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>XML — PHP Toolkit reference</title>
+<meta name="description" content="A streaming, namespace-aware XML processor in pure PHP. Read and modify huge feeds, WXR exports, ePub manifests, and Office Open XML parts without ever loading the document into memory and without depending on libxml2.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+	<aside class="sidebar" aria-label="Reference navigation">
+		<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+		<nav class="toc" aria-label="Table of contents"></nav>
+		<details class="components-nav" open>
+			<summary>All components</summary>
+			<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li class="current"><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+			</ol>
+		</details>
+	</aside>
+	<article class="content">
+
+<h1>XML</h1>
+
+<p class="lede">A streaming, namespace-aware XML processor in pure PHP. Read and modify huge feeds, WXR exports, ePub manifests, and Office Open XML parts without ever loading the document into memory and without depending on <code>libxml2</code>.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/xml</code></pre>
+
+<p><code>SimpleXMLElement</code> and <code>DOMDocument</code> both need <code>libxml2</code> and both build a complete in-memory tree. <code>XMLProcessor</code> walks the document forward as a cursor, keeps modifications in a side buffer, and emits the full updated XML with <code>get_updated_xml()</code> only when you ask for it.</p><p>This design came from WordPress-scale documents such as WXR exports. A migration may only need to rewrite <code>wp:attachment_url</code> values or bump a feed attribute, so the processor optimizes for targeted cursor edits instead of a full validating XML stack.</p>
+
+<h2 id="a-minimal-example">A minimal example</h2>
+
+<p>Find each <code>&lt;book&gt;</code>, read its price, write a new one, emit the updated document.</p>
+
+<php-snippet blueprint="toolkit-setup" name="bump-prices.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\XML\XMLProcessor;
+
+$xml = '<catalog>'
+	. '<book sku="A1" price="29.99"><title>PHP Internals</title></book>'
+	. '<book sku="A2" price="14.50"><title>WordPress at Scale</title></book>'
+	. '</catalog>';
+
+$p = XMLProcessor::create_from_string( $xml );
+while ( $p->next_tag( 'book' ) ) { // Visit each <book> tag in turn.
+	$old = (float) $p->get_attribute( '', 'price' ); // First argument is the namespace name; '' is passed here.
+	$new = number_format( $old * 1.10, 2, '.', '' ); // +10%, two decimals, "." separator, no thousands separator.
+	$p->set_attribute( '', 'price', $new );
+}
+
+echo $p->get_updated_xml(); // Emit the document with the attribute edits applied.
+</script>
+<script type="text/expected-output">
+<catalog><book sku="A1" price="32.99"><title>PHP Internals</title></book><book sku="A2" price="15.95"><title>WordPress at Scale</title></book></catalog>
+</script>
+</php-snippet>
+
+<h2 id="refinement-read-namespaced-attributes-from-a-wxr-export">Refinement: read namespaced attributes from a WXR export</h2>
+
+<p>WordPress's WXR commonly uses <code>wp:</code>, <code>dc:</code>, and <code>content:</code> prefixes bound to namespace names such as <code>http://wordpress.org/export/1.2/</code>. Pass that expanded namespace name, not the prefix; the processor handles whichever prefix the document actually uses.</p>
+
+<php-snippet blueprint="toolkit-setup" name="wxr-namespaces.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\XML\XMLProcessor;
+
+$wxr = '<?xml version="1.0"?>'
+	. '<rss xmlns:wp="http://wordpress.org/export/1.2/" xmlns:dc="http://purl.org/dc/elements/1.1/">'
+	. '<channel><item>'
+	. '<title>Hello World</title>'
+	. '<dc:creator>admin</dc:creator>'
+	. '<wp:post_id>42</wp:post_id>'
+	. '<wp:status>publish</wp:status>'
+	. '</item></channel></rss>';
+
+$WP = 'http://wordpress.org/export/1.2/'; // Namespace name bound to the wp: prefix above.
+$DC = 'http://purl.org/dc/elements/1.1/'; // Namespace name bound to the dc: prefix above.
+
+$p = XMLProcessor::create_from_string( $wxr );
+while ( $p->next_tag( 'item' ) ) {
+	while ( $p->next_token() ) {
+		if ( $p->is_tag_closer() && 'item' === $p->get_tag_local_name() ) break; // Stop at the closing item tag.
+		if ( ! $p->is_tag_opener() ) continue; // Only opening tags start a new output line.
+		$ns = $p->get_tag_namespace();
+		$local = $p->get_tag_local_name();
+		$prefix = ( $WP === $ns ) ? 'wp/' : ( ( $DC === $ns ) ? 'dc/' : '' ); // Label chosen by namespace name, not by the written prefix.
+		echo "{$prefix}{$local}: ";
+		while ( $p->next_token() && '#text' !== $p->get_token_name() ) {} // Advance until a text token (or the end of input).
+		echo trim( $p->get_modifiable_text() ) . "\n";
+	}
+}
+</script>
+<script type="text/expected-output">
+title: Hello World
+dc/creator: admin
+wp/post_id: 42
+wp/status: publish
+</script>
+</php-snippet>
+
+<h2 id="refinement-rewrite-urls-across-an-entire-wxr-export">Refinement: rewrite URLs across an entire WXR export</h2>
+
+<p>Large WXR exports can hold many URLs in <code>&lt;link&gt;</code>, <code>&lt;guid&gt;</code>, and post content. Streaming the file lets you rewrite large exports without loading the whole XML document into memory.</p>
+
+<php-snippet blueprint="toolkit-setup" name="rewrite-wxr-urls.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\XML\XMLProcessor;
+
+$wxr = '<?xml version="1.0"?><rss xmlns:wp="http://wordpress.org/export/1.2/"><channel>'
+	. '<wp:base_site_url>https://old.example.com</wp:base_site_url>'
+	. '<item><link>https://old.example.com/2024/post-1</link>'
+	. '<guid>https://old.example.com/?p=1</guid></item>'
+	. '</channel></rss>';
+
+$from = 'https://old.example.com'; // Origin to search for.
+$to   = 'https://new.example.com'; // Replacement origin.
+
+$p = XMLProcessor::create_from_string( $wxr );
+$rewritten = 0; // Number of text nodes that were changed.
+
+while ( $p->next_token() ) {
+	if ( '#text' !== $p->get_token_name() ) continue; // Only text nodes are inspected.
+	$text = $p->get_modifiable_text();
+	if ( false === strpos( $text, $from ) ) continue; // Leave text without the old origin untouched.
+	$p->set_modifiable_text( str_replace( $from, $to, $text ) );
+	$rewritten++;
+}
+
+echo "rewrote {$rewritten} text nodes\n\n";
+echo $p->get_updated_xml(); // Emit the document with the text edits applied.
+</script>
+<script type="text/expected-output">
+rewrote 3 text nodes
+
+<?xml version="1.0"?><rss xmlns:wp="http://wordpress.org/export/1.2/"><channel><wp:base_site_url>https://new.example.com</wp:base_site_url><item><link>https://new.example.com/2024/post-1</link><guid>https://new.example.com/?p=1</guid></item></channel></rss>
+</script>
+</php-snippet>
+
+<h2 id="refinement-parse-opml-to-extract-feed-urls">Refinement: parse OPML to extract feed URLs</h2>
+
+<p>OPML is the format Feedly and many readers use to import/export feed lists. Flat, attribute-heavy XML — exactly what a tag processor handles best.</p>
+
+<php-snippet blueprint="toolkit-setup" name="opml.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\XML\XMLProcessor;
+
+$opml = '<?xml version="1.0"?><opml version="2.0"><head><title>My Feeds</title></head>'
+	. '<body>'
+	. '<outline text="Tech"><outline text="Hacker News" type="rss" xmlUrl="https://news.ycombinator.com/rss"/>'
+	. '<outline text="LWN" type="rss" xmlUrl="https://lwn.net/headlines/rss"/></outline>'
+	. '<outline text="WordPress" type="rss" xmlUrl="https://wordpress.org/news/feed/"/>'
+	. '</body></opml>';
+
+$p = XMLProcessor::create_from_string( $opml );
+while ( $p->next_tag( 'outline' ) ) { // Visits nested outlines as well as top-level ones.
+	$url = $p->get_attribute( '', 'xmlUrl' );
+	if ( null === $url ) continue; // Skip outlines without an xmlUrl, such as the "Tech" group.
+	echo $p->get_attribute( '', 'text' ) . "\t" . $url . "\n"; // Tab-separated: label, feed URL.
+}
+</script>
+<script type="text/expected-output">
+Hacker News	https://news.ycombinator.com/rss
+LWN	https://lwn.net/headlines/rss
+WordPress	https://wordpress.org/news/feed/
+</script>
+</php-snippet>
+
+<h2 id="pitfalls">Pitfalls</h2>
+
+<aside class="callout pitfall">namespace-aware methods use the namespace name declared in <code>xmlns</code>, not the prefix written in the tag. In WXR, <code>get_attribute( 'wp', 'status' )</code> looks for a namespace literally named <code>wp</code>; for the usual WXR declaration you want <code>get_attribute( 'http://wordpress.org/export/1.2/', 'status' )</code>.</aside>
+
+<aside class="callout pitfall">in streaming mode <code>next_tag()</code> can return false because input ran out, not because the document ended. Check <code>is_paused_at_incomplete_input()</code> before assuming you're done.</aside>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="dataliberation.html"><strong>DataLiberation</strong></a><span>Read and write WXR-sized WordPress exports as entities.</span></li>
+	<li><a href="encoding.html"><strong>Encoding</strong></a><span>Validate and scrub text before strict XML processing.</span></li>
+	<li><a href="bytestream.html"><strong>ByteStream</strong></a><span>Keep large XML reads incremental.</span></li>
+</ul>
+
+	</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/docs/reference/zip.html b/docs/reference/zip.html
new file mode 100644
index 000000000..cffff164c
--- /dev/null
+++ b/docs/reference/zip.html
@@ -0,0 +1,391 @@
+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<meta name="viewport" content="width=device-width, initial-scale=1">
+<title>Zip — PHP Toolkit reference</title>
+<meta name="description" content="Read and write ZIP archives in pure PHP. Stream entries one at a time, build EPUBs and .docx files, mount archives as filesystems — without libzip or ZipArchive.">
+<link rel="stylesheet" href="../assets/style.css?v=20260429-rewrite">
+<script type="module" src="https://playground.wordpress.net/php-code-snippet.js"></script>
+<script id="toolkit-setup" type="application/json"></script>
+<script src="../assets/page.js?v=20260429-rewrite" defer></script>
+</head>
+<body>
+<header class="site">
+	<a class="brand" href="../">PHP Toolkit</a>
+	<nav>
+		<a href="../learn/">Learn</a>
+		<a href="./">Reference</a>
+		<a class="github" href="https://github.com/WordPress/php-toolkit">GitHub</a>
+	</nav>
+</header>
+
+<div class="layout">
+
+<aside class="sidebar" aria-label="Reference navigation">
+	<button class="sidebar-toggle" type="button" aria-expanded="false">On this page ▾</button>
+	<nav class="toc" aria-label="Table of contents"></nav>
+	<details class="components-nav" open>
+		<summary>All components</summary>
+		<ol>
+			<li><a href="html.html">HTML</a></li>
+			<li class="current"><a href="zip.html">Zip</a></li>
+			<li><a href="bytestream.html">ByteStream</a></li>
+			<li><a href="filesystem.html">Filesystem</a></li>
+			<li><a href="blockparser.html">BlockParser</a></li>
+			<li><a href="markdown.html">Markdown</a></li>
+			<li><a href="xml.html">XML</a></li>
+			<li><a href="encoding.html">Encoding</a></li>
+			<li><a href="dataliberation.html">DataLiberation</a></li>
+			<li><a href="git.html">Git</a></li>
+			<li><a href="merge.html">Merge</a></li>
+			<li><a href="httpclient.html">HttpClient</a></li>
+			<li><a href="httpserver.html">HttpServer</a></li>
+			<li><a href="corsproxy.html">CORSProxy</a></li>
+			<li><a href="cli.html">CLI</a></li>
+			<li><a href="polyfill.html">Polyfill</a></li>
+			<li><a href="blueprints.html">Blueprints</a></li>
+			<li><a href="coding-standards.html">ToolkitCodingStandards</a></li>
+		</ol>
+	</details>
+</aside>
+
+<article class="content">
+
+<h1>Zip</h1>
+
+<p class="lede">Read and write ZIP archives in pure PHP — no <code>libzip</code>, no <code>ZipArchive</code> extension, no shelling out. The decoder is pull-based, so listing the central directory of a 2 GB archive costs roughly the size of the directory itself; the encoder writes one entry at a time into any byte sink.</p>
+
+<pre><code class="install">composer require wp-php-toolkit/zip</code></pre>
+
+<p>Common PHP ZIP workflows assume <code>ZipArchive</code> is available. It often isn't: shared hosts disable it, WebAssembly runtimes don't have it, and Playground's browser-side PHP can't shell out to a <code>zip</code> binary either. The Zip component reimplements the readable subset of the format in pure PHP — Stored and Deflate compression, Zip64 for archives over 4 GB, central-directory parsing — and exposes it through three layers, ordered from highest to lowest level.</p>
+
+<p>The highest-level type is <code>ZipFilesystem</code>: an archive presented through the toolkit's <code>Filesystem</code> interface, so you call <code>get_contents()</code> and <code>ls()</code> the same way you would on a local directory or an in-memory tree. Below that, <code>ZipDecoder</code> and <code>ZipEncoder</code> stream individual entries when you care about the format itself — building an EPUB whose <code>mimetype</code> entry must be stored uncompressed and first, repacking an archive while modifying one file. At the bottom, <code>FileEntry</code> is the small struct that names a path, a compression method, and a body reader.</p>
+
+<h2 id="minimal">A minimal example</h2>
+
+<p>Wrap a ZIP file as a filesystem and read one entry. This is the shape every later refinement is built on.</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-zip-minimal.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+
+// Build a tiny archive on disk.
+$path = tempnam( sys_get_temp_dir(), 'demo' ) . '.zip';
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+$enc->append_file( new FileEntry( array(
+	'path'               => 'readme.txt',
+	'compression_method' => ZipDecoder::COMPRESSION_NONE,
+	'body_reader'        => new MemoryPipe( 'Hello from inside the zip.' ),
+) ) );
+$enc->close();
+$out->close_writing();
+
+// Read it back as a filesystem.
+$zip = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+echo $zip->get_contents( 'readme.txt' );
+</script>
+<script type="text/expected-output">
+Hello from inside the zip.
+</script>
+</php-snippet>
+
+<p>Three things to notice. The encoder takes a <code>ByteWriteStream</code> sink — here a file, but it could equally be an HTTP response body, an in-memory buffer, or another component's input. Each entry's body is itself a stream — <code>MemoryPipe</code> here, but for large files you'd pass a <code>FileReadStream</code> and the encoder would stream it straight from disk without buffering the whole entry in memory. And reading is one line: <code>ZipFilesystem::create()</code> wraps the byte reader, parses the central directory, and gives you the standard <code>Filesystem</code> interface.</p>
+
+<h2 id="epub">Refinement: build an EPUB</h2>
+
+<p>EPUB is a ZIP archive with one rule the spec is strict about: the <code>mimetype</code> entry must be the first entry in the file, and it must be stored uncompressed. Everything else is up to you. The Zip component lets you express that constraint directly:</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-zip-epub.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+
+$path = tempnam( sys_get_temp_dir(), 'book' ) . '.epub';
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+
+// 1. mimetype MUST come first, MUST be uncompressed.
+$enc->append_file( new FileEntry( array(
+	'path'               => 'mimetype',
+	'compression_method' => ZipDecoder::COMPRESSION_NONE,
+	'body_reader'        => new MemoryPipe( 'application/epub+zip' ),
+) ) );
+
+// 2. Everything else compresses normally.
+$container = '<?xml version="1.0"?>'
+	. '<container version="1.0" xmlns="urn:oasis:names:tc:opendocument:xmlns:container">'
+	. '<rootfiles><rootfile full-path="EPUB/package.opf" media-type="application/oebps-package+xml"/></rootfiles>'
+	. '</container>';
+
+foreach ( array(
+	'META-INF/container.xml' => $container,
+	'EPUB/package.opf'       => '<package version="3.0" xmlns="http://www.idpf.org/2007/opf"><metadata/><manifest/><spine/></package>',
+	'EPUB/chapter1.xhtml'    => '<html xmlns="http://www.w3.org/1999/xhtml"><body><h1>Chapter 1</h1></body></html>',
+) as $name => $body ) {
+	$enc->append_file( new FileEntry( array(
+		'path'               => $name,
+		'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+		'body_reader'        => new MemoryPipe( $body ),
+	) ) );
+}
+$enc->close();
+$out->close_writing();
+
+$zip = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+printf( "mimetype: %s\nsize: %d bytes\n", $zip->get_contents( 'mimetype' ), filesize( $path ) );
+</script>
+</php-snippet>
+
+<aside class="callout pitfall">
+	<strong>Pitfall — EPUB validators reject compressed mimetypes.</strong> If you mark the <code>mimetype</code> entry as <code>COMPRESSION_DEFLATE</code>, the file will look right to ad-hoc unzippers but fail validation in real e-readers. Use <code>COMPRESSION_NONE</code> for that one entry and <code>COMPRESSION_DEFLATE</code> for the rest.
+</aside>
+
+<h2 id="stream">Refinement: stream a large entry</h2>
+
+<p>Calling <code>get_contents( 'data.csv' )</code> on a 500 MB CSV inside a ZIP would buffer 500 MB of inflated data into a single PHP string. <code>open_read_stream()</code> returns a pull-based reader instead, so you can process the entry in chunks:</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-zip-stream.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+
+$path = tempnam( sys_get_temp_dir(), 'big' ) . '.zip';
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+$enc->append_file( new FileEntry( array(
+	'path'               => 'data.csv',
+	'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+	'body_reader'        => new MemoryPipe( str_repeat( "id,value\n1,foo\n2,bar\n", 5000 ) ),
+) ) );
+$enc->close();
+$out->close_writing();
+
+$zip    = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+$stream = $zip->open_read_stream( 'data.csv' );
+
+$rows = 0; $tail = '';
+while ( ! $stream->reached_end_of_data() ) {
+	$n = $stream->pull( 8192 );
+	if ( 0 === $n ) break;
+	$chunk  = $tail . $stream->consume( $n );
+	$lines  = explode( "\n", $chunk );
+	$tail   = array_pop( $lines );
+	$rows  += count( $lines );
+}
+printf( "parsed %d rows in 8 KB chunks\n", $rows );
+</script>
+</php-snippet>
+
+<aside class="callout pitfall">
+	<strong>Pitfall — one entry stream at a time.</strong> The decoder advances through the archive linearly. Open one read stream, drain or close it, then open the next. The behavior of holding two open simultaneously is undefined.
+</aside>
+
+<h2 id="repack">Refinement: repack an archive</h2>
+
+<p>Modifying one entry in place is impossible at the format level — the central directory points at byte offsets, so changing any entry's compressed size invalidates everything after it. The pragmatic answer is repack: stream the source into a new archive, swapping the entry you want to change.</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-zip-repack.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+
+// Build a source archive.
+$src_path = tempnam( sys_get_temp_dir(), 'orig' ) . '.zip';
+$src_out  = FileWriteStream::from_path( $src_path, 'truncate' );
+$src_enc  = new ZipEncoder( $src_out );
+foreach ( array(
+	'config.json'   => '{"debug":false,"version":"1.0"}',
+	'app/index.php' => '<?php echo "hello";',
+) as $name => $body ) {
+	$src_enc->append_file( new FileEntry( array(
+		'path'               => $name,
+		'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+		'body_reader'        => new MemoryPipe( $body ),
+	) ) );
+}
+$src_enc->close();
+$src_out->close_writing();
+
+// Repack with config.json swapped.
+$source   = ZipFilesystem::create( FileReadStream::from_path( $src_path ) );
+$dst_path = tempnam( sys_get_temp_dir(), 'repacked' ) . '.zip';
+$dst_out  = FileWriteStream::from_path( $dst_path, 'truncate' );
+$dst_enc  = new ZipEncoder( $dst_out );
+
+$dirs = array( '/' );
+while ( $dirs ) {
+	$dir = array_shift( $dirs );
+	foreach ( $source->ls( $dir ) as $name ) {
+		$path = rtrim( $dir, '/' ) . '/' . $name;
+		if ( $source->is_dir( $path ) ) { $dirs[] = $path; continue; }
+		$rel  = ltrim( $path, '/' );
+		$body = ( 'config.json' === $rel )
+			? '{"debug":true,"version":"1.0.1"}'
+			: $source->get_contents( $rel );
+		$dst_enc->append_file( new FileEntry( array(
+			'path'               => $rel,
+			'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+			'body_reader'        => new MemoryPipe( $body ),
+		) ) );
+	}
+}
+$dst_enc->close();
+$dst_out->close_writing();
+
+$repacked = ZipFilesystem::create( FileReadStream::from_path( $dst_path ) );
+echo "new config: " . $repacked->get_contents( 'config.json' ) . "\n";
+</script>
+</php-snippet>
+
+<h2 id="zip-slip">Refinement: defend against zip-slip</h2>
+
+<p>A malicious archive can name an entry <code>../../etc/passwd</code> and trick a naive extractor into writing outside the destination. Run every entry path through <code>ZipDecoder::sanitize_path()</code> before extraction:</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-zip-slip.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\Zip\ZipDecoder;
+
+foreach ( array(
+	'../../etc/passwd',
+	'./safe/path.txt',
+	'a/../../b/secret',
+	'a//b///c.txt',
+	'../../../../root/.ssh/authorized_keys',
+) as $name ) {
+	printf( "%-45s => %s\n", $name, ZipDecoder::sanitize_path( $name ) );
+}
+</script>
+</php-snippet>
+
+<h2 id="composing">Refinement: pipe entries into another filesystem</h2>
+
+<p>The whole point of <code>ZipFilesystem</code> implementing the <code>Filesystem</code> interface is composition. <code>copy_between_filesystems()</code> walks one filesystem and writes its contents into another — so unpacking a ZIP into an in-memory tree, where you can validate or edit before committing to disk, is one helper call:</p>
+
+<php-snippet blueprint="toolkit-setup" name="ref-zip-compose.php">
+<script type="application/x-php">
+<?php
+require '/wordpress/wp-content/php-toolkit/vendor/autoload.php';
+
+use WordPress\ByteStream\MemoryPipe;
+use WordPress\ByteStream\ReadStream\FileReadStream;
+use WordPress\ByteStream\WriteStream\FileWriteStream;
+use WordPress\Filesystem\InMemoryFilesystem;
+use WordPress\Zip\FileEntry;
+use WordPress\Zip\ZipDecoder;
+use WordPress\Zip\ZipEncoder;
+use WordPress\Zip\ZipFilesystem;
+use function WordPress\Filesystem\copy_between_filesystems;
+
+$path = tempnam( sys_get_temp_dir(), 'app' ) . '.zip';
+$out  = FileWriteStream::from_path( $path, 'truncate' );
+$enc  = new ZipEncoder( $out );
+foreach ( array(
+	'app/index.php' => '<?php echo "ok";',
+	'app/style.css' => 'body{margin:0}',
+) as $name => $body ) {
+	$enc->append_file( new FileEntry( array(
+		'path'               => $name,
+		'compression_method' => ZipDecoder::COMPRESSION_DEFLATE,
+		'body_reader'        => new MemoryPipe( $body ),
+	) ) );
+}
+$enc->close();
+$out->close_writing();
+
+$zip = ZipFilesystem::create( FileReadStream::from_path( $path ) );
+$mem = InMemoryFilesystem::create();
+copy_between_filesystems( array(
+	'source_filesystem' => $zip,
+	'source_path'       => '/',
+	'target_filesystem' => $mem,
+	'target_path'       => '/',
+) );
+$mem->put_contents( '/app/VERSION', '1.0.0' );
+echo "added VERSION; index.php is still: " . $mem->get_contents( '/app/index.php' );
+</script>
+</php-snippet>
+
+<h2 id="when">When to use which type</h2>
+
+<table class="api-table">
+<tr><th>Use</th><th>For</th></tr>
+<tr><td><code>ZipFilesystem::create()</code></td><td>Reading. You want <code>get_contents()</code>, <code>ls()</code>, <code>is_dir()</code> over a ZIP. The most common case.</td></tr>
+<tr><td><code>ZipEncoder</code></td><td>Writing. Stream entries into any <code>ByteWriteStream</code> sink. Required when format rules matter (EPUB, .docx).</td></tr>
+<tr><td><code>ZipDecoder</code></td><td>Low-level read access to the central directory and individual entry headers. Most code reaches for <code>ZipFilesystem</code> instead.</td></tr>
+<tr><td><code>open_read_stream()</code> on a ZipFilesystem</td><td>Inflating a single large entry without buffering it whole in memory.</td></tr>
+<tr><td><code>copy_between_filesystems()</code></td><td>Moving entries from a ZIP into another filesystem (memory, local, SQLite).</td></tr>
+</table>
+
+<h2 id="pitfalls">Pitfalls</h2>
+
+<aside class="callout pitfall">
+	<strong>Updating an entry in place is impossible.</strong> The central directory points at byte offsets — change one entry's compressed size and every later offset shifts. Repack into a new archive instead.
+</aside>
+
+<aside class="callout pitfall">
+	<strong>Never extract entry paths verbatim.</strong> Always run paths through <code>ZipDecoder::sanitize_path()</code>. Without it, a hostile archive can write outside the destination directory.
+</aside>
+
+<aside class="callout pitfall">
+	<strong>One entry stream at a time.</strong> The decoder is positional. Drain or close one entry stream before opening the next.
+</aside>
+
+<aside class="callout pitfall">
+	<strong>Encrypted archives aren't supported.</strong> If you need to read AES-encrypted ZIPs, this isn't the component. The file format technically allows encryption, but the toolkit deliberately excludes it because the implementation surface is large and the use case is rare in WordPress contexts.
+</aside>
+
+<h2 id="see-also">See also</h2>
+
+<ul class="related-components">
+	<li><a href="../learn/02-streaming-archives.html"><strong>Tutorial — Streaming archives</strong></a><span>The chapter that builds the importer's input on top of <code>ZipFilesystem</code>.</span></li>
+	<li><a href="filesystem.html"><strong>Filesystem</strong></a><span>The interface ZipFilesystem implements. Local, memory, SQLite backends share the same API.</span></li>
+	<li><a href="bytestream.html"><strong>ByteStream</strong></a><span>The pull/peek/consume primitives the encoder and decoder use as their input and output.</span></li>
+	<li><a href="httpclient.html"><strong>HttpClient</strong></a><span>Stream a downloaded ZIP into ZipFilesystem without ever touching disk.</span></li>
+</ul>
+
+</article>
+</div>
+
+<footer class="site">
+	<a href="https://github.com/WordPress/php-toolkit">WordPress/php-toolkit</a>
+</footer>
+</body>
+</html>
diff --git a/package.json b/package.json
index d340c9b20..74f02b551 100644
--- a/package.json
+++ b/package.json
@@ -21,5 +21,6 @@
   "bugs": {
     "url": "https://github.com/WordPress/php-toolkit/issues"
   },
-  "homepage": "https://github.com/WordPress/php-toolkit#readme"
+  "homepage": "https://github.com/WordPress/php-toolkit#readme",
+  "packageManager": "npm@11.6.2+sha512.ee22b335fcbc95662cdf3ab8a053daf045d9cf9c6df6040d28965abb707512b2c16fa6c5eec049d34c74f78f390cebd14f697919eadb97756564d4f9eccc4954"
 }
diff --git a/phpcs.xml b/phpcs.xml
index c20486124..02ed3994a 100644
--- a/phpcs.xml
+++ b/phpcs.xml
@@ -11,6 +11,7 @@
     <exclude-pattern>/plugins/url-updater/</exclude-pattern>
     <exclude-pattern>/bin/build-phar</exclude-pattern>
     <exclude-pattern>/examples/</exclude-pattern>
+    <exclude-pattern>/docs/</exclude-pattern>
     <exclude-pattern>rector.php</exclude-pattern>
     <exclude-pattern>components/CORSProxy/cors-proxy-functions.php</exclude-pattern>
     <exclude-pattern>components/Markdown/bin/build/*</exclude-pattern>

Style	Use when	Tradeoff
`consume_all()` or `json()`	Small HTML, JSON, or API responses.	Buffers the full body.
`Client::await_next_event()`	Progress bars, streaming to disk, queues, failure handling.	You own the event loop.
Filesystem and parser composition	Remote ZIPs, WXR files, import pipelines.	Requires a stream-aware consumer.
Transport	What it does	When to choose it
`auto`	Uses curl when loaded, otherwise sockets.	Application default. Best when you want portability and the fastest available backend.
`sockets`	Uses PHP stream sockets, no curl extension.	Tests, Playground-style runtimes, hosts where curl is unavailable, or proving the dependency-free path works.
`curl`	Uses the curl extension.	Hosts where curl is available and you want to compare behavior or performance explicitly.
Chapter 1	→	`clean_post_html()` using `WP_HTML_Tag_Processor`: lazy-load images, rewrite URLs, strip scripts, all in one pass.
Chapter 2	→	Read the input ZIP through `ZipFilesystem`, stage it in `InMemoryFilesystem`, defend against zip-slip with `ZipDecoder::sanitize_path()`.
Chapter 3	→	Convert each post with `MarkdownConsumer`, audit the output with `WP_Block_Parser`, stream the WXR with `WXRWriter`.
Chapter 4	→	Frontload images with `HttpClient` through a sliding-window event loop; mount remote archives with `SeekableRequestReadStream`.
Use	For
`WP_HTML_Tag_Processor`	Attribute rewriting, sanitization, finding tags by name. Forward-only walks. Anything where speed and byte-honesty matter more than context.
`WP_HTML_Processor::create_fragment()`	Queries by ancestry (`breadcrumbs`), heading outline extraction, anything that needs to know "is this tag inside that one."
`WP_HTML_Decoder::decode_text_node()`	Turning entity-encoded text (`AT&amp;T`) back into raw text correctly. Implements the HTML5 entity algorithm — don't roll your own.
`WP_HTML_Decoder::attribute_starts_with()`	Safe URL-prefix checks that respect encoded characters (`java script:`). The classic `strpos` approach misses these.
Use	For
`ZipFilesystem::create()`	Reading. You want `get_contents()`, `ls()`, `is_dir()` over a ZIP. The most common case.
`ZipEncoder`	Writing. Stream entries into any `ByteWriteStream` sink. Required when format rules matter (EPUB, .docx).
`ZipDecoder`	Low-level read access to the central directory and individual entry headers. Most code reaches for `ZipFilesystem` instead.
`open_read_stream()` on a ZipFilesystem	Inflating a single large entry without buffering it whole in memory.
`copy_between_filesystems()`	Moving entries from a ZIP into another filesystem (memory, local, SQLite).