From 5e95bf04120b948e5ccb3bb05dd48e1f6962baab Mon Sep 17 00:00:00 2001 From: prk-Jr Date: Wed, 18 Feb 2026 21:33:09 +0530 Subject: [PATCH 01/13] Add Server-Timing instrumentation and optimization plan Introduce RequestTimer for per-request phase tracking (init, backend, process, total) exposed via Server-Timing response headers. Add benchmark tooling with --profile mode for collecting timing data. Document phased optimization plan covering streaming architecture, code-level fixes, and open design questions for team review. --- OPTIMIZATION.md | 468 ++++++++++++++++++++++++++ crates/common/src/lib.rs | 1 + crates/common/src/publisher.rs | 6 + crates/common/src/request_timer.rs | 151 +++++++++ crates/fastly/src/main.rs | 12 +- scripts/benchmark.sh | 516 +++++++++++++++++++++++++++++ 6 files changed, 1153 insertions(+), 1 deletion(-) create mode 100644 OPTIMIZATION.md create mode 100644 crates/common/src/request_timer.rs create mode 100755 scripts/benchmark.sh diff --git a/OPTIMIZATION.md b/OPTIMIZATION.md new file mode 100644 index 00000000..817696d7 --- /dev/null +++ b/OPTIMIZATION.md @@ -0,0 +1,468 @@ +# Trusted Server Optimization Plan + +## Status + +| Item | Status | +|------|--------| +| Production timing instrumentation (`RequestTimer`) | **Implemented** (on `feat/optimize-ts`, not yet deployed) | +| Benchmark tooling (`scripts/benchmark.sh`) | **Implemented** (includes `--profile` mode) | +| Viceroy baseline measurements | **Complete** | +| Staging external TTFB baseline | **Complete** (against staging deployment) | +| Server-Timing production data | **Blocked** — needs `feat/optimize-ts` deployed to staging | +| Streaming architecture (`stream_to_client`) | **Planned** — see Phase 2 | +| Code-level optimizations | **Planned** — see Phase 1 | + +--- + +## Key Finding: Streaming to Client IS Possible + +The Fastly Compute SDK provides `Response::stream_to_client()` which returns a `StreamingBody` handle that implements `std::io::Write`. 
Headers are sent immediately and body chunks stream as they're written. + +```rust +// Current: fully buffered (no bytes reach client until everything is done) +let body = response.take_body(); +let mut output = Vec::new(); +pipeline.process(body, &mut output)?; // blocks until complete +response.set_body(Body::from(output)); // only NOW does client get anything +return Ok(response); + +// Possible: streaming (headers sent immediately, body chunks as processed) +let body = response.take_body(); +let mut streaming = response.stream_to_client(); // headers sent NOW +pipeline.process(body, &mut streaming)?; // each write() → client +streaming.finish()?; +``` + +This changes the optimization strategy — **time-to-last-byte (TTLB) and peak memory CAN be significantly reduced**. TTFB itself is still gated by the Fastly platform floor (~200ms) plus backend response time, but body bytes start reaching the client as soon as the first chunk is processed instead of waiting for the entire response to be buffered. + +### Compatibility with `#[fastly::main]` — NEEDS SPIKE + +`stream_to_client()` consumes the Response and starts sending. The Fastly SDK enforces that only **one response** is sent per request via `assert_single_downstream_response_is_sent()`. The `#[fastly::main]` macro wraps your function and calls `send_to_client()` on the returned `Response` — so if `stream_to_client()` was already called, the macro **will trigger a panic**. + +**This is an unresolved design problem that needs a prototype before committing to the streaming architecture.** + +Possible approaches (all need validation): + +1. **Drop the `#[fastly::main]` macro** — write a raw `main()` that handles the Fastly request lifecycle manually, giving full control over when/how the response is sent. Need to verify the Fastly SDK supports this. +2. 
**Use `std::process::exit(0)` after streaming** — call `stream_to_client()`, process, `finish()`, then `exit(0)` before the macro gets a chance to call `send_to_client()`. Ugly, but may work if Fastly doesn't require cleanup. +3. **Return a sentinel Response** — investigate whether the SDK treats an already-sent response as a no-op instead of panicking. (Current source code suggests it **does** panic — needs testing on actual Fastly Compute, not just source reading.) + +**Action item**: Create a minimal Fastly Compute service that calls `stream_to_client()` and test each approach. This spike should be done **before** any Phase 2 implementation work. + +Non-streaming endpoints (static JS, discovery, auction) continue returning `Response` normally. Only the publisher proxy path (the hot path) would use streaming. + +--- + +## How to Use This Document + +**For any optimization work:** + +1. Run `./scripts/benchmark.sh --save baseline` on `main` +2. Make your change on a branch +3. Rebuild: `fastly compute build` +4. Run `./scripts/benchmark.sh --save branch-name` +5. Compare: `diff benchmark-results/baseline.txt benchmark-results/branch-name.txt` +6. For production: `BENCH_URL=https://your-staging.edgecompute.app ./scripts/benchmark.sh --profile` +7. If the numbers don't improve meaningfully, don't ship it + +--- + +## Baseline Measurements + +### Viceroy (Local Simulator) + +Measured on `main` branch. Value is in **relative comparison between branches**, not absolute values. 
+ +| Endpoint | P50 | P95 | Req/sec | Notes | +|---|---|---|---|---| +| `GET /static/tsjs=tsjs-unified.min.js` | 1.9 ms | 3.1 ms | 4,672 | Pure WASM, no backend | +| `GET /.well-known/trusted-server.json` | 1.3 ms | 1.4 ms | ~770 | Server-side only | +| `GET /` (publisher proxy) | 400 ms | 595 ms | 21 | Proxies to golf.com, 222KB HTML | +| `POST /auction` | 984 ms | 1,087 ms | 9.3 | Calls Prebid + APS backends | + +- **WASM heap**: 3.0-4.1 MB per request +- **Init overhead**: <2ms (settings parse + orchestrator + registry) +- **No cold start pattern** detected in Viceroy + +### Staging (External) + +Measured externally against staging deployment (golf.com proxy), `main` branch (no Server-Timing deployed yet). + +| Endpoint | TTFB | Total | Size | Notes | +|---|---|---|---|---| +| `GET /static/tsjs=tsjs-unified.min.js` | ~204 ms | ~219 ms | 28 KB | No backend, pure platform overhead | +| `GET /` (publisher proxy, golf.com) | ~234 ms | ~441 ms | 230 KB | Backend + processing | +| `GET /.well-known/trusted-server.json` | ~191 ms | - | - | Returns 500 (needs investigation) | + +**Key insight**: Static JS has ~204ms TTFB with zero backend work. This is the **Fastly platform floor** (WASM instantiation + edge routing + TLS). Application code cannot reduce this. The publisher proxy adds only ~30ms TTFB on top — but the full ~441ms total includes waiting for the entire response to be buffered before sending. With streaming, the ~207ms gap between TTFB (234ms) and TTLB (441ms) would shrink because body bytes stream as they're processed instead of being fully buffered. 
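
The P50/P95 figures in the tables above are percentile latencies over raw per-request timings; a nearest-rank percentile is enough to reproduce that kind of summary when comparing branches. A minimal sketch (the `percentile` helper and the sample values are illustrative, not benchmark output):

```rust
/// Nearest-rank percentile over timing samples (milliseconds).
fn percentile(samples: &mut Vec<f64>, p: f64) -> Option<f64> {
    if samples.is_empty() {
        return None;
    }
    samples.sort_by(|a, b| a.partial_cmp(b).unwrap());
    // Nearest-rank: ceil(p/100 * N), clamped to [1, N], then 0-indexed.
    let rank = ((p / 100.0) * samples.len() as f64).ceil() as usize;
    Some(samples[rank.clamp(1, samples.len()) - 1])
}

fn main() {
    // Five illustrative publisher-proxy timings (ms).
    let mut timings = vec![400.0, 380.0, 595.0, 395.0, 410.0];
    println!("p50 = {:?}", percentile(&mut timings, 50.0)); // Some(400.0)
    println!("p95 = {:?}", percentile(&mut timings, 95.0)); // Some(595.0)
}
```
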
+ +--- + +## Implementation Plan + +### Phase 0: Deploy Server-Timing Instrumentation (DONE, needs deploy) + +**Branch**: `feat/optimize-ts` + +Already implemented: +- `RequestTimer` in `crates/common/src/request_timer.rs` — tracks `init`, `backend`, `process`, `total` phases +- `Server-Timing` header emitted on every response +- Wired into `main.rs` and `publisher.rs` +- `scripts/benchmark.sh --profile` mode to collect and report Server-Timing data + +**Action**: Deploy `feat/optimize-ts` to staging, then run: +```bash +BENCH_URL=https://.edgecompute.app ./scripts/benchmark.sh --profile +``` + +This gives us the real `init`/`backend`/`process` split for golf.com requests. + +**Conflict with Phase 2 streaming**: The `Server-Timing` header is currently set **after** response processing completes (line 147 of `main.rs`), which includes `backend` and `process` phase durations. When we switch to `stream_to_client()` in Phase 2, headers are sent **before** processing starts — so `Server-Timing` cannot include the `backend`/`process`/`total` values. + +Options for Phase 2: +- **Move Server-Timing to a trailer** — `StreamingBody` supports trailers via `StreamingBodyExt::append_trailer()`. Requires client support (browsers generally ignore trailers). +- **Log-only instrumentation** — keep `RequestTimer` for server-side logging but don't include it in response headers on streaming paths. Non-streaming endpoints still get the header. +- **Keep both paths** — Phase 0 instrumentation continues working on the buffered path. Once streaming is validated and deployed, accept that Server-Timing headers are only available for non-streaming endpoints (static, auction, discovery). + +This is **not a blocker** for Phase 0 — the instrumentation is valuable right now on the current buffered architecture. Just be aware it will need adjustment when streaming lands. + +--- + +### Phase 1: Low-Risk Code Optimizations + +These are small, safe changes that reduce CPU and memory waste. 
Ship as one PR, measure before/after.

#### 1.1 Fix gzip streaming — remove full-body buffering

**File**: `crates/common/src/streaming_processor.rs` — `process_gzip_to_gzip`

**Problem**: Reads entire decompressed body into memory via `read_to_end`, despite deflate/brotli paths already using chunk-based `process_through_compression`.

**Fix**: 3 lines — use `process_through_compression` like deflate/brotli:

```rust
fn process_gzip_to_gzip<R: Read, W: Write>(&mut self, input: R, output: W) -> Result<...> {
    let decoder = GzDecoder::new(input);
    let encoder = GzEncoder::new(output, Compression::default());
    self.process_through_compression(decoder, encoder)
}
```

| Impact | LOC | Risk |
|--------|-----|------|
| **High** (most responses are gzip; reduces peak memory) | -15/+3 | Low |

#### 1.2 Fix `HtmlRewriterAdapter` — enable true streaming

**File**: `crates/common/src/streaming_processor.rs` — `HtmlRewriterAdapter`

**Problem**: Accumulates entire HTML document before processing, defeating the streaming pipeline. The comment says this is a `lol_html` limitation — **it's not**. `lol_html::HtmlRewriter` supports incremental `write()` calls and emits output via its `OutputSink` callback per-chunk.

**Fix**: Create the `HtmlRewriter` eagerly in `new()`, use `Rc<RefCell<Vec<u8>>>` via the public `lol_html::OutputSink` trait to share the output buffer:

```rust
struct RcVecSink(Rc<RefCell<Vec<u8>>>);

impl lol_html::OutputSink for RcVecSink {
    fn handle_chunk(&mut self, chunk: &[u8]) {
        self.0.borrow_mut().extend_from_slice(chunk);
    }
}

pub struct HtmlRewriterAdapter {
    rewriter: Option<lol_html::HtmlRewriter<'static, RcVecSink>>,
    output: Rc<RefCell<Vec<u8>>>,
}

impl StreamProcessor for HtmlRewriterAdapter {
    fn process_chunk(&mut self, chunk: &[u8], is_last: bool) -> Result<Vec<u8>, io::Error> {
        if let Some(rewriter) = &mut self.rewriter {
            if !chunk.is_empty() {
                rewriter
                    .write(chunk)
                    .map_err(|e| io::Error::new(io::ErrorKind::Other, e.to_string()))?;
            }
        }
        if is_last {
            if let Some(rewriter) = self.rewriter.take() {
                rewriter
                    .end()
                    .map_err(|e| io::Error::new(io::ErrorKind::Other, e.to_string()))?;
            }
        }
        // Drain whatever lol_html produced
        Ok(std::mem::take(&mut *self.output.borrow_mut()))
    }
}
```

| Impact | LOC | Risk |
|--------|-----|------|
| **High** (HTML is most common content type; eliminates 222KB+ buffer) | ~30 refactored | Medium — needs test coverage |

#### 1.3 Remove verbose per-request logging

**Files**: `crates/fastly/src/main.rs:37,64-67`

**Problem**: `log::info!("Settings {settings:?}")` serializes the entire Settings struct (~2KB) on every request. `FASTLY_SERVICE_VERSION` env var logged at info level.

**Fix**: Remove settings dump or gate behind `log::debug!`.
+ +| Impact | LOC | Risk | +|--------|-----|------| +| Medium-High | ~3 | None | + +#### 1.4 Trivial fixes batch + +| Fix | File | LOC | +|-----|------|-----| +| Const cookie prefix instead of `format!()` | `publisher.rs:207-210` | 2 | +| `mem::take` instead of `clone` for overlap buffer | `streaming_replacer.rs:63` | 1 | +| `eq_ignore_ascii_case` for compression detection | `streaming_processor.rs:47` | 5 | +| `Cow` for string replacements | `streaming_replacer.rs:120-125` | 5-10 | +| Remove base64 roundtrip in token computation | `http_util.rs:286-294` | 10-15 | +| Replace Handlebars with manual interpolation | `synthetic.rs:82-99` | ~20 | +| Cache `origin_host()` result per-request | `settings.rs` | 5-10 | + +--- + +### Phase 2: Streaming Response Architecture + +This is the high-impact architectural change. Uses Fastly's `stream_to_client()` API to send response headers and body chunks to the client as they're processed, instead of buffering everything. + +#### 2.1 Publisher proxy: `stream_to_client()` integration + +**Files**: `crates/common/src/publisher.rs`, `crates/fastly/src/main.rs` + +**Current flow** (fully buffered): +``` +req.send() → wait for full response → take_body() + → process_response_streaming() → collects into Vec + → Body::from(output) → return complete Response +``` + +**New flow** (streaming): +``` +req.send() → take_body() → set response headers + → stream_to_client() → returns StreamingBody (headers sent immediately) + → pipeline.process(body, &mut streaming_body) → chunks written to client as processed + → streaming_body.finish() +``` + +**Key enablers**: +- `StreamingPipeline.process()` already accepts `W: Write` — `StreamingBody` implements `Write` +- With Phase 1 fixes (gzip streaming + HTML rewriter streaming), the pipeline is already chunk-based +- Non-text responses can use `streaming_body.append(body)` for O(1) pass-through + +**Architecture change in `main.rs`**: The publisher proxy path calls `stream_to_client()` directly 
instead of returning a `Response`. Other endpoints (static, auction, discovery) continue returning `Response` as before. + +**Error handling for streaming**: Once `stream_to_client()` is called, response headers (including status 200) are already sent. If processing fails mid-stream: +- We cannot change the status code — the client already received 200 +- The `StreamingBody` will be aborted on drop (client sees incomplete response) +- We should log the error server-side for debugging +- This is the same trade-off every streaming proxy makes (nginx, Cloudflare Workers, etc.) + +To mitigate: validate backend response status and content-type **before** calling `stream_to_client()`. If the backend returns an error, fall back to the buffered path to return a proper error response. + +```rust +// Fetch from backend (blocks for full response including headers) +let mut backend_resp = req.send(&backend)?; + +// Check backend status BEFORE committing to streaming +if !backend_resp.get_status().is_success() || !should_process_content_type(&backend_resp) { + // Buffered path — can return proper error/pass-through response + return Ok(backend_resp); +} + +// Commit to streaming — headers sent to client NOW +let backend_body = backend_resp.take_body(); +let mut client_body = backend_resp.stream_to_client(); + +// Process chunks — errors logged but response is already in flight +match pipeline.process(backend_body, &mut client_body) { + Ok(()) => client_body.finish()?, + Err(e) => { + log::error!("Streaming processing failed: {:?}", e); + // StreamingBody dropped → client sees truncated response + // This is the best we can do after headers are sent + } +} +``` + +| Impact | LOC | Risk | +|--------|-----|------| +| **High** — reduces time-to-last-byte and peak memory for all proxied pages | ~80-120 | Medium — error handling requires careful design | + +#### 2.2 Concurrent origin fetch + auction (future) + +**Not applicable for golf.com** (no on-page auction), but for publishers 
with auction. + +The idea: use `req.send_async()` to launch the origin fetch concurrently with auction backend calls (which already use `fastly::http::request::select()` internally). When the origin response arrives, start streaming it to the client via `stream_to_client()`. When the lol_html rewriter reaches the ad injection point in the HTML, check if auction results are available. + +This would overlap origin fetch time with auction execution, so the browser starts receiving `` content (CSS, fonts) while the auction is still running. + +**Note**: This requires significant refactoring of the auction orchestrator and HTML processor to support async injection. The pseudo-code in the teammate's proposal (`origin_pending.poll()`, `run_auction_async`) represents the desired architecture but these APIs don't exist yet and would need to be built. + +| Impact | LOC | Risk | +|--------|-----|------| +| **Very High** for auction pages — browser starts loading ~400ms earlier | ~150-200 | High — complex coordination | + +--- + +### Phase 3: Measure and Validate + +After implementing Phases 1-2: + +1. Deploy to staging +2. Run `./scripts/benchmark.sh --profile` against staging +3. Compare Server-Timing data: `init`/`backend`/`process`/`total` before vs after +4. Compare external TTFB and time-to-last-byte +5. Check Fastly dashboard for memory/compute metrics +6. 
If improvement is marginal, don't ship the streaming architecture (Phase 2) + +**Success criteria**: +- Peak memory per request reduced by 30%+ (measurable via Fastly logs) +- Time-to-last-byte reduced for large HTML pages +- No regression on static endpoints or auction +- Code complexity is justified by measured improvement + +--- + +## Optimization Summary Table + +| # | Optimization | Impact | LOC | Risk | Phase | +|---|---|---|---|---|---| +| **P0** | Server-Timing instrumentation | Prerequisite | Done | None | 0 | +| **1.1** | Gzip streaming fix | **High** (memory) | -15/+3 | Low | 1 | +| **1.2** | HTML rewriter streaming | **High** (memory) | ~30 | Medium | 1 | +| **1.3** | Remove verbose logging | Medium-High | ~3 | None | 1 | +| **1.4** | Trivial fixes batch | Low-Medium | ~50 | None | 1 | +| **2.1** | `stream_to_client()` integration | **High** (TTLB) | ~80-120 | Medium | 2 | +| **2.2** | Concurrent origin + auction | **Very High** | ~150-200 | High | 2 (future) | + +--- + +## Architecture: Current vs Target + +### Current (fully buffered) + +``` +Client → Fastly Edge → [WASM starts] + → init (settings, orchestrator, registry) ~1ms + → req.send(backend) blocks for full response + → response.take_body() full body in memory + → GzDecoder.read_to_end() full decompressed in memory + → HtmlRewriterAdapter accumulates all input full HTML in memory + → lol_html processes entire document full output in memory + → GzEncoder.write_all() full recompressed in memory + → Body::from(output) Response constructed + → return Response NOW client gets first byte +``` + +**Memory**: compressed + decompressed + processed + recompressed = ~4x response size +**TTLB**: cannot send any bytes until all processing is complete + +### Target (streaming) + +``` +Client → Fastly Edge → [WASM starts] + → init (settings, orchestrator, registry) ~1ms + → req.send(backend) blocks for full response (same as current) + → response.take_body() body available as Read stream + → validate status, 
set response headers + → stream_to_client() headers sent to client NOW + → GzDecoder.read(8KB chunk) 8KB decompressed + → HtmlRewriter.write(chunk) output emitted via callback + → GzEncoder.write(processed) compressed chunk + → StreamingBody.write(chunk) chunk sent to client + → ... repeat for each chunk ... + → StreamingBody.finish() done +``` + +**Memory**: ~8KB chunk buffer + lol_html internal state (significantly less than 4x response size — exact savings need measurement) +**TTLB**: client receives first body bytes after first processed chunk, instead of waiting for all processing to complete. For a 222KB page, the savings is the entire processing time (decompression + rewriting + recompression). + +--- + +## Benchmarking Setup + +### Prerequisites + +```bash +brew install hey # HTTP load testing tool (auto-installed by benchmark.sh) +``` + +### Available Modes + +```bash +./scripts/benchmark.sh # Full benchmark suite +./scripts/benchmark.sh --quick # Quick smoke test +./scripts/benchmark.sh --ttfb # TTFB analysis only +./scripts/benchmark.sh --load-test # Load test only +./scripts/benchmark.sh --cold-start # Cold start analysis +./scripts/benchmark.sh --profile # Server-Timing phase breakdown +./scripts/benchmark.sh --save baseline # Save results to file +./scripts/benchmark.sh --compare baseline # Compare against saved results +``` + +### Profiling Against Staging + +```bash +# Requires Server-Timing branch deployed +BENCH_URL=https://example.edgecompute.app ./scripts/benchmark.sh --profile +``` + +### What the Benchmark Measures + +| Test | What it tells you | +|---|---| +| TTFB analysis | 20 sequential requests — detects cold start patterns | +| Cold start | First vs subsequent request latency | +| Endpoint latency | Per-endpoint timing breakdown (DNS, connect, TTFB, total) | +| Load test (hey) | Throughput (req/sec), latency distribution (P50/P95/P99) | +| Profile | Server-Timing phase breakdown: `init`/`backend`/`process`/`total` with min/avg/max/p95 | + 
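
The profile mode works on `Server-Timing` values in the format `RequestTimer` emits. A sketch of the parsing step in Rust (the script itself does this in shell; `parse_server_timing` is an illustrative name, not a project function):

```rust
/// Parse a Server-Timing header value (as emitted by `RequestTimer::header_value`)
/// into (metric name, duration-in-ms) pairs.
fn parse_server_timing(header: &str) -> Vec<(String, f64)> {
    header
        .split(',')
        .filter_map(|entry| {
            let (name, rest) = entry.trim().split_once(';')?;
            let dur = rest.strip_prefix("dur=")?;
            Some((name.to_string(), dur.parse().ok()?))
        })
        .collect()
}

fn main() {
    let header = "init;dur=1.2, backend;dur=385.4, process;dur=12.3, total;dur=401.5";
    for (name, ms) in parse_server_timing(header) {
        println!("{name:>8}: {ms:.1} ms");
    }
}
```

Aggregating these pairs across N requests gives the min/avg/max/p95 breakdown the profile report prints.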
+### What the Benchmark Does NOT Measure + +- Real Fastly edge performance (Viceroy is a simulator) +- WASM cold start on actual Fastly infrastructure +- Production TLS handshake overhead +- Memory usage (use Fastly dashboard or Viceroy logs) + +--- + +## Notes for Team + +### What's already on `feat/optimize-ts` branch (uncommitted) + +| File | Change | +|------|--------| +| `crates/common/src/request_timer.rs` | **New** — `RequestTimer` with `Server-Timing` header output | +| `crates/common/src/lib.rs` | Added `pub mod request_timer;` | +| `crates/fastly/src/main.rs` | Wired timer: created at top, `mark_init()`, passed to handlers, `Server-Timing` header set | +| `crates/common/src/publisher.rs` | Added `mark_backend()` after `req.send()`, `mark_process()` after body processing | +| `scripts/benchmark.sh` | Added `--profile` mode, auto-install `hey` | +| `OPTIMIZATION.md` | This document | + +### Teammate's `streaming_processor.rs` Changes + +A teammate has prepared changes to `streaming_processor.rs` that address items 1.1 and 1.2: + +- **Gzip fix**: `process_gzip_to_gzip` now uses `process_through_compression` (3-line change) +- **HTML rewriter fix**: `HtmlRewriterAdapter` rewritten to use `lol_html::OutputSink` trait with `Rc>>` for incremental streaming + +**Review notes on the HTML rewriter change**: +- `lol_html::OutputSink` is a public trait (verified in lol_html 2.7.1) +- The `Rc` pattern is necessary because `HtmlRewriter::new()` takes ownership of the sink, but we need to read output in `process_chunk()` +- `Option` with `.take()` is correct — `end()` consumes self +- The adapter is no longer reusable after `end()` — one per document, which matches actual usage +- Tests correctly updated to collect output across all chunks + +**Correctness issue — must fix in same PR**: `process_through_compression` uses `drop(encoder)` for finalization. For `GzEncoder`, `Drop` calls `finish()` internally but **silently ignores errors**. 
The gzip trailer contains a CRC32 checksum — if `finish()` fails, corrupted gzip responses are served to clients without any error being reported. This is a pre-existing issue (deflate/brotli have the same `drop()` pattern) but it **must be fixed** when gzip moves to this code path, since gzip is the most common encoding. + +Fix: change `process_through_compression` to accept an optional finalization closure, or add a separate `process_gzip_to_gzip` that calls `encoder.finish()` explicitly after `process_through_compression`-style chunk loop. + +### Decisions Needed + +1. **Deploy `feat/optimize-ts` to staging?** — Needed to get real Server-Timing data before proceeding with optimizations +2. **`#[fastly::main]` + `stream_to_client()` spike** — The macro calls `send_to_client()` on the returned Response, which will panic if streaming was already started. We need a minimal prototype to validate the approach before any Phase 2 work. See "Compatibility with `#[fastly::main]`" section above. +3. **Phase 1 vs Phase 2 priority** — Phase 1 (code fixes) is low risk and can ship independently. Phase 2 (streaming architecture) is higher impact but higher risk, and blocked on decision #2. +4. **Server-Timing on streaming paths** — `stream_to_client()` sends headers before processing completes, so `Server-Timing` can't include `backend`/`process` phases. Options: trailers, log-only, or accept the limitation. See Phase 0 section. +5. **Concurrent auction + origin (2.2)** — Not applicable for golf.com. Defer to a separate ticket? +6. **GzEncoder `finish()` correctness** — Fix the `drop(encoder)` error swallowing in `process_through_compression`, or accept the risk? 
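
On decision 6, the error-swallowing behavior is easy to demonstrate with plain `std::io` types, no flate2 required. A sketch where the hypothetical `FailingSink` stands in for a writer whose trailer write fails at finalization:

```rust
use std::io::{self, Write};

// Stand-in for a sink whose finalization write (e.g. a gzip CRC32 trailer) fails.
struct FailingSink;

impl Write for FailingSink {
    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
        Ok(buf.len()) // data writes appear to succeed
    }
    fn flush(&mut self) -> io::Result<()> {
        Err(io::Error::new(io::ErrorKind::Other, "trailer write failed"))
    }
}

// Minimal encoder-like wrapper with the same two finalization paths flate2 offers.
struct Encoder<W: Write> {
    inner: W,
}

impl<W: Write> Encoder<W> {
    /// Explicit finalization: the caller observes the error.
    fn finish(mut self) -> io::Result<()> {
        self.inner.flush()
    }
}

impl<W: Write> Drop for Encoder<W> {
    fn drop(&mut self) {
        // Mirrors the `drop(encoder)` pattern: the error is silently discarded.
        let _ = self.inner.flush();
    }
}

fn main() {
    // Path 1: drop() — the failure is invisible to the caller.
    drop(Encoder { inner: FailingSink });

    // Path 2: finish() — the failure surfaces as an Err.
    let result = Encoder { inner: FailingSink }.finish();
    assert!(result.is_err());
    println!("finish() surfaced: {}", result.unwrap_err());
}
```

Only the explicit `finish()` path lets the caller log or otherwise surface the failure; the `drop` path runs to completion as if nothing went wrong.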
diff --git a/crates/common/src/lib.rs b/crates/common/src/lib.rs index a01865f6..c43ed8a3 100644 --- a/crates/common/src/lib.rs +++ b/crates/common/src/lib.rs @@ -51,6 +51,7 @@ pub mod openrtb; pub mod proxy; pub mod publisher; pub mod request_signing; +pub mod request_timer; pub mod rsc_flight; pub mod settings; pub mod settings_data; diff --git a/crates/common/src/publisher.rs b/crates/common/src/publisher.rs index fb160f3d..c6b465d5 100644 --- a/crates/common/src/publisher.rs +++ b/crates/common/src/publisher.rs @@ -6,6 +6,7 @@ use crate::backend::BackendConfig; use crate::http_util::{serve_static_with_etag, RequestInfo}; use crate::constants::{COOKIE_SYNTHETIC_ID, HEADER_X_COMPRESS_HINT, HEADER_X_SYNTHETIC_ID}; +use crate::request_timer::RequestTimer; use crate::cookies::create_synthetic_cookie; use crate::error::TrustedServerError; use crate::integrations::IntegrationRegistry; @@ -176,6 +177,7 @@ pub fn handle_publisher_request( settings: &Settings, integration_registry: &IntegrationRegistry, mut req: Request, + timer: &mut RequestTimer, ) -> Result> { log::debug!("Proxying request to publisher_origin"); @@ -235,6 +237,8 @@ pub fn handle_publisher_request( message: "Failed to proxy request to origin".to_string(), })?; + timer.mark_backend(); + // Log all response headers for debugging log::debug!("Response headers:"); for (name, value) in response.get_headers() { @@ -310,6 +314,8 @@ pub fn handle_publisher_request( ); } + timer.mark_process(); + response.set_header(HEADER_X_SYNTHETIC_ID, synthetic_id.as_str()); if !has_synthetic_cookie { response.set_header( diff --git a/crates/common/src/request_timer.rs b/crates/common/src/request_timer.rs new file mode 100644 index 00000000..ca3d07a3 --- /dev/null +++ b/crates/common/src/request_timer.rs @@ -0,0 +1,151 @@ +//! Lightweight per-request timer for profiling the Fastly Compute request lifecycle. +//! +//! Records phase durations using [`std::time::Instant`] and emits them as a +//! 
[`Server-Timing`](https://developer.mozilla.org/en-US/docs/Web/HTTP/Reference/Headers/Server-Timing)
//! header value so that timings are visible in browser `DevTools` (Network → Timing tab).

use std::time::Instant;

/// Records wall-clock durations for each phase of a request.
///
/// Usage:
/// ```ignore
/// let mut timer = RequestTimer::new(); // captures t0
/// // ... init work ...
/// timer.mark_init(); // captures init duration
/// // ... backend fetch ...
/// timer.mark_backend(); // captures backend duration
/// // ... body processing ...
/// timer.mark_process(); // captures process duration
/// response.set_header("Server-Timing", timer.header_value());
/// ```
pub struct RequestTimer {
    start: Instant,
    init_ms: Option<f64>,
    backend_ms: Option<f64>,
    process_ms: Option<f64>,
    last_mark: Instant,
}

impl RequestTimer {
    /// Start a new timer. Call this as early as possible in `main()`.
    #[must_use]
    pub fn new() -> Self {
        let now = Instant::now();
        Self {
            start: now,
            init_ms: None,
            backend_ms: None,
            process_ms: None,
            last_mark: now,
        }
    }

    /// Mark the end of the initialization phase (settings, orchestrator, registry).
    pub fn mark_init(&mut self) {
        let now = Instant::now();
        self.init_ms = Some(duration_ms(self.last_mark, now));
        self.last_mark = now;
    }

    /// Mark the end of the backend fetch phase.
    pub fn mark_backend(&mut self) {
        let now = Instant::now();
        self.backend_ms = Some(duration_ms(self.last_mark, now));
        self.last_mark = now;
    }

    /// Mark the end of body processing (decompress, rewrite, recompress).
    pub fn mark_process(&mut self) {
        let now = Instant::now();
        self.process_ms = Some(duration_ms(self.last_mark, now));
        self.last_mark = now;
    }

    /// Total elapsed time since the timer was created.
    #[must_use]
    pub fn total_ms(&self) -> f64 {
        duration_ms(self.start, Instant::now())
    }

    /// Format as a `Server-Timing` header value.
+ /// + /// Example output: + /// `init;dur=1.2, backend;dur=385.4, process;dur=12.3, total;dur=401.5` + #[must_use] + pub fn header_value(&self) -> String { + let mut parts = Vec::with_capacity(4); + + if let Some(ms) = self.init_ms { + parts.push(format!("init;dur={ms:.1}")); + } + if let Some(ms) = self.backend_ms { + parts.push(format!("backend;dur={ms:.1}")); + } + if let Some(ms) = self.process_ms { + parts.push(format!("process;dur={ms:.1}")); + } + + parts.push(format!("total;dur={:.1}", self.total_ms())); + parts.join(", ") + } + + /// Format a single-line log string for Fastly logs. + #[must_use] + pub fn log_line(&self) -> String { + format!( + "RequestTimer: init={:.1}ms backend={:.1}ms process={:.1}ms total={:.1}ms", + self.init_ms.unwrap_or(0.0), + self.backend_ms.unwrap_or(0.0), + self.process_ms.unwrap_or(0.0), + self.total_ms(), + ) + } +} + +impl Default for RequestTimer { + fn default() -> Self { + Self::new() + } +} + +fn duration_ms(from: Instant, to: Instant) -> f64 { + to.duration_since(from).as_secs_f64() * 1000.0 +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn header_value_includes_all_phases() { + let mut timer = RequestTimer::new(); + timer.mark_init(); + timer.mark_backend(); + timer.mark_process(); + + let header = timer.header_value(); + assert!(header.contains("init;dur="), "missing init phase"); + assert!(header.contains("backend;dur="), "missing backend phase"); + assert!(header.contains("process;dur="), "missing process phase"); + assert!(header.contains("total;dur="), "missing total phase"); + } + + #[test] + fn header_value_omits_unmarked_phases() { + let timer = RequestTimer::new(); + let header = timer.header_value(); + assert!(!header.contains("init;dur=")); + assert!(!header.contains("backend;dur=")); + assert!(header.contains("total;dur=")); + } + + #[test] + fn log_line_uses_zero_for_unmarked() { + let timer = RequestTimer::new(); + let log = timer.log_line(); + assert!(log.contains("init=0.0ms")); + 
assert!(log.contains("backend=0.0ms")); + assert!(log.contains("process=0.0ms")); + } +} diff --git a/crates/fastly/src/main.rs b/crates/fastly/src/main.rs index 0112bd99..a060c400 100644 --- a/crates/fastly/src/main.rs +++ b/crates/fastly/src/main.rs @@ -17,6 +17,7 @@ use trusted_server_common::request_signing::{ handle_deactivate_key, handle_rotate_key, handle_trusted_server_discovery, handle_verify_signature, }; +use trusted_server_common::request_timer::RequestTimer; use trusted_server_common::settings::Settings; use trusted_server_common::settings_data::get_settings; @@ -25,6 +26,8 @@ use crate::error::to_error_response; #[fastly::main] fn main(req: Request) -> Result { + let mut timer = RequestTimer::new(); + init_logger(); let settings = match get_settings() { @@ -47,11 +50,14 @@ fn main(req: Request) -> Result { } }; + timer.mark_init(); + futures::executor::block_on(route_request( &settings, &orchestrator, &integration_registry, req, + &mut timer, )) } @@ -60,6 +66,7 @@ async fn route_request( orchestrator: &AuctionOrchestrator, integration_registry: &IntegrationRegistry, req: Request, + timer: &mut RequestTimer, ) -> Result { log::info!( "FASTLY_SERVICE_VERSION: {}", @@ -119,7 +126,7 @@ async fn route_request( path ); - match handle_publisher_request(settings, integration_registry, req) { + match handle_publisher_request(settings, integration_registry, req, timer) { Ok(response) => Ok(response), Err(e) => { log::error!("Failed to proxy to publisher origin: {:?}", e); @@ -136,6 +143,9 @@ async fn route_request( response.set_header(key, value); } + log::info!("{}", timer.log_line()); + response.set_header("Server-Timing", timer.header_value()); + Ok(response) } diff --git a/scripts/benchmark.sh b/scripts/benchmark.sh new file mode 100755 index 00000000..8428f36c --- /dev/null +++ b/scripts/benchmark.sh @@ -0,0 +1,516 @@ +#!/usr/bin/env bash +# +# Trusted Server Performance Benchmark +# +# Measures request latency against a running Viceroy instance. 
+# Run this on main, save the output, then run on your branch and compare. +# +# Prerequisites: +# - Viceroy running: fastly compute serve +# - hey installed: brew install hey +# +# Usage: +# ./scripts/benchmark.sh # Run all benchmarks +# ./scripts/benchmark.sh --cold-start # Cold start analysis only +# ./scripts/benchmark.sh --load-test # Load test only +# ./scripts/benchmark.sh --quick # Quick smoke test (fewer requests) +# ./scripts/benchmark.sh --profile # Server-Timing phase breakdown (init/backend/process) +# ./scripts/benchmark.sh --save baseline # Save results to file +# ./scripts/benchmark.sh --compare baseline # Compare against saved results +# +# What this measures: +# - Cold start: first request latency after server restart +# - Warm latency: subsequent request timing breakdown (DNS, connect, TTFB, transfer, total) +# - Throughput: requests/sec under concurrent load +# - Latency distribution: p50, p95, p99 under load +# +# What this does NOT measure: +# - Real Fastly edge performance (Viceroy is a simulator) +# - Network latency to real backends +# - Production TLS handshake overhead +# - WASM cold start on actual Fastly infrastructure +# +# The value is in RELATIVE comparison between branches, not absolute numbers. + +set -euo pipefail + +# --- Configuration --- +BASE_URL="${BENCH_URL:-http://127.0.0.1:7676}" +RESULTS_DIR="$(cd "$(dirname "$0")/.." 
&& pwd)/benchmark-results" +CURL_FORMAT=' +{ + "dns_ms": %{time_namelookup}, + "connect_ms": %{time_connect}, + "tls_ms": %{time_appconnect}, + "ttfb_ms": %{time_starttransfer}, + "total_ms": %{time_total}, + "size_bytes": %{size_download}, + "http_code": %{http_code} +}' + +# Colors (disabled if not a terminal) +if [ -t 1 ]; then + BOLD='\033[1m' + GREEN='\033[0;32m' + YELLOW='\033[0;33m' + RED='\033[0;31m' + CYAN='\033[0;36m' + RESET='\033[0m' +else + BOLD='' GREEN='' YELLOW='' RED='' CYAN='' RESET='' +fi + +# --- Helpers --- + +log_header() { + echo "" + echo -e "${BOLD}${CYAN}=== $1 ===${RESET}" + echo "" +} + +log_info() { + echo -e "${GREEN}[INFO]${RESET} $1" +} + +log_warn() { + echo -e "${YELLOW}[WARN]${RESET} $1" +} + +log_error() { + echo -e "${RED}[ERROR]${RESET} $1" +} + +check_server() { + if ! curl -s -o /dev/null -w "%{http_code}" "$BASE_URL/" --max-time 2 > /dev/null 2>&1; then + log_error "Server not responding at $BASE_URL" + log_error "Start it first: fastly compute serve" + exit 1 + fi + log_info "Server responding at $BASE_URL" +} + +check_hey() { + if ! command -v hey &> /dev/null; then + log_warn "'hey' not installed. Attempting to install via brew..." + if command -v brew &> /dev/null; then + brew install hey + if ! command -v hey &> /dev/null; then + log_error "Failed to install 'hey'. Load tests will be skipped." + return 1 + fi + log_info "'hey' installed successfully." + else + log_error "'brew' not found. Install hey manually: https://github.com/rakyll/hey" + log_error "Load tests will be skipped." 
+ return 1 + fi + fi + return 0 +} + +# Timed curl request — prints JSON timing breakdown +timed_curl() { + local method="$1" + local url="$2" + local label="$3" + shift 3 + local extra_args=("$@") + + local result + result=$(curl -s -o /dev/null -w "$CURL_FORMAT" \ + -X "$method" \ + ${extra_args[@]+"${extra_args[@]}"} \ + "$url" \ + --max-time 30 2>/dev/null) + + local total + total=$(echo "$result" | grep total_ms | tr -d '", ' | cut -d: -f2) + local ttfb + ttfb=$(echo "$result" | grep ttfb_ms | tr -d '", ' | cut -d: -f2) + local code + code=$(echo "$result" | grep http_code | tr -d '", ' | cut -d: -f2) + local size + size=$(echo "$result" | grep size_bytes | tr -d '", ' | cut -d: -f2) + + # Convert seconds to ms for display + local total_ms ttfb_ms + total_ms=$(echo "$total * 1000" | bc 2>/dev/null || echo "$total") + ttfb_ms=$(echo "$ttfb * 1000" | bc 2>/dev/null || echo "$ttfb") + + printf " %-40s HTTP %s TTFB: %8.2f ms Total: %8.2f ms Size: %s bytes\n" \ + "$label" "$code" "$ttfb_ms" "$total_ms" "$size" + + echo "$result" +} + +# --- Test Data --- + +AUCTION_PAYLOAD='{ + "adUnits": [ + { + "code": "header-banner", + "mediaTypes": { + "banner": { + "sizes": [[728, 90], [970, 250]] + } + } + }, + { + "code": "sidebar", + "mediaTypes": { + "banner": { + "sizes": [[300, 250], [300, 600]] + } + } + } + ] +}' + +# --- Benchmark Suites --- + +run_cold_start() { + log_header "COLD START ANALYSIS" + log_info "Measuring first-request latency (simulated via sequential requests)" + log_info "In production, cold start includes WASM instantiation which Viceroy may not reflect." 
+ echo "" + + echo -e "${BOLD}First request (potential cold path):${RESET}" + timed_curl GET "$BASE_URL/" "GET / (first)" > /dev/null + + echo "" + echo -e "${BOLD}Subsequent requests (warm path):${RESET}" + for i in 1 2 3 4 5; do + timed_curl GET "$BASE_URL/" "GET / (warm #$i)" > /dev/null + done +} + +run_endpoint_latency() { + log_header "ENDPOINT LATENCY (WARM)" + log_info "Per-endpoint timing breakdown (5 requests each, reporting median-ish)" + echo "" + + local endpoints=( + "GET|/|Publisher proxy (fallback)" + "GET|/static/tsjs=tsjs-unified.min.js|Static JS bundle" + "GET|/.well-known/trusted-server.json|Discovery endpoint" + ) + + for entry in "${endpoints[@]}"; do + IFS='|' read -r method path label <<< "$entry" + echo -e "${BOLD}$label${RESET} ($method $path)" + + for i in $(seq 1 5); do + timed_curl "$method" "${BASE_URL}${path}" " request #$i" > /dev/null + done + echo "" + done + + # Auction endpoint (POST with body) + echo -e "${BOLD}Auction endpoint${RESET} (POST /auction)" + for i in $(seq 1 5); do + timed_curl POST "${BASE_URL}/auction" " request #$i" \ + -H "Content-Type: application/json" \ + -d "$AUCTION_PAYLOAD" > /dev/null + done + echo "" +} + +run_load_test() { + if ! 
check_hey; then + return + fi + + log_header "LOAD TEST" + log_info "Concurrent request throughput and latency distribution" + echo "" + + local total_requests="${1:-200}" + local concurrency="${2:-10}" + + echo -e "${BOLD}GET / (publisher proxy) - ${total_requests} requests, ${concurrency} concurrent${RESET}" + echo "" + hey -n "$total_requests" -c "$concurrency" -t 30 "$BASE_URL/" 2>&1 | \ + grep -E "(Requests/sec|Total:|Slowest:|Fastest:|Average:|requests done)|Status code|Latency distribution" -A 20 + echo "" + + echo -e "${BOLD}GET /static/tsjs=tsjs-unified.min.js (static) - ${total_requests} requests, ${concurrency} concurrent${RESET}" + echo "" + hey -n "$total_requests" -c "$concurrency" -t 30 "$BASE_URL/static/tsjs=tsjs-unified.min.js" 2>&1 | \ + grep -E "(Requests/sec|Total:|Slowest:|Fastest:|Average:|requests done)|Status code|Latency distribution" -A 20 + echo "" + + echo -e "${BOLD}POST /auction - ${total_requests} requests, ${concurrency} concurrent${RESET}" + echo "" + hey -n "$total_requests" -c "$concurrency" -t 30 \ + -m POST \ + -H "Content-Type: application/json" \ + -d "$AUCTION_PAYLOAD" \ + "$BASE_URL/auction" 2>&1 | \ + grep -E "(Requests/sec|Total:|Slowest:|Fastest:|Average:|requests done)|Status code|Latency distribution" -A 20 + echo "" +} + +run_first_byte_analysis() { + log_header "TIME TO FIRST BYTE (TTFB) ANALYSIS" + log_info "Measures TTFB across 20 sequential requests to detect patterns" + log_info "Look for: first request significantly slower than rest = cold start" + echo "" + + echo -e "${BOLD}Sequential TTFB for GET / :${RESET}" + echo "" + printf " %-8s %-12s %-12s\n" "Request" "TTFB (ms)" "Total (ms)" + printf " %-8s %-12s %-12s\n" "-------" "---------" "----------" + + for i in $(seq 1 20); do + local result + result=$(curl -s -o /dev/null -w "%{time_starttransfer} %{time_total}" \ + "$BASE_URL/" --max-time 30 2>/dev/null) + local ttfb total + ttfb=$(echo "$result" | awk '{printf "%.2f", $1 * 1000}') + total=$(echo "$result" | 
awk '{printf "%.2f", $2 * 1000}')
+        printf "  %-8s %-12s %-12s\n" "#$i" "${ttfb}" "${total}"
+    done
+    echo ""
+}
+
+# --- Server-Timing Profiler ---
+
+# Parse "init;dur=1.2, backend;dur=385.4, process;dur=12.3, total;dur=401.5"
+# into associative-style variables: st_init=1.2, st_backend=385.4, etc.
+parse_server_timing() {
+    local header="$1"
+    st_init="" st_backend="" st_process="" st_total=""
+    for part in $(echo "$header" | tr ',' '\n'); do
+        local name dur
+        name=$(echo "$part" | sed 's/;.*//' | tr -d ' ')
+        dur=$(echo "$part" | grep -o 'dur=[0-9.]*' | cut -d= -f2 || true)
+        case "$name" in
+            init) st_init="$dur" ;;
+            backend) st_backend="$dur" ;;
+            process) st_process="$dur" ;;
+            total) st_total="$dur" ;;
+        esac
+    done
+}
+
+# Collect Server-Timing data over N requests and print stats
+# Also captures external TTFB and total (TTLB) for streaming comparison
+profile_endpoint() {
+    local method="$1"
+    local url="$2"
+    local label="$3"
+    local iterations="${4:-20}"
+    shift 4
+    local extra_args=("$@")
+
+    local init_vals=() backend_vals=() process_vals=() total_vals=()
+    local ttfb_vals=() ttlb_vals=()
+
+    for i in $(seq 1 "$iterations"); do
+        # Capture both Server-Timing header and curl timing in one request
+        local raw
+        raw=$(curl -s -D- -o /dev/null \
+            -w '\n__CURL_TIMING__ %{time_starttransfer} %{time_total}' \
+            -X "$method" \
+            ${extra_args[@]+"${extra_args[@]}"} \
+            "$url" \
+            --max-time 30 2>/dev/null || true)
+
+        # Extract Server-Timing header; the `|| true` matters because under
+        # `set -euo pipefail` a missing header would make grep fail the
+        # pipeline and abort the script before the -z check below ever runs
+        local header
+        header=$(echo "$raw" | grep -i '^server-timing:' | sed 's/[Ss]erver-[Tt]iming: *//' || true)
+
+        # Extract curl timing (TTFB and total in seconds)
+        local curl_timing
+        curl_timing=$(echo "$raw" | grep '__CURL_TIMING__' | sed 's/__CURL_TIMING__ //' || true)
+        if [ -n "$curl_timing" ]; then
+            local ext_ttfb ext_total
+            ext_ttfb=$(echo "$curl_timing" | awk '{printf "%.1f", $1 * 1000}')
+            ext_total=$(echo "$curl_timing" | awk '{printf "%.1f", $2 * 1000}')
+            ttfb_vals+=("$ext_ttfb")
+            ttlb_vals+=("$ext_total")
+        fi
+
+        if [ -z
"$header" ]; then + continue + fi + + parse_server_timing "$header" + [ -n "$st_init" ] && init_vals+=("$st_init") + [ -n "$st_backend" ] && backend_vals+=("$st_backend") + [ -n "$st_process" ] && process_vals+=("$st_process") + [ -n "$st_total" ] && total_vals+=("$st_total") + done + + echo -e " ${BOLD}$label${RESET} ($method, $iterations iterations)" + echo "" + printf " %-12s %8s %8s %8s %8s\n" "Phase" "Min" "Avg" "Max" "P95" + printf " %-12s %8s %8s %8s %8s\n" "----------" "------" "------" "------" "------" + print_stats "init" "${init_vals[@]}" + print_stats "backend" "${backend_vals[@]}" + print_stats "process" "${process_vals[@]}" + print_stats "total" "${total_vals[@]}" + echo "" + echo -e " ${BOLD}External timing (curl):${RESET}" + printf " %-12s %8s %8s %8s %8s\n" "Metric" "Min" "Avg" "Max" "P95" + printf " %-12s %8s %8s %8s %8s\n" "----------" "------" "------" "------" "------" + print_stats "TTFB" "${ttfb_vals[@]}" + print_stats "TTLB" "${ttlb_vals[@]}" + echo "" +} + +# Compute min/avg/max/p95 from a list of floats +print_stats() { + local name="$1" + shift + local vals=("$@") + local count=${#vals[@]} + + if [ "$count" -eq 0 ]; then + printf " %-12s %8s %8s %8s %8s\n" "$name" "-" "-" "-" "-" + return + fi + + # Sort values + local sorted + sorted=$(printf '%s\n' "${vals[@]}" | sort -g) + + local min avg max p95 + min=$(echo "$sorted" | head -1) + max=$(echo "$sorted" | tail -1) + + local sum + sum=$(printf '%s\n' "${vals[@]}" | awk '{s+=$1} END {printf "%.1f", s}') + avg=$(echo "$sum $count" | awk '{printf "%.1f", $1/$2}') + + local p95_idx + p95_idx=$(echo "$count" | awk '{printf "%d", int($1 * 0.95 + 0.5)}') + [ "$p95_idx" -lt 1 ] && p95_idx=1 + p95=$(echo "$sorted" | sed -n "${p95_idx}p") + + printf " %-12s %7.1f %7.1f %7.1f %7.1f\n" "$name" "$min" "$avg" "$max" "$p95" +} + +run_profile() { + local iterations="${1:-20}" + + log_header "SERVER-TIMING PROFILE" + log_info "Collecting Server-Timing header data over $iterations requests per endpoint" 
+ log_info "Phases: init (setup) → backend (origin fetch) → process (body rewrite) → total" + echo "" + + profile_endpoint GET "$BASE_URL/static/tsjs=tsjs-unified.min.js" \ + "Static JS bundle" "$iterations" + + profile_endpoint GET "$BASE_URL/.well-known/trusted-server.json" \ + "Discovery endpoint" "$iterations" + + profile_endpoint GET "$BASE_URL/" \ + "Publisher proxy (fallback)" "$iterations" + + profile_endpoint POST "$BASE_URL/auction" \ + "Auction endpoint" "$iterations" \ + -H "Content-Type: application/json" \ + -d "$AUCTION_PAYLOAD" +} + +save_results() { + local name="$1" + mkdir -p "$RESULTS_DIR" + local outfile="$RESULTS_DIR/${name}.txt" + + log_info "Saving results to $outfile" + + { + echo "# Benchmark Results: $name" + echo "# Date: $(date -u '+%Y-%m-%d %H:%M:%S UTC')" + echo "# Git: $(git -C "$(dirname "$0")/.." rev-parse --short HEAD 2>/dev/null || echo 'unknown')" + echo "# Branch: $(git -C "$(dirname "$0")/.." branch --show-current 2>/dev/null || echo 'unknown')" + echo "" + run_all 2>&1 + } > "$outfile" + + log_info "Results saved. Compare later with: diff $RESULTS_DIR/baseline.txt $RESULTS_DIR/branch.txt" +} + +compare_results() { + local name="$1" + local baseline="$RESULTS_DIR/${name}.txt" + + if [ ! -f "$baseline" ]; then + log_error "No saved results found at $baseline" + log_error "Run with --save $name first" + exit 1 + fi + + local current + current=$(mktemp) + run_all 2>&1 > "$current" + + log_header "COMPARISON: current vs $name" + diff --color=auto -u "$baseline" "$current" || true + rm -f "$current" +} + +run_all() { + echo -e "${BOLD}Trusted Server Performance Benchmark${RESET}" + echo "Date: $(date -u '+%Y-%m-%d %H:%M:%S UTC')" + echo "Git: $(git -C "$(dirname "$0")/.." rev-parse --short HEAD 2>/dev/null || echo 'unknown')" + echo "Branch: $(git -C "$(dirname "$0")/.." 
branch --show-current 2>/dev/null || echo 'unknown')"
+    echo "Server: $BASE_URL"
+
+    run_cold_start
+    run_first_byte_analysis
+    run_endpoint_latency
+    run_load_test 200 10
+}
+
+run_quick() {
+    echo -e "${BOLD}Trusted Server Performance Benchmark (Quick)${RESET}"
+    echo "Date: $(date -u '+%Y-%m-%d %H:%M:%S UTC')"
+    echo "Git: $(git -C "$(dirname "$0")/.." rev-parse --short HEAD 2>/dev/null || echo 'unknown')"
+    echo "Server: $BASE_URL"
+
+    run_first_byte_analysis
+    run_load_test 50 5
+}
+
+# --- Main ---
+
+main() {
+    local mode="${1:-all}"
+
+    check_server
+
+    case "$mode" in
+        --cold-start)
+            run_cold_start
+            ;;
+        --load-test)
+            run_load_test "${2:-200}" "${3:-10}"
+            ;;
+        --quick)
+            run_quick
+            ;;
+        --ttfb)
+            run_first_byte_analysis
+            ;;
+        --profile)
+            run_profile "${2:-20}"
+            ;;
+        --save)
+            save_results "${2:?Usage: --save <name>}"
+            ;;
+        --compare)
+            compare_results "${2:?Usage: --compare <name>}"
+            ;;
+        --help|-h)
+            # head -40 covers the full usage header; `sed -E` for BSD/macOS
+            # compatibility (BSD sed has no \? in basic regex)
+            head -40 "$0" | grep '^#' | sed -E 's/^# ?//'
+            ;;
+        *)
+            run_all
+            ;;
+    esac
+}
+
+main "$@"

From ad993f554c141177deb80f0788f09e8f26b757b3 Mon Sep 17 00:00:00 2001
From: prk-Jr
Date: Wed, 18 Feb 2026 21:33:39 +0530
Subject: [PATCH 02/13] Add Server-Timing instrumentation and optimization plan

Introduce RequestTimer for per-request phase tracking (init, backend,
process, total) exposed via Server-Timing response headers. Add benchmark
tooling with --profile mode for collecting timing data. Document phased
optimization plan covering streaming architecture, code-level fixes, and
open design questions for team review.
--- crates/common/src/publisher.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/crates/common/src/publisher.rs b/crates/common/src/publisher.rs index c6b465d5..0aa2d648 100644 --- a/crates/common/src/publisher.rs +++ b/crates/common/src/publisher.rs @@ -6,10 +6,10 @@ use crate::backend::BackendConfig; use crate::http_util::{serve_static_with_etag, RequestInfo}; use crate::constants::{COOKIE_SYNTHETIC_ID, HEADER_X_COMPRESS_HINT, HEADER_X_SYNTHETIC_ID}; -use crate::request_timer::RequestTimer; use crate::cookies::create_synthetic_cookie; use crate::error::TrustedServerError; use crate::integrations::IntegrationRegistry; +use crate::request_timer::RequestTimer; use crate::rsc_flight::RscFlightUrlRewriter; use crate::settings::Settings; use crate::streaming_processor::{Compression, PipelineConfig, StreamProcessor, StreamingPipeline}; From 4d904690dca99ce201467a4669c4a4748e65ae9e Mon Sep 17 00:00:00 2001 From: prk-Jr Date: Wed, 18 Feb 2026 21:59:14 +0530 Subject: [PATCH 03/13] Downgrade Settings debug dump to log::debug and tighten max_level to Info --- OPTIMIZATION.md | 17 +++++++++++++---- 1 file changed, 13 insertions(+), 4 deletions(-) diff --git a/OPTIMIZATION.md b/OPTIMIZATION.md index 817696d7..72a5494f 100644 --- a/OPTIMIZATION.md +++ b/OPTIMIZATION.md @@ -196,13 +196,22 @@ impl StreamProcessor for HtmlRewriterAdapter { |--------|-----|------| | **High** (HTML is most common content type; eliminates 222KB+ buffer) | ~30 refactored | Medium — needs test coverage | -#### 1.3 Remove verbose per-request logging +#### 1.3 Reduce verbose per-request logging -**Files**: `crates/fastly/src/main.rs:37,64-67` +**Files**: `crates/fastly/src/main.rs:37,64-67,152-177` -**Problem**: `log::info!("Settings {settings:?}")` serializes the entire Settings struct (~2KB) on every request. `FASTLY_SERVICE_VERSION` env var logged at info level. +**Problem**: `log::info!("Settings {settings:?}")` serializes the entire Settings struct (~2KB) on every request. 
`FASTLY_SERVICE_VERSION` env var logged at info level. The logger is configured with `max_level(LevelFilter::Debug)`, meaning every `debug!` and above is evaluated. -**Fix**: Remove settings dump or gate behind `log::debug!`. +**Fix**: Downgrade the Settings dump to `log::debug!` and tighten the logger's `max_level` to `LevelFilter::Info` for production. The `log_fastly` crate supports `filter_module()` for per-module levels if we still want debug output from specific modules. When the level is filtered, `log` macros short-circuit before evaluating arguments — so the `Settings` `Debug` format is never even computed. + +```rust +// Before: everything at Debug and above is serialized +.max_level(log::LevelFilter::Debug) + +// After: Info in production, debug only for specific modules if needed +.max_level(log::LevelFilter::Info) +// Optional: .filter_module("trusted_server", log::LevelFilter::Debug) +``` | Impact | LOC | Risk | |--------|-----|------| From 01d77e4b95caab5c868b6f7cf82d10348241e9e5 Mon Sep 17 00:00:00 2001 From: prk-Jr Date: Thu, 19 Feb 2026 17:17:17 +0530 Subject: [PATCH 04/13] Remove Server-Timing instrumentation and clean up benchmark tooling MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit RequestTimer and Server-Timing header were premature — WASM guest profiling via profile.sh gives better per-function visibility without runtime overhead. Also strips dead --profile mode from benchmark.sh. 
--- .gitignore | 3 + OPTIMIZATION.md | 175 ++++++++++++------- crates/common/src/lib.rs | 2 +- crates/common/src/publisher.rs | 7 +- crates/common/src/request_timer.rs | 151 ---------------- crates/fastly/src/main.rs | 12 +- scripts/benchmark.sh | 146 +--------------- scripts/profile.sh | 269 +++++++++++++++++++++++++++++ 8 files changed, 386 insertions(+), 379 deletions(-) delete mode 100644 crates/common/src/request_timer.rs create mode 100755 scripts/profile.sh diff --git a/.gitignore b/.gitignore index af8ff99b..1bd7e773 100644 --- a/.gitignore +++ b/.gitignore @@ -21,3 +21,6 @@ src/*.html # SSL certificates *.pem + +/guest-profiles +/benchmark-results/** \ No newline at end of file diff --git a/OPTIMIZATION.md b/OPTIMIZATION.md index 72a5494f..77e7df45 100644 --- a/OPTIMIZATION.md +++ b/OPTIMIZATION.md @@ -4,11 +4,10 @@ | Item | Status | |------|--------| -| Production timing instrumentation (`RequestTimer`) | **Implemented** (on `feat/optimize-ts`, not yet deployed) | -| Benchmark tooling (`scripts/benchmark.sh`) | **Implemented** (includes `--profile` mode) | +| Benchmark tooling (`scripts/benchmark.sh`) | **Implemented** | +| WASM guest profiling (`scripts/profile.sh`) | **Implemented** (flame graphs via `--profile-guest`) | | Viceroy baseline measurements | **Complete** | | Staging external TTFB baseline | **Complete** (against staging deployment) | -| Server-Timing production data | **Blocked** — needs `feat/optimize-ts` deployed to staging | | Streaming architecture (`stream_to_client`) | **Planned** — see Phase 2 | | Code-level optimizations | **Planned** — see Phase 1 | @@ -35,19 +34,33 @@ streaming.finish()?; This changes the optimization strategy — **time-to-last-byte (TTLB) and peak memory CAN be significantly reduced**. TTFB itself is still gated by the Fastly platform floor (~200ms) plus backend response time, but body bytes start reaching the client as soon as the first chunk is processed instead of waiting for the entire response to be buffered. 
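The buffered-vs-streaming contrast can be sketched with plain `std::io` types. This is a stand-in sketch only: `Cursor` plays the upstream body and `Vec<u8>` plays the client sink, not the real Fastly `Body`/`StreamingBody` types. The point is that a `Write` sink receives each chunk as soon as it is produced, which is what moves TTLB earlier:

```rust
use std::io::{Cursor, Read, Write};

/// Copy `body` into `sink` in fixed-size chunks, flushing after each write.
/// With Fastly's `StreamingBody` (which implements `Write`) as the sink,
/// every flushed chunk reaches the client immediately; with the buffered
/// approach, nothing is sent until the whole body has been processed.
fn stream_copy<R: Read, W: Write>(body: &mut R, sink: &mut W) -> std::io::Result<u64> {
    let mut buf = [0u8; 8192]; // chunk size chosen arbitrarily for the sketch
    let mut total = 0u64;
    loop {
        let n = body.read(&mut buf)?;
        if n == 0 {
            return Ok(total); // upstream body exhausted
        }
        sink.write_all(&buf[..n])?;
        sink.flush()?; // on a real StreamingBody this pushes bytes downstream
        total += n as u64;
    }
}

fn main() -> std::io::Result<()> {
    let mut upstream = Cursor::new(vec![b'x'; 20_000]); // stand-in origin body
    let mut client: Vec<u8> = Vec::new(); // stand-in client sink
    let copied = stream_copy(&mut upstream, &mut client)?;
    assert_eq!(copied, 20_000);
    assert_eq!(client.len(), 20_000);
    println!("copied {copied} bytes in 8 KiB chunks");
    Ok(())
}
```

Swapping the sink for a real `StreamingBody` keeps the same loop shape, since `StreamingBody` also implements `std::io::Write`.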
-### Compatibility with `#[fastly::main]` — NEEDS SPIKE +### Compatibility with `#[fastly::main]` — use undecorated `main()` (recommended) -`stream_to_client()` consumes the Response and starts sending. The Fastly SDK enforces that only **one response** is sent per request via `assert_single_downstream_response_is_sent()`. The `#[fastly::main]` macro wraps your function and calls `send_to_client()` on the returned `Response` — so if `stream_to_client()` was already called, the macro **will trigger a panic**. +For streaming final responses, the Fastly SDK docs already define the intended pattern: -**This is an unresolved design problem that needs a prototype before committing to the streaming architecture.** +- `Request::from_client()` docs explicitly state it is incompatible with `#[fastly::main]` and recommend an undecorated `main()` with explicit response sending. +- `Response::send_to_client()` / `Response::stream_to_client()` include the same compatibility guidance. +- `fastly::init()` is public (doc-hidden) and can be called from raw `main()` to initialize the ABI. -Possible approaches (all need validation): +This means approach #1 is the correct architecture for streaming paths, and approaches like `std::process::exit(0)` or sentinel responses are unnecessary. -1. **Drop the `#[fastly::main]` macro** — write a raw `main()` that handles the Fastly request lifecycle manually, giving full control over when/how the response is sent. Need to verify the Fastly SDK supports this. -2. **Use `std::process::exit(0)` after streaming** — call `stream_to_client()`, process, `finish()`, then `exit(0)` before the macro gets a chance to call `send_to_client()`. Ugly, but may work if Fastly doesn't require cleanup. -3. **Return a sentinel Response** — investigate whether the SDK treats an already-sent response as a no-op instead of panicking. (Current source code suggests it **does** panic — needs testing on actual Fastly Compute, not just source reading.) 
+Recommended shape: -**Action item**: Create a minimal Fastly Compute service that calls `stream_to_client()` and test each approach. This spike should be done **before** any Phase 2 implementation work. +```rust +fn main() -> Result<(), fastly::Error> { + fastly::init(); + let req = fastly::Request::from_client(); + + match route_request(req)? { + Some(resp) => resp.send_to_client(), // non-streaming path + None => {} // streaming path already sent + finished + } + + Ok(()) +} +``` + +**Action item**: Do a focused spike on real Fastly Compute to validate runtime behavior (no double-send panics across mixed routes, proper error behavior for partially streamed responses, and observability expectations). The API viability question is resolved. Non-streaming endpoints (static JS, discovery, auction) continue returning `Response` normally. Only the publisher proxy path (the hot path) would use streaming. @@ -86,45 +99,31 @@ Measured on `main` branch. Value is in **relative comparison between branches**, ### Staging (External) -Measured externally against staging deployment (golf.com proxy), `main` branch (no Server-Timing deployed yet). +Measured externally against staging deployment (golf.com proxy), `main` branch. | Endpoint | TTFB | Total | Size | Notes | |---|---|---|---|---| -| `GET /static/tsjs=tsjs-unified.min.js` | ~204 ms | ~219 ms | 28 KB | No backend, pure platform overhead | +| `GET /static/tsjs=tsjs-unified.min.js` | ~204 ms | ~219 ms | 28 KB | No backend; includes client-network + edge path from benchmark vantage | | `GET /` (publisher proxy, golf.com) | ~234 ms | ~441 ms | 230 KB | Backend + processing | | `GET /.well-known/trusted-server.json` | ~191 ms | - | - | Returns 500 (needs investigation) | -**Key insight**: Static JS has ~204ms TTFB with zero backend work. This is the **Fastly platform floor** (WASM instantiation + edge routing + TLS). Application code cannot reduce this. 
The publisher proxy adds only ~30ms TTFB on top — but the full ~441ms total includes waiting for the entire response to be buffered before sending. With streaming, the ~207ms gap between TTFB (234ms) and TTLB (441ms) would shrink because body bytes stream as they're processed instead of being fully buffered. +**Key insight**: Static JS has ~204ms TTFB with zero backend work **from this specific benchmark vantage point**. That number includes client-to-edge RTT, DNS, TLS/connection state, and edge processing; it is **not** a universal Fastly floor. `WASM` instantiation can contribute on cold paths, but warm requests from clients near a POP can be much lower. + +For this dataset, treat static TTFB as an environment baseline and compare deltas: the publisher proxy adds only ~30ms TTFB on top. The larger optimization target is the TTFB→TTLB gap (~207ms here), which streaming can shrink by sending body chunks as they are processed instead of waiting for full buffering. --- ## Implementation Plan -### Phase 0: Deploy Server-Timing Instrumentation (DONE, needs deploy) +### Phase 0: Tooling and Baselines (DONE) **Branch**: `feat/optimize-ts` -Already implemented: -- `RequestTimer` in `crates/common/src/request_timer.rs` — tracks `init`, `backend`, `process`, `total` phases -- `Server-Timing` header emitted on every response -- Wired into `main.rs` and `publisher.rs` -- `scripts/benchmark.sh --profile` mode to collect and report Server-Timing data - -**Action**: Deploy `feat/optimize-ts` to staging, then run: -```bash -BENCH_URL=https://.edgecompute.app ./scripts/benchmark.sh --profile -``` - -This gives us the real `init`/`backend`/`process` split for golf.com requests. - -**Conflict with Phase 2 streaming**: The `Server-Timing` header is currently set **after** response processing completes (line 147 of `main.rs`), which includes `backend` and `process` phase durations. 
When we switch to `stream_to_client()` in Phase 2, headers are sent **before** processing starts — so `Server-Timing` cannot include the `backend`/`process`/`total` values. - -Options for Phase 2: -- **Move Server-Timing to a trailer** — `StreamingBody` supports trailers via `StreamingBodyExt::append_trailer()`. Requires client support (browsers generally ignore trailers). -- **Log-only instrumentation** — keep `RequestTimer` for server-side logging but don't include it in response headers on streaming paths. Non-streaming endpoints still get the header. -- **Keep both paths** — Phase 0 instrumentation continues working on the buffered path. Once streaming is validated and deployed, accept that Server-Timing headers are only available for non-streaming endpoints (static, auction, discovery). - -This is **not a blocker** for Phase 0 — the instrumentation is valuable right now on the current buffered architecture. Just be aware it will need adjustment when streaming lands. +Completed: +- `scripts/benchmark.sh` — HTTP load testing with TTFB analysis, cold start detection, endpoint latency breakdown +- `scripts/profile.sh` — WASM guest profiling via `fastly compute serve --profile-guest`, outputs Firefox Profiler-compatible flame graphs +- Viceroy baseline measurements (see tables above) +- Staging external TTFB baseline --- @@ -217,7 +216,46 @@ impl StreamProcessor for HtmlRewriterAdapter { |--------|-----|------| | Medium-High | ~3 | None | -#### 1.4 Trivial fixes batch +#### 1.4 Eliminate redundant `config` crate parsing in `get_settings()` — **22% CPU** + +**Files**: `crates/common/src/settings_data.rs`, `crates/common/src/settings.rs` + +**Problem**: Flame graph profiling shows `get_settings()` consuming ~22% of per-request CPU. The `build.rs` already merges `trusted-server.toml` + all `TRUSTED_SERVER__*` env vars at compile time and writes a fully-resolved TOML file to `target/trusted-server-out.toml`. 
But at runtime, `get_settings()` calls `Settings::from_toml()`, which re-runs the entire `config` crate pipeline — `Config::builder().add_source(File).add_source(Environment).build().try_deserialize()` — redundantly scanning env vars and merging sources that were already resolved at build time. + +**Root cause**: `settings_data.rs` embeds the build-time-resolved TOML via `include_bytes!`, then hands it to `from_toml()` which treats it as a raw config source and re-layers env vars on top. + +**Fix**: Replace `Settings::from_toml()` with direct `toml::from_str()` in `get_settings()`. The embedded TOML is already fully resolved — no `config` crate needed at runtime. + +```rust +// Before (22% CPU — re-runs config crate pipeline + env var scan) +let settings = Settings::from_toml(toml_str)?; + +// After (near-instant — just TOML deserialization) +let settings: Settings = toml::from_str(toml_str) + .change_context(TrustedServerError::Configuration { + message: "Failed to deserialize embedded config".to_string(), + })?; +``` + +**Alternative — binary serialization for near-zero cost**: Since `build.rs` already has a fully constructed `Settings` struct, it could serialize to `postcard` (a `no_std`-compatible, WASM-safe binary format). Runtime deserialization becomes a memcpy-like operation instead of TOML parsing. Requires adding `postcard` + updating `build.rs` to write binary and `settings_data.rs` to deserialize binary. + +```rust +// build.rs: serialize to binary instead of TOML +let bytes = postcard::to_allocvec(&settings).expect("Failed to serialize"); +fs::write(dest_path, bytes)?; + +// settings_data.rs: near-instant deserialization +let settings: Settings = postcard::from_bytes(SETTINGS_DATA) + .change_context(TrustedServerError::Configuration { ... })?; +``` + +**Recommendation**: Start with the `toml::from_str()` fix (1-line change, no new deps). If profiling still shows meaningful time in TOML parsing, upgrade to `postcard`. 
+ +| Impact | LOC | Risk | +|--------|-----|------| +| **Very High** (~22% CPU eliminated) | 1-3 | Low — `build.rs` already resolves everything | + +#### 1.5 Trivial fixes batch | Fix | File | LOC | |-----|------|-----| @@ -319,9 +357,9 @@ This would overlap origin fetch time with auction execution, so the browser star After implementing Phases 1-2: 1. Deploy to staging -2. Run `./scripts/benchmark.sh --profile` against staging -3. Compare Server-Timing data: `init`/`backend`/`process`/`total` before vs after -4. Compare external TTFB and time-to-last-byte +2. Run `./scripts/benchmark.sh` against staging for external TTFB/TTLB +3. Run `./scripts/profile.sh` locally for flame graph comparison +4. Compare external TTFB and time-to-last-byte before vs after 5. Check Fastly dashboard for memory/compute metrics 6. If improvement is marginal, don't ship the streaming architecture (Phase 2) @@ -337,11 +375,12 @@ After implementing Phases 1-2: | # | Optimization | Impact | LOC | Risk | Phase | |---|---|---|---|---|---| -| **P0** | Server-Timing instrumentation | Prerequisite | Done | None | 0 | +| **P0** | Tooling and baselines | Prerequisite | Done | None | 0 | | **1.1** | Gzip streaming fix | **High** (memory) | -15/+3 | Low | 1 | | **1.2** | HTML rewriter streaming | **High** (memory) | ~30 | Medium | 1 | | **1.3** | Remove verbose logging | Medium-High | ~3 | None | 1 | -| **1.4** | Trivial fixes batch | Low-Medium | ~50 | None | 1 | +| **1.4** | Eliminate redundant `config` crate in `get_settings()` | **Very High** (~22% CPU) | 1-3 | Low | 1 | +| **1.5** | Trivial fixes batch | Low-Medium | ~50 | None | 1 | | **2.1** | `stream_to_client()` integration | **High** (TTLB) | ~80-120 | Medium | 2 | | **2.2** | Concurrent origin + auction | **Very High** | ~150-200 | High | 2 (future) | @@ -405,29 +444,40 @@ brew install hey # HTTP load testing tool (auto-installed by benchmark.sh) ./scripts/benchmark.sh --ttfb # TTFB analysis only ./scripts/benchmark.sh --load-test # Load 
test only ./scripts/benchmark.sh --cold-start # Cold start analysis -./scripts/benchmark.sh --profile # Server-Timing phase breakdown ./scripts/benchmark.sh --save baseline # Save results to file ./scripts/benchmark.sh --compare baseline # Compare against saved results ``` -### Profiling Against Staging +### WASM Guest Profiling (Flame Graphs) + +`fastly compute serve --profile-guest` samples the WASM call stack every 50us and writes a Firefox Profiler-compatible JSON on exit. This shows exactly which Rust functions consume CPU time — compression, HTML rewriting, string operations, init, etc. ```bash -# Requires Server-Timing branch deployed -BENCH_URL=https://example.edgecompute.app ./scripts/benchmark.sh --profile +./scripts/profile.sh # Profile GET / (publisher proxy) +./scripts/profile.sh --endpoint /auction \ + --method POST --body '{"adUnits":[]}' # Profile specific endpoint +./scripts/profile.sh --requests 50 # More samples for stable flame graph +./scripts/profile.sh --no-build # Skip rebuild +./scripts/profile.sh --open # Auto-open Firefox Profiler (macOS) + +# View: drag output file onto https://profiler.firefox.com/ ``` -### What the Benchmark Measures +The script builds, starts the profiling server, fires requests, stops the server, and saves the profile to `benchmark-results/profiles/`. 
-| Test | What it tells you | +### What the Tools Measure + +| Tool | What it tells you | |---|---| -| TTFB analysis | 20 sequential requests — detects cold start patterns | -| Cold start | First vs subsequent request latency | -| Endpoint latency | Per-endpoint timing breakdown (DNS, connect, TTFB, total) | -| Load test (hey) | Throughput (req/sec), latency distribution (P50/P95/P99) | -| Profile | Server-Timing phase breakdown: `init`/`backend`/`process`/`total` with min/avg/max/p95 | +| `benchmark.sh` — TTFB analysis | 20 sequential requests — detects cold start patterns | +| `benchmark.sh` — Cold start | First vs subsequent request latency | +| `benchmark.sh` — Endpoint latency | Per-endpoint timing breakdown (DNS, connect, TTFB, total) | +| `benchmark.sh` — Load test (hey) | Throughput (req/sec), latency distribution (P50/P95/P99) | +| `profile.sh` | Per-function CPU time inside WASM — flame graph via `--profile-guest` | + +**Use `profile.sh` first** to identify which functions are bottlenecks, then use `benchmark.sh` to measure the impact of fixes on external timing. 
-### What the Benchmark Does NOT Measure +### What These Tools Do NOT Measure - Real Fastly edge performance (Viceroy is a simulator) - WASM cold start on actual Fastly infrastructure @@ -442,11 +492,8 @@ BENCH_URL=https://example.edgecompute.app ./scripts/benchmark.sh --profile | File | Change | |------|--------| -| `crates/common/src/request_timer.rs` | **New** — `RequestTimer` with `Server-Timing` header output | -| `crates/common/src/lib.rs` | Added `pub mod request_timer;` | -| `crates/fastly/src/main.rs` | Wired timer: created at top, `mark_init()`, passed to handlers, `Server-Timing` header set | -| `crates/common/src/publisher.rs` | Added `mark_backend()` after `req.send()`, `mark_process()` after body processing | -| `scripts/benchmark.sh` | Added `--profile` mode, auto-install `hey` | +| `scripts/benchmark.sh` | HTTP load testing, TTFB analysis, cold start detection, auto-install `hey` | +| `scripts/profile.sh` | WASM guest profiling via `--profile-guest`, flame graph workflow | | `OPTIMIZATION.md` | This document | ### Teammate's `streaming_processor.rs` Changes @@ -469,9 +516,7 @@ Fix: change `process_through_compression` to accept an optional finalization clo ### Decisions Needed -1. **Deploy `feat/optimize-ts` to staging?** — Needed to get real Server-Timing data before proceeding with optimizations -2. **`#[fastly::main]` + `stream_to_client()` spike** — The macro calls `send_to_client()` on the returned Response, which will panic if streaming was already started. We need a minimal prototype to validate the approach before any Phase 2 work. See "Compatibility with `#[fastly::main]`" section above. -3. **Phase 1 vs Phase 2 priority** — Phase 1 (code fixes) is low risk and can ship independently. Phase 2 (streaming architecture) is higher impact but higher risk, and blocked on decision #2. -4. 
**Server-Timing on streaming paths** — `stream_to_client()` sends headers before processing completes, so `Server-Timing` can't include `backend`/`process` phases. Options: trailers, log-only, or accept the limitation. See Phase 0 section. -5. **Concurrent auction + origin (2.2)** — Not applicable for golf.com. Defer to a separate ticket? -6. **GzEncoder `finish()` correctness** — Fix the `drop(encoder)` error swallowing in `process_through_compression`, or accept the risk? +1. **Raw `main()` migration spike** — Validate end-to-end behavior on Fastly Compute when using undecorated `main()` + `Request::from_client()` and mixing buffered + streaming routes in one service. +2. **Phase 1 vs Phase 2 priority** — Phase 1 (code fixes) is low risk and can ship independently. Phase 2 (streaming architecture) is higher impact and should proceed after decision #1 confirms runtime behavior. +3. **Concurrent auction + origin (2.2)** — Not applicable for golf.com. Defer to a separate ticket? +4. **GzEncoder `finish()` correctness** — Fix the `drop(encoder)` error swallowing in `process_through_compression`, or accept the risk? 
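
The `GzEncoder` question above comes down to `Drop` discarding I/O errors that `finish()` would surface. A std-only sketch of the hazard — `Encoder` here is a stand-in for `flate2::write::GzEncoder`, not the real API:

```rust
use std::io::{self, Write};

// Stand-in for `flate2::write::GzEncoder`: a trailer must be written before
// the underlying writer is released.
struct Encoder<W: Write> {
    inner: Option<W>,
}

impl<W: Write> Encoder<W> {
    fn new(inner: W) -> Self {
        Self { inner: Some(inner) }
    }

    /// Explicit finalization: a failed trailer write is reported to the caller.
    fn finish(mut self) -> io::Result<W> {
        let mut w = self.inner.take().expect("finish called twice");
        w.write_all(b"TRAILER")?;
        Ok(w)
    }
}

impl<W: Write> Drop for Encoder<W> {
    fn drop(&mut self) {
        if let Some(w) = self.inner.as_mut() {
            // `drop(encoder)` lands here: any trailer-write error is discarded.
            let _ = w.write_all(b"TRAILER");
        }
    }
}

/// A writer that always fails, making the swallowed error observable.
struct FailingWriter;

impl Write for FailingWriter {
    fn write(&mut self, _buf: &[u8]) -> io::Result<usize> {
        Err(io::Error::new(io::ErrorKind::Other, "disk full"))
    }
    fn flush(&mut self) -> io::Result<()> {
        Ok(())
    }
}
```

`drop(Encoder::new(FailingWriter))` completes silently while `Encoder::new(FailingWriter).finish()` returns `Err` — which is the argument for changing `process_through_compression` to call `finish()` explicitly rather than relying on `Drop`.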
diff --git a/crates/common/src/lib.rs b/crates/common/src/lib.rs index c43ed8a3..fd6fe5e1 100644 --- a/crates/common/src/lib.rs +++ b/crates/common/src/lib.rs @@ -51,7 +51,7 @@ pub mod openrtb; pub mod proxy; pub mod publisher; pub mod request_signing; -pub mod request_timer; + pub mod rsc_flight; pub mod settings; pub mod settings_data; diff --git a/crates/common/src/publisher.rs b/crates/common/src/publisher.rs index 0aa2d648..0794f066 100644 --- a/crates/common/src/publisher.rs +++ b/crates/common/src/publisher.rs @@ -9,7 +9,7 @@ use crate::constants::{COOKIE_SYNTHETIC_ID, HEADER_X_COMPRESS_HINT, HEADER_X_SYN use crate::cookies::create_synthetic_cookie; use crate::error::TrustedServerError; use crate::integrations::IntegrationRegistry; -use crate::request_timer::RequestTimer; + use crate::rsc_flight::RscFlightUrlRewriter; use crate::settings::Settings; use crate::streaming_processor::{Compression, PipelineConfig, StreamProcessor, StreamingPipeline}; @@ -177,7 +177,6 @@ pub fn handle_publisher_request( settings: &Settings, integration_registry: &IntegrationRegistry, mut req: Request, - timer: &mut RequestTimer, ) -> Result> { log::debug!("Proxying request to publisher_origin"); @@ -237,8 +236,6 @@ pub fn handle_publisher_request( message: "Failed to proxy request to origin".to_string(), })?; - timer.mark_backend(); - // Log all response headers for debugging log::debug!("Response headers:"); for (name, value) in response.get_headers() { @@ -314,8 +311,6 @@ pub fn handle_publisher_request( ); } - timer.mark_process(); - response.set_header(HEADER_X_SYNTHETIC_ID, synthetic_id.as_str()); if !has_synthetic_cookie { response.set_header( diff --git a/crates/common/src/request_timer.rs b/crates/common/src/request_timer.rs deleted file mode 100644 index ca3d07a3..00000000 --- a/crates/common/src/request_timer.rs +++ /dev/null @@ -1,151 +0,0 @@ -//! Lightweight per-request timer for profiling the Fastly Compute request lifecycle. -//! -//! 
Records phase durations using [`std::time::Instant`] and emits them as a -//! [`Server-Timing`](https://developer.mozilla.org/en-US/docs/Web/HTTP/Reference/Headers/Server-Timing) -//! header value so that timings are visible in browser `DevTools` (Network → Timing tab). - -use std::time::Instant; - -/// Records wall-clock durations for each phase of a request. -/// -/// Usage: -/// ```ignore -/// let mut timer = RequestTimer::new(); // captures t0 -/// // ... init work ... -/// timer.mark_init(); // captures init duration -/// // ... backend fetch ... -/// timer.mark_backend(); // captures backend duration -/// // ... body processing ... -/// timer.mark_process(); // captures process duration -/// response.set_header("Server-Timing", timer.header_value()); -/// ``` -pub struct RequestTimer { - start: Instant, - init_ms: Option, - backend_ms: Option, - process_ms: Option, - last_mark: Instant, -} - -impl RequestTimer { - /// Start a new timer. Call this as early as possible in `main()`. - #[must_use] - pub fn new() -> Self { - let now = Instant::now(); - Self { - start: now, - init_ms: None, - backend_ms: None, - process_ms: None, - last_mark: now, - } - } - - /// Mark the end of the initialization phase (settings, orchestrator, registry). - pub fn mark_init(&mut self) { - let now = Instant::now(); - self.init_ms = Some(duration_ms(self.last_mark, now)); - self.last_mark = now; - } - - /// Mark the end of the backend fetch phase. - pub fn mark_backend(&mut self) { - let now = Instant::now(); - self.backend_ms = Some(duration_ms(self.last_mark, now)); - self.last_mark = now; - } - - /// Mark the end of body processing (decompress, rewrite, recompress). - pub fn mark_process(&mut self) { - let now = Instant::now(); - self.process_ms = Some(duration_ms(self.last_mark, now)); - self.last_mark = now; - } - - /// Total elapsed time since the timer was created. 
- #[must_use] - pub fn total_ms(&self) -> f64 { - duration_ms(self.start, Instant::now()) - } - - /// Format as a `Server-Timing` header value. - /// - /// Example output: - /// `init;dur=1.2, backend;dur=385.4, process;dur=12.3, total;dur=401.5` - #[must_use] - pub fn header_value(&self) -> String { - let mut parts = Vec::with_capacity(4); - - if let Some(ms) = self.init_ms { - parts.push(format!("init;dur={ms:.1}")); - } - if let Some(ms) = self.backend_ms { - parts.push(format!("backend;dur={ms:.1}")); - } - if let Some(ms) = self.process_ms { - parts.push(format!("process;dur={ms:.1}")); - } - - parts.push(format!("total;dur={:.1}", self.total_ms())); - parts.join(", ") - } - - /// Format a single-line log string for Fastly logs. - #[must_use] - pub fn log_line(&self) -> String { - format!( - "RequestTimer: init={:.1}ms backend={:.1}ms process={:.1}ms total={:.1}ms", - self.init_ms.unwrap_or(0.0), - self.backend_ms.unwrap_or(0.0), - self.process_ms.unwrap_or(0.0), - self.total_ms(), - ) - } -} - -impl Default for RequestTimer { - fn default() -> Self { - Self::new() - } -} - -fn duration_ms(from: Instant, to: Instant) -> f64 { - to.duration_since(from).as_secs_f64() * 1000.0 -} - -#[cfg(test)] -mod tests { - use super::*; - - #[test] - fn header_value_includes_all_phases() { - let mut timer = RequestTimer::new(); - timer.mark_init(); - timer.mark_backend(); - timer.mark_process(); - - let header = timer.header_value(); - assert!(header.contains("init;dur="), "missing init phase"); - assert!(header.contains("backend;dur="), "missing backend phase"); - assert!(header.contains("process;dur="), "missing process phase"); - assert!(header.contains("total;dur="), "missing total phase"); - } - - #[test] - fn header_value_omits_unmarked_phases() { - let timer = RequestTimer::new(); - let header = timer.header_value(); - assert!(!header.contains("init;dur=")); - assert!(!header.contains("backend;dur=")); - assert!(header.contains("total;dur=")); - } - - #[test] - fn 
log_line_uses_zero_for_unmarked() { - let timer = RequestTimer::new(); - let log = timer.log_line(); - assert!(log.contains("init=0.0ms")); - assert!(log.contains("backend=0.0ms")); - assert!(log.contains("process=0.0ms")); - } -} diff --git a/crates/fastly/src/main.rs b/crates/fastly/src/main.rs index a060c400..0112bd99 100644 --- a/crates/fastly/src/main.rs +++ b/crates/fastly/src/main.rs @@ -17,7 +17,6 @@ use trusted_server_common::request_signing::{ handle_deactivate_key, handle_rotate_key, handle_trusted_server_discovery, handle_verify_signature, }; -use trusted_server_common::request_timer::RequestTimer; use trusted_server_common::settings::Settings; use trusted_server_common::settings_data::get_settings; @@ -26,8 +25,6 @@ use crate::error::to_error_response; #[fastly::main] fn main(req: Request) -> Result { - let mut timer = RequestTimer::new(); - init_logger(); let settings = match get_settings() { @@ -50,14 +47,11 @@ fn main(req: Request) -> Result { } }; - timer.mark_init(); - futures::executor::block_on(route_request( &settings, &orchestrator, &integration_registry, req, - &mut timer, )) } @@ -66,7 +60,6 @@ async fn route_request( orchestrator: &AuctionOrchestrator, integration_registry: &IntegrationRegistry, req: Request, - timer: &mut RequestTimer, ) -> Result { log::info!( "FASTLY_SERVICE_VERSION: {}", @@ -126,7 +119,7 @@ async fn route_request( path ); - match handle_publisher_request(settings, integration_registry, req, timer) { + match handle_publisher_request(settings, integration_registry, req) { Ok(response) => Ok(response), Err(e) => { log::error!("Failed to proxy to publisher origin: {:?}", e); @@ -143,9 +136,6 @@ async fn route_request( response.set_header(key, value); } - log::info!("{}", timer.log_line()); - response.set_header("Server-Timing", timer.header_value()); - Ok(response) } diff --git a/scripts/benchmark.sh b/scripts/benchmark.sh index 8428f36c..daebccb3 100755 --- a/scripts/benchmark.sh +++ b/scripts/benchmark.sh @@ -14,7 +14,7 
@@ # ./scripts/benchmark.sh --cold-start # Cold start analysis only # ./scripts/benchmark.sh --load-test # Load test only # ./scripts/benchmark.sh --quick # Quick smoke test (fewer requests) -# ./scripts/benchmark.sh --profile # Server-Timing phase breakdown (init/backend/process) +# ./scripts/benchmark.sh --ttfb # TTFB analysis only # ./scripts/benchmark.sh --save baseline # Save results to file # ./scripts/benchmark.sh --compare baseline # Compare against saved results # @@ -273,147 +273,6 @@ run_first_byte_analysis() { echo "" } -# --- Server-Timing Profiler --- - -# Parse "init;dur=1.2, backend;dur=385.4, process;dur=12.3, total;dur=401.5" -# into associative-style variables: st_init=1.2, st_backend=385.4, etc. -parse_server_timing() { - local header="$1" - st_init="" st_backend="" st_process="" st_total="" - for part in $(echo "$header" | tr ',' '\n'); do - local name dur - name=$(echo "$part" | sed 's/;.*//' | tr -d ' ') - dur=$(echo "$part" | grep -o 'dur=[0-9.]*' | cut -d= -f2) - case "$name" in - init) st_init="$dur" ;; - backend) st_backend="$dur" ;; - process) st_process="$dur" ;; - total) st_total="$dur" ;; - esac - done -} - -# Collect Server-Timing data over N requests and print stats -# Also captures external TTFB and total (TTLB) for streaming comparison -profile_endpoint() { - local method="$1" - local url="$2" - local label="$3" - local iterations="${4:-20}" - shift 4 - local extra_args=("$@") - - local init_vals=() backend_vals=() process_vals=() total_vals=() - local ttfb_vals=() ttlb_vals=() - - for i in $(seq 1 "$iterations"); do - # Capture both Server-Timing header and curl timing in one request - local raw - raw=$(curl -s -D- -o /dev/null \ - -w '\n__CURL_TIMING__ %{time_starttransfer} %{time_total}' \ - -X "$method" \ - ${extra_args[@]+"${extra_args[@]}"} \ - "$url" \ - --max-time 30 2>/dev/null) - - # Extract Server-Timing header - local header - header=$(echo "$raw" | grep -i '^server-timing:' | sed 's/[Ss]erver-[Tt]iming: *//') - - # 
Extract curl timing (TTFB and total in seconds) - local curl_timing - curl_timing=$(echo "$raw" | grep '__CURL_TIMING__' | sed 's/__CURL_TIMING__ //') - if [ -n "$curl_timing" ]; then - local ext_ttfb ext_total - ext_ttfb=$(echo "$curl_timing" | awk '{printf "%.1f", $1 * 1000}') - ext_total=$(echo "$curl_timing" | awk '{printf "%.1f", $2 * 1000}') - ttfb_vals+=("$ext_ttfb") - ttlb_vals+=("$ext_total") - fi - - if [ -z "$header" ]; then - continue - fi - - parse_server_timing "$header" - [ -n "$st_init" ] && init_vals+=("$st_init") - [ -n "$st_backend" ] && backend_vals+=("$st_backend") - [ -n "$st_process" ] && process_vals+=("$st_process") - [ -n "$st_total" ] && total_vals+=("$st_total") - done - - echo -e " ${BOLD}$label${RESET} ($method, $iterations iterations)" - echo "" - printf " %-12s %8s %8s %8s %8s\n" "Phase" "Min" "Avg" "Max" "P95" - printf " %-12s %8s %8s %8s %8s\n" "----------" "------" "------" "------" "------" - print_stats "init" "${init_vals[@]}" - print_stats "backend" "${backend_vals[@]}" - print_stats "process" "${process_vals[@]}" - print_stats "total" "${total_vals[@]}" - echo "" - echo -e " ${BOLD}External timing (curl):${RESET}" - printf " %-12s %8s %8s %8s %8s\n" "Metric" "Min" "Avg" "Max" "P95" - printf " %-12s %8s %8s %8s %8s\n" "----------" "------" "------" "------" "------" - print_stats "TTFB" "${ttfb_vals[@]}" - print_stats "TTLB" "${ttlb_vals[@]}" - echo "" -} - -# Compute min/avg/max/p95 from a list of floats -print_stats() { - local name="$1" - shift - local vals=("$@") - local count=${#vals[@]} - - if [ "$count" -eq 0 ]; then - printf " %-12s %8s %8s %8s %8s\n" "$name" "-" "-" "-" "-" - return - fi - - # Sort values - local sorted - sorted=$(printf '%s\n' "${vals[@]}" | sort -g) - - local min avg max p95 - min=$(echo "$sorted" | head -1) - max=$(echo "$sorted" | tail -1) - - local sum - sum=$(printf '%s\n' "${vals[@]}" | awk '{s+=$1} END {printf "%.1f", s}') - avg=$(echo "$sum $count" | awk '{printf "%.1f", $1/$2}') - - local 
p95_idx - p95_idx=$(echo "$count" | awk '{printf "%d", int($1 * 0.95 + 0.5)}') - [ "$p95_idx" -lt 1 ] && p95_idx=1 - p95=$(echo "$sorted" | sed -n "${p95_idx}p") - - printf " %-12s %7.1f %7.1f %7.1f %7.1f\n" "$name" "$min" "$avg" "$max" "$p95" -} - -run_profile() { - local iterations="${1:-20}" - - log_header "SERVER-TIMING PROFILE" - log_info "Collecting Server-Timing header data over $iterations requests per endpoint" - log_info "Phases: init (setup) → backend (origin fetch) → process (body rewrite) → total" - echo "" - - profile_endpoint GET "$BASE_URL/static/tsjs=tsjs-unified.min.js" \ - "Static JS bundle" "$iterations" - - profile_endpoint GET "$BASE_URL/.well-known/trusted-server.json" \ - "Discovery endpoint" "$iterations" - - profile_endpoint GET "$BASE_URL/" \ - "Publisher proxy (fallback)" "$iterations" - - profile_endpoint POST "$BASE_URL/auction" \ - "Auction endpoint" "$iterations" \ - -H "Content-Type: application/json" \ - -d "$AUCTION_PAYLOAD" -} - save_results() { local name="$1" mkdir -p "$RESULTS_DIR" @@ -495,9 +354,6 @@ main() { --ttfb) run_first_byte_analysis ;; - --profile) - run_profile "${2:-20}" - ;; --save) save_results "${2:?Usage: --save }" ;; diff --git a/scripts/profile.sh b/scripts/profile.sh new file mode 100755 index 00000000..66cebf0d --- /dev/null +++ b/scripts/profile.sh @@ -0,0 +1,269 @@ +#!/usr/bin/env bash +# +# WASM Guest Profiler for Trusted Server +# +# Captures function-level flame graphs using Fastly's Wasmtime guest profiler. +# Samples the WASM call stack every 50us and writes a Firefox Profiler-compatible +# JSON file after the server stops. 
+# +# Prerequisites: +# - Fastly CLI installed: https://developer.fastly.com/learning/tools/cli +# - Rust wasm32-wasip1 target: rustup target add wasm32-wasip1 +# +# Usage: +# ./scripts/profile.sh # Profile GET / (publisher proxy) +# ./scripts/profile.sh --endpoint /auction \ +# --method POST --body '{"adUnits":[]}' # Profile specific endpoint +# ./scripts/profile.sh --requests 50 # More samples for stable flame graph +# ./scripts/profile.sh --no-build # Skip rebuild, use existing binary +# ./scripts/profile.sh --open # Auto-open Firefox Profiler (macOS) +# +# Output: +# Profile saved to benchmark-results/profiles/.json +# View: drag file onto https://profiler.firefox.com/ +# + +set -euo pipefail + +# --- Configuration --- +PROJECT_ROOT="$(cd "$(dirname "$0")/.." && pwd)" +PROFILE_DIR="$PROJECT_ROOT/benchmark-results/profiles" +BASE_URL="http://127.0.0.1:7676" +SERVER_PID="" + +# Defaults +ENDPOINT="/" +METHOD="GET" +REQUESTS=20 +BODY="" +SKIP_BUILD=false +AUTO_OPEN=false + +# Colors (disabled if not a terminal) +if [ -t 1 ]; then + BOLD='\033[1m' + GREEN='\033[0;32m' + YELLOW='\033[0;33m' + RED='\033[0;31m' + CYAN='\033[0;36m' + RESET='\033[0m' +else + BOLD='' GREEN='' YELLOW='' RED='' CYAN='' RESET='' +fi + +# --- Helpers --- + +log_header() { + echo "" + echo -e "${BOLD}${CYAN}=== $1 ===${RESET}" + echo "" +} + +log_info() { + echo -e "${GREEN}[INFO]${RESET} $1" +} + +log_warn() { + echo -e "${YELLOW}[WARN]${RESET} $1" +} + +log_error() { + echo -e "${RED}[ERROR]${RESET} $1" +} + +stop_server() { + # Kill the fastly CLI process if we have its PID + if [ -n "$SERVER_PID" ] && kill -0 "$SERVER_PID" 2>/dev/null; then + kill "$SERVER_PID" 2>/dev/null || true + wait "$SERVER_PID" 2>/dev/null || true + fi + # Also kill any Viceroy process still on port 7676 + # (fastly CLI spawns Viceroy as a child; killing the CLI doesn't always propagate) + local port_pids + port_pids=$(lsof -ti :7676 2>/dev/null | while read pid; do + # Only kill Viceroy processes, not unrelated 
listeners (e.g. Chrome) + if ps -p "$pid" -o command= 2>/dev/null | grep -q viceroy; then + echo "$pid" + fi + done) + if [ -n "$port_pids" ]; then + echo "$port_pids" | xargs kill 2>/dev/null || true + sleep 1 + fi +} + +cleanup() { + stop_server +} + +trap cleanup EXIT + +usage() { + echo "Usage: $0 [OPTIONS]" + echo "" + echo "Options:" + echo " --endpoint PATH URL path to profile (default: /)" + echo " --method METHOD HTTP method (default: GET)" + echo " --body DATA Request body for POST/PUT" + echo " --requests N Number of requests to fire (default: 20)" + echo " --no-build Skip fastly compute build" + echo " --open Auto-open Firefox Profiler after capture (macOS)" + echo " --help Show this help" + exit 0 +} + +# --- Parse Arguments --- + +while [[ $# -gt 0 ]]; do + case "$1" in + --endpoint) ENDPOINT="$2"; shift 2 ;; + --method) METHOD="$2"; shift 2 ;; + --body) BODY="$2"; shift 2 ;; + --requests) REQUESTS="$2"; shift 2 ;; + --no-build) SKIP_BUILD=true; shift ;; + --open) AUTO_OPEN=true; shift ;; + --help|-h) usage ;; + *) log_error "Unknown option: $1"; usage ;; + esac +done + +# --- Main --- + +log_header "WASM GUEST PROFILER" +log_info "Endpoint: $METHOD $ENDPOINT" +log_info "Requests: $REQUESTS" + +# Step 0: Kill any existing server on the profiling port +EXISTING_PID=$(lsof -ti :7676 2>/dev/null | grep -v "^$" || true) +if [ -n "$EXISTING_PID" ]; then + log_warn "Port 7676 already in use (PID: $EXISTING_PID). Stopping existing server..." + kill $EXISTING_PID 2>/dev/null || true + sleep 1 + # Force kill if still alive + if lsof -ti :7676 &>/dev/null; then + kill -9 $(lsof -ti :7676) 2>/dev/null || true + sleep 1 + fi + log_info "Existing server stopped." +fi + +# Step 1: Build +if [ "$SKIP_BUILD" = false ]; then + log_header "BUILD" + log_info "Building WASM binary with debug symbols (release + debug=1)..." + (cd "$PROJECT_ROOT" && fastly compute build) + echo "" + log_info "Build complete." 
+else + log_info "Skipping build (--no-build)" +fi + +# Step 2: Start server with --profile-guest +log_header "START PROFILING SERVER" +log_info "Starting fastly compute serve --profile-guest..." + +(cd "$PROJECT_ROOT" && fastly compute serve --profile-guest 2>&1) & +SERVER_PID=$! +log_info "Server PID: $SERVER_PID" + +# Wait for server to be ready +log_info "Waiting for server at $BASE_URL..." +for i in $(seq 1 30); do + if curl -s -o /dev/null --max-time 2 "$BASE_URL/" 2>/dev/null; then + log_info "Server ready." + break + fi + if ! kill -0 "$SERVER_PID" 2>/dev/null; then + log_error "Server process exited unexpectedly." + exit 1 + fi + if [ "$i" -eq 30 ]; then + log_error "Server did not become ready within 30 seconds." + exit 1 + fi + sleep 1 +done + +# Step 3: Fire requests +log_header "CAPTURING PROFILE" +log_info "Firing $REQUESTS requests to $METHOD $ENDPOINT..." + +CURL_ARGS=(-s -o /dev/null -X "$METHOD") +if [ -n "$BODY" ]; then + CURL_ARGS+=(-H "Content-Type: application/json" -d "$BODY") +fi + +for i in $(seq 1 "$REQUESTS"); do + local_code=$(curl -w "%{http_code}" "${CURL_ARGS[@]}" "${BASE_URL}${ENDPOINT}" --max-time 30 2>/dev/null || echo "000") + printf "\r Request %d/%d (HTTP %s)" "$i" "$REQUESTS" "$local_code" +done +echo "" +log_info "All requests complete." + +# Step 4: Stop server (profile is written on exit) +log_header "COLLECTING PROFILE" +log_info "Stopping server to flush profile data..." 
+ +stop_server +SERVER_PID="" + +# Step 5: Find and move profile file +# Viceroy writes profiles to guest-profiles/ directory (e.g., guest-profiles/1771483114-2.json) +# or as guest-profile-*.json in the project root depending on CLI version +mkdir -p "$PROFILE_DIR" +TIMESTAMP=$(date '+%Y%m%d-%H%M%S') + +GUEST_PROFILES_DIR="$PROJECT_ROOT/guest-profiles" +if [ -d "$GUEST_PROFILES_DIR" ]; then + # Find the most recently modified .json file in guest-profiles/ + PROFILE_FILE=$(find "$GUEST_PROFILES_DIR" -name "*.json" -newer "$0" -print 2>/dev/null | head -1 || true) + if [ -n "$PROFILE_FILE" ]; then + DEST="$PROFILE_DIR/profile-${TIMESTAMP}.json" + cp "$PROFILE_FILE" "$DEST" + fi +fi + +if [ -z "${DEST:-}" ] || [ ! -f "${DEST:-}" ]; then + # Fallback: check project root for guest-profile-*.json + PROFILE_FILE=$(find "$PROJECT_ROOT" -maxdepth 1 -name "guest-profile-*.json" -newer "$0" -print -quit 2>/dev/null || true) + if [ -n "$PROFILE_FILE" ]; then + DEST="$PROFILE_DIR/profile-${TIMESTAMP}.json" + mv "$PROFILE_FILE" "$DEST" + fi +fi + +if [ -z "${DEST:-}" ] || [ ! -f "${DEST:-}" ]; then + log_warn "No profile file found." + log_warn "Check $GUEST_PROFILES_DIR/ or $PROJECT_ROOT/ for profile output." + log_warn "The --profile-guest flag may not be supported by your Fastly CLI version." + exit 1 +fi + +FILE_SIZE=$(du -h "$DEST" | cut -f1) + +log_header "PROFILE CAPTURED" +log_info "File: $DEST" +log_info "Size: $FILE_SIZE" +log_info "Samples: ~$((REQUESTS * 20)) (estimated at 50us intervals)" +echo "" +echo -e "${BOLD}To view the flame graph:${RESET}" +echo " 1. Open https://profiler.firefox.com/" +echo " 2. 
Drag and drop: $DEST" +echo "" +echo -e "${BOLD}What to look for:${RESET}" +echo " - Tall stacks in GzDecoder/GzEncoder = compression overhead" +echo " - Wide bars in lol_html = HTML rewriting cost" +echo " - Time in format!/replace/to_string = string allocation churn" +echo " - Time in Settings::deserialize = init overhead" +echo "" + +# Step 6: Auto-open if requested +if [ "$AUTO_OPEN" = true ]; then + if command -v open &>/dev/null; then + log_info "Opening Firefox Profiler..." + open "https://profiler.firefox.com/" + log_info "Drag the profile file onto the page to load it." + else + log_warn "--open is only supported on macOS" + fi +fi From 33b527d9eefde69022632783b1fdc89257fa35a1 Mon Sep 17 00:00:00 2001 From: prk-Jr Date: Thu, 19 Feb 2026 19:51:11 +0530 Subject: [PATCH 05/13] Optimize get_settings() by bypassing redundant config crate at runtime MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit build.rs already resolves trusted-server.toml + env vars at compile time and embeds the result. Replace Settings::from_toml() with direct toml::from_str() to skip the config crate pipeline on every request. Profiling confirms: ~5-8% → ~3.3% CPU per request. 
--- OPTIMIZATION.md | 254 +++++++++++++++-------------- crates/common/Cargo.toml | 1 + crates/common/src/settings.rs | 2 +- crates/common/src/settings_data.rs | 18 +- 4 files changed, 150 insertions(+), 125 deletions(-) diff --git a/OPTIMIZATION.md b/OPTIMIZATION.md index 77e7df45..05e23247 100644 --- a/OPTIMIZATION.md +++ b/OPTIMIZATION.md @@ -1,82 +1,49 @@ # Trusted Server Optimization Plan -## Status +## Summary -| Item | Status | -|------|--------| -| Benchmark tooling (`scripts/benchmark.sh`) | **Implemented** | -| WASM guest profiling (`scripts/profile.sh`) | **Implemented** (flame graphs via `--profile-guest`) | -| Viceroy baseline measurements | **Complete** | -| Staging external TTFB baseline | **Complete** (against staging deployment) | -| Streaming architecture (`stream_to_client`) | **Planned** — see Phase 2 | -| Code-level optimizations | **Planned** — see Phase 1 | +This document presents a performance analysis and optimization plan for the Trusted Server running on Fastly Compute (WASM). WASM guest profiling reveals that **HTML processing consumes ~76% of per-request CPU** on the publisher proxy path, with the `lol_html` parser alone accounting for ~47%. The optimization strategy focuses on two phases: (1) low-risk code fixes that reduce memory waste and enable streaming, and (2) an architectural shift to `stream_to_client()` that eliminates response buffering and reduces time-to-last-byte. --- -## Key Finding: Streaming to Client IS Possible - -The Fastly Compute SDK provides `Response::stream_to_client()` which returns a `StreamingBody` handle that implements `std::io::Write`. Headers are sent immediately and body chunks stream as they're written. 
- -```rust -// Current: fully buffered (no bytes reach client until everything is done) -let body = response.take_body(); -let mut output = Vec::new(); -pipeline.process(body, &mut output)?; // blocks until complete -response.set_body(Body::from(output)); // only NOW does client get anything -return Ok(response); - -// Possible: streaming (headers sent immediately, body chunks as processed) -let body = response.take_body(); -let mut streaming = response.stream_to_client(); // headers sent NOW -pipeline.process(body, &mut streaming)?; // each write() → client -streaming.finish()?; -``` +## Profiling Results -This changes the optimization strategy — **time-to-last-byte (TTLB) and peak memory CAN be significantly reduced**. TTFB itself is still gated by the Fastly platform floor (~200ms) plus backend response time, but body bytes start reaching the client as soon as the first chunk is processed instead of waiting for the entire response to be buffered. +**Methodology**: WASM guest profiling via `fastly compute serve --profile-guest`, 50 requests to `GET /` (publisher proxy to golf.com, 222KB HTML). ~131 samples per request at 50μs intervals. Profiles analyzed in Firefox Profiler. -### Compatibility with `#[fastly::main]` — use undecorated `main()` (recommended) - -For streaming final responses, the Fastly SDK docs already define the intended pattern: - -- `Request::from_client()` docs explicitly state it is incompatible with `#[fastly::main]` and recommend an undecorated `main()` with explicit response sending. -- `Response::send_to_client()` / `Response::stream_to_client()` include the same compatibility guidance. -- `fastly::init()` is public (doc-hidden) and can be called from raw `main()` to initialize the ABI. - -This means approach #1 is the correct architecture for streaming paths, and approaches like `std::process::exit(0)` or sentinel responses are unnecessary. 
- -Recommended shape: - -```rust -fn main() -> Result<(), fastly::Error> { - fastly::init(); - let req = fastly::Request::from_client(); - - match route_request(req)? { - Some(resp) => resp.send_to_client(), // non-streaming path - None => {} // streaming path already sent + finished - } +### CPU Breakdown — Top Level - Ok(()) -} -``` +| % CPU | Function | Notes | +|-------|----------|-------| +| ~96% | `trusted_server_fastly::main` | Almost all time is in application code | +| ~90% | `route_request` → `handle_publisher_request` | Publisher proxy is the hot path | +| **~76%** | **HTML processing pipeline** (`streaming_processor` → `lol_html`) | **Dominant bottleneck** | +| ~~5-8%~~ → **3.3%** | `get_settings()` | ~~Redundant config crate parsing~~ **Fixed** — now uses `toml::from_str` | +| ~5-7% | `handle_publisher_request` (non-HTML) | Backend send, cookie handling | -**Action item**: Do a focused spike on real Fastly Compute to validate runtime behavior (no double-send panics across mixed routes, proper error behavior for partially streamed responses, and observability expectations). The API viability question is resolved. +### CPU Breakdown — HTML Processing (~76% total) -Non-streaming endpoints (static JS, discovery, auction) continue returning `Response` normally. Only the publisher proxy path (the hot path) would use streaming. 
+| % CPU | Function | Notes | +|-------|----------|-------| +| **~47%** | `lol_html::parser` state machine | HTML tokenizer/parser — character-by-character parsing | +| ~11% | `create_html_processor` | Building the lol_html rewriter with all handlers | +| ~18% | Processing callbacks | URL rewriting, attribute scanning, output sink handling | ---- +### CPU Breakdown — Other Components -## How to Use This Document +| % CPU | Function | Notes | +|-------|----------|-------| +| ~2% | `IntegrationRegistry` | Route lookup + attribute rewriting + initialization | +| ~0.8% | Memory allocation (`RawVec::reserve`) | Buffer growth during processing | +| ~0.5% | Logging (`fern` / `log_fastly`) | Minimal overhead | +| ~0.5% | Synthetic ID generation | HMAC computation | +| ~0.5% | Header extraction | `fastly::http::handle::get_header_values` | -**For any optimization work:** +### Key Takeaways -1. Run `./scripts/benchmark.sh --save baseline` on `main` -2. Make your change on a branch -3. Rebuild: `fastly compute build` -4. Run `./scripts/benchmark.sh --save branch-name` -5. Compare: `diff benchmark-results/baseline.txt benchmark-results/branch-name.txt` -6. For production: `BENCH_URL=https://your-staging.edgecompute.app ./scripts/benchmark.sh --profile` -7. If the numbers don't improve meaningfully, don't ship it +1. **The lol_html parser at ~47% cannot be directly optimized** — it's doing its job parsing a 222KB HTML page. The focus should be on reducing unnecessary work around it and enabling streaming so processed chunks reach the client sooner. +2. **`get_settings()` was ~5-8%, now ~3.3% after fix** — `build.rs` already resolves all config at compile time. Replaced `Settings::from_toml()` with direct `toml::from_str()` to eliminate redundant `config` crate pipeline. +3. **Memory allocation at ~0.8%** confirms buffer growth during processing. Fixing gzip and HTML streaming (items 1.1 + 1.2) should reduce this. +4. 
**Logging is negligible** at ~0.5%, but `log::info!("Settings {settings:?}")` still serializes the entire Settings struct on every request. --- @@ -107,29 +74,68 @@ Measured externally against staging deployment (golf.com proxy), `main` branch. | `GET /` (publisher proxy, golf.com) | ~234 ms | ~441 ms | 230 KB | Backend + processing | | `GET /.well-known/trusted-server.json` | ~191 ms | - | - | Returns 500 (needs investigation) | -**Key insight**: Static JS has ~204ms TTFB with zero backend work **from this specific benchmark vantage point**. That number includes client-to-edge RTT, DNS, TLS/connection state, and edge processing; it is **not** a universal Fastly floor. `WASM` instantiation can contribute on cold paths, but warm requests from clients near a POP can be much lower. +**Key insight**: Static JS has ~204ms TTFB with zero backend work **from this specific benchmark vantage point**. That number includes client-to-edge RTT, DNS, TLS/connection state, and edge processing — it is **not** a universal Fastly floor. For this dataset, treat static TTFB as an environment baseline and compare deltas: the publisher proxy adds only ~30ms TTFB on top. The larger optimization target is the TTFB→TTLB gap (~207ms here), which streaming can shrink by sending body chunks as they are processed instead of waiting for full buffering. --- -## Implementation Plan +## Key Finding: Streaming to Client IS Possible + +The Fastly Compute SDK provides `Response::stream_to_client()` which returns a `StreamingBody` handle that implements `std::io::Write`. Headers are sent immediately and body chunks stream as they're written. 
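
Since `StreamingBody` is just another `std::io::Write` sink, the pipeline code does not need to know whether it is writing into a heap buffer or a live client connection. A std-only sketch of that contract (illustrative `pump`/`process_chunk` names, not the Fastly SDK or this repo's API):

```rust
use std::io::{self, Read, Write};

// Stand-in for a chunk processor (lol_html adapter, URL replacer, ...).
fn process_chunk(chunk: &[u8]) -> Vec<u8> {
    chunk.to_ascii_uppercase() // trivial "rewrite" for illustration
}

// The pipeline only needs `W: Write`: a `Vec<u8>` (fully buffered) and a
// `StreamingBody` (bytes go to the client on each write) are interchangeable.
fn pump<R: Read, W: Write>(mut input: R, sink: &mut W) -> io::Result<()> {
    let mut buf = [0u8; 8192];
    loop {
        let n = input.read(&mut buf)?;
        if n == 0 {
            break;
        }
        sink.write_all(&process_chunk(&buf[..n]))?; // each write reaches the sink
    }
    sink.flush()
}

fn main() -> io::Result<()> {
    let mut out = Vec::new(); // swap in a streaming body at the edge
    pump("hello".as_bytes(), &mut out)?;
    assert_eq!(out, b"HELLO");
    Ok(())
}
```

Because the same `pump` works for both sinks, only the hot publisher-proxy path has to opt into streaming; buffered endpoints keep their current shape.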
-### Phase 0: Tooling and Baselines (DONE) +```rust +// Current: fully buffered (no bytes reach client until everything is done) +let body = response.take_body(); +let mut output = Vec::new(); +pipeline.process(body, &mut output)?; // blocks until complete +response.set_body(Body::from(output)); // only NOW does client get anything +return Ok(response); + +// Possible: streaming (headers sent immediately, body chunks as processed) +let body = response.take_body(); +let mut streaming = response.stream_to_client(); // headers sent NOW +pipeline.process(body, &mut streaming)?; // each write() → client +streaming.finish()?; +``` -**Branch**: `feat/optimize-ts` +This changes the optimization strategy — **time-to-last-byte (TTLB) and peak memory CAN be significantly reduced**. TTFB itself is still gated by the Fastly platform floor plus backend response time, but body bytes start reaching the client as soon as the first chunk is processed instead of waiting for the entire response to be buffered. -Completed: -- `scripts/benchmark.sh` — HTTP load testing with TTFB analysis, cold start detection, endpoint latency breakdown -- `scripts/profile.sh` — WASM guest profiling via `fastly compute serve --profile-guest`, outputs Firefox Profiler-compatible flame graphs -- Viceroy baseline measurements (see tables above) -- Staging external TTFB baseline +### Compatibility with `#[fastly::main]` — use undecorated `main()` (recommended) + +For streaming final responses, the Fastly SDK docs define the intended pattern: + +- `Request::from_client()` docs explicitly state it is incompatible with `#[fastly::main]` and recommend an undecorated `main()` with explicit response sending. +- `Response::send_to_client()` / `Response::stream_to_client()` include the same compatibility guidance. +- `fastly::init()` is public (doc-hidden) and can be called from raw `main()` to initialize the ABI. 
+ +Recommended shape: + +```rust +fn main() -> Result<(), fastly::Error> { + fastly::init(); + let req = fastly::Request::from_client(); + + match route_request(req)? { + Some(resp) => resp.send_to_client(), // non-streaming path + None => {} // streaming path already sent + finished + } + + Ok(()) +} +``` + +**Action item**: Do a focused spike on real Fastly Compute to validate runtime behavior (no double-send panics across mixed routes, proper error behavior for partially streamed responses, and observability expectations). + +Non-streaming endpoints (static JS, discovery, auction) continue returning `Response` normally. Only the publisher proxy path (the hot path) would use streaming. --- +## Implementation Plan + ### Phase 1: Low-Risk Code Optimizations -These are small, safe changes that reduce CPU and memory waste. Ship as one PR, measure before/after. +Small, safe changes that reduce CPU and memory waste. Ship as one PR, measure before/after. #### 1.1 Fix gzip streaming — remove full-body buffering @@ -195,39 +201,18 @@ impl StreamProcessor for HtmlRewriterAdapter { |--------|-----|------| | **High** (HTML is most common content type; eliminates 222KB+ buffer) | ~30 refactored | Medium — needs test coverage | -#### 1.3 Reduce verbose per-request logging - -**Files**: `crates/fastly/src/main.rs:37,64-67,152-177` - -**Problem**: `log::info!("Settings {settings:?}")` serializes the entire Settings struct (~2KB) on every request. `FASTLY_SERVICE_VERSION` env var logged at info level. The logger is configured with `max_level(LevelFilter::Debug)`, meaning every `debug!` and above is evaluated. - -**Fix**: Downgrade the Settings dump to `log::debug!` and tighten the logger's `max_level` to `LevelFilter::Info` for production. The `log_fastly` crate supports `filter_module()` for per-module levels if we still want debug output from specific modules. 
When the level is filtered, `log` macros short-circuit before evaluating arguments — so the `Settings` `Debug` format is never even computed. - -```rust -// Before: everything at Debug and above is serialized -.max_level(log::LevelFilter::Debug) - -// After: Info in production, debug only for specific modules if needed -.max_level(log::LevelFilter::Info) -// Optional: .filter_module("trusted_server", log::LevelFilter::Debug) -``` - -| Impact | LOC | Risk | -|--------|-----|------| -| Medium-High | ~3 | None | - -#### 1.4 Eliminate redundant `config` crate parsing in `get_settings()` — **22% CPU** +#### 1.3 ~~Eliminate redundant `config` crate parsing in `get_settings()` — ~5-8% CPU~~ DONE (~3.3% post-fix) **Files**: `crates/common/src/settings_data.rs`, `crates/common/src/settings.rs` -**Problem**: Flame graph profiling shows `get_settings()` consuming ~22% of per-request CPU. The `build.rs` already merges `trusted-server.toml` + all `TRUSTED_SERVER__*` env vars at compile time and writes a fully-resolved TOML file to `target/trusted-server-out.toml`. But at runtime, `get_settings()` calls `Settings::from_toml()`, which re-runs the entire `config` crate pipeline — `Config::builder().add_source(File).add_source(Environment).build().try_deserialize()` — redundantly scanning env vars and merging sources that were already resolved at build time. +**Problem**: Profiling shows `get_settings()` consuming ~5-8% of per-request CPU. The `build.rs` already merges `trusted-server.toml` + all `TRUSTED_SERVER__*` env vars at compile time and writes a fully-resolved TOML file to `target/trusted-server-out.toml`. But at runtime, `get_settings()` calls `Settings::from_toml()`, which re-runs the entire `config` crate pipeline — `Config::builder().add_source(File).add_source(Environment).build().try_deserialize()` — redundantly scanning env vars and merging sources that were already resolved at build time. 
**Root cause**: `settings_data.rs` embeds the build-time-resolved TOML via `include_bytes!`, then hands it to `from_toml()` which treats it as a raw config source and re-layers env vars on top. **Fix**: Replace `Settings::from_toml()` with direct `toml::from_str()` in `get_settings()`. The embedded TOML is already fully resolved — no `config` crate needed at runtime. ```rust -// Before (22% CPU — re-runs config crate pipeline + env var scan) +// Before (~5-8% CPU — re-runs config crate pipeline + env var scan) let settings = Settings::from_toml(toml_str)?; // After (near-instant — just TOML deserialization) @@ -253,7 +238,29 @@ let settings: Settings = postcard::from_bytes(SETTINGS_DATA) | Impact | LOC | Risk | |--------|-----|------| -| **Very High** (~22% CPU eliminated) | 1-3 | Low — `build.rs` already resolves everything | +| **Medium** (~5-8% → ~3.3% CPU, verified) | 1-3 | Low — `build.rs` already resolves everything | + +**Status**: Done. Replaced `Settings::from_toml()` with `toml::from_str()` + explicit `normalize()` + `validate()`. Profiling confirmed: **~5-8% → ~3.3% CPU per request**. + +#### 1.4 Reduce verbose per-request logging — ~0.5% CPU + +**Files**: `crates/fastly/src/main.rs:37,64-67,152-177` + +**Problem**: `log::info!("Settings {settings:?}")` serializes the entire Settings struct (~2KB) on every request. `FASTLY_SERVICE_VERSION` env var logged at info level. The logger is configured with `max_level(LevelFilter::Debug)`, meaning every `debug!` and above is evaluated. + +**Fix**: Downgrade the Settings dump to `log::debug!` and tighten the logger's `max_level` to `LevelFilter::Info` for production. When the level is filtered, `log` macros short-circuit before evaluating arguments — so the `Settings` `Debug` format is never even computed. 
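
The short-circuit can be demonstrated without the `log` crate at all — a std-only sketch where a hypothetical `log_if` helper plays the role of the level check inside the logging macros (names are illustrative, not the `log`/`log_fastly` API):

```rust
use std::fmt;
use std::sync::atomic::{AtomicUsize, Ordering};

static FMT_CALLS: AtomicUsize = AtomicUsize::new(0);

struct Settings; // stand-in for the real ~2KB Settings struct

impl fmt::Debug for Settings {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        FMT_CALLS.fetch_add(1, Ordering::Relaxed); // count "expensive" formatting
        write!(f, "Settings {{ .. }}")
    }
}

#[derive(PartialEq, PartialOrd)]
enum Level {
    Info,
    Debug,
}

// Hypothetical stand-in for what a leveled log macro expands to: the
// message closure only runs when the level passes the filter.
fn log_if(max_level: Level, msg_level: Level, msg: impl FnOnce() -> String) {
    if msg_level <= max_level {
        println!("{}", msg());
    }
}

fn main() {
    let settings = Settings;
    // Max level Info, message at Debug → filtered: Debug format never runs.
    log_if(Level::Info, Level::Debug, || format!("Settings {settings:?}"));
    assert_eq!(FMT_CALLS.load(Ordering::Relaxed), 0);
    // Max level Debug → the message (and the formatting cost) is evaluated.
    log_if(Level::Debug, Level::Debug, || format!("Settings {settings:?}"));
    assert_eq!(FMT_CALLS.load(Ordering::Relaxed), 1);
}
```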
+ +```rust +// Before: everything at Debug and above is serialized +.max_level(log::LevelFilter::Debug) + +// After: Info in production, debug only for specific modules if needed +.max_level(log::LevelFilter::Info) +``` + +| Impact | LOC | Risk | +|--------|-----|------| +| Low (~0.5% CPU) | ~3 | None | #### 1.5 Trivial fixes batch @@ -271,7 +278,7 @@ let settings: Settings = postcard::from_bytes(SETTINGS_DATA) ### Phase 2: Streaming Response Architecture -This is the high-impact architectural change. Uses Fastly's `stream_to_client()` API to send response headers and body chunks to the client as they're processed, instead of buffering everything. +The high-impact architectural change. Uses Fastly's `stream_to_client()` API to send response headers and body chunks to the client as they're processed, instead of buffering everything. #### 2.1 Publisher proxy: `stream_to_client()` integration @@ -344,7 +351,7 @@ The idea: use `req.send_async()` to launch the origin fetch concurrently with au This would overlap origin fetch time with auction execution, so the browser starts receiving `` content (CSS, fonts) while the auction is still running. -**Note**: This requires significant refactoring of the auction orchestrator and HTML processor to support async injection. The pseudo-code in the teammate's proposal (`origin_pending.poll()`, `run_auction_async`) represents the desired architecture but these APIs don't exist yet and would need to be built. +**Note**: This requires significant refactoring of the auction orchestrator and HTML processor to support async injection. 
| Impact | LOC | Risk | |--------|-----|------| @@ -373,16 +380,15 @@ After implementing Phases 1-2: ## Optimization Summary Table -| # | Optimization | Impact | LOC | Risk | Phase | -|---|---|---|---|---|---| -| **P0** | Tooling and baselines | Prerequisite | Done | None | 0 | -| **1.1** | Gzip streaming fix | **High** (memory) | -15/+3 | Low | 1 | -| **1.2** | HTML rewriter streaming | **High** (memory) | ~30 | Medium | 1 | -| **1.3** | Remove verbose logging | Medium-High | ~3 | None | 1 | -| **1.4** | Eliminate redundant `config` crate in `get_settings()` | **Very High** (~22% CPU) | 1-3 | Low | 1 | -| **1.5** | Trivial fixes batch | Low-Medium | ~50 | None | 1 | -| **2.1** | `stream_to_client()` integration | **High** (TTLB) | ~80-120 | Medium | 2 | -| **2.2** | Concurrent origin + auction | **Very High** | ~150-200 | High | 2 (future) | +| # | Optimization | Measured CPU | Impact | LOC | Risk | Phase | +|---|---|---|---|---|---|---| +| **1.1** | Gzip streaming fix | Part of ~76% HTML pipeline | **High** (memory) | -15/+3 | Low | 1 | +| **1.2** | HTML rewriter streaming | Part of ~76% HTML pipeline | **High** (memory) | ~30 | Medium | 1 | +| **1.3** | ~~Eliminate redundant `config` crate~~ | ~~5-8%~~ → **3.3%** | **Done** | 1-3 | Low | 1 | +| **1.4** | Reduce verbose logging | ~0.5% | Low | ~3 | None | 1 | +| **1.5** | Trivial fixes batch | <1% combined | Low | ~50 | None | 1 | +| **2.1** | `stream_to_client()` integration | N/A (architectural) | **High** (TTLB) | ~80-120 | Medium | 2 | +| **2.2** | Concurrent origin + auction | N/A (architectural) | **Very High** | ~150-200 | High | 2 (future) | --- @@ -423,8 +429,8 @@ Client → Fastly Edge → [WASM starts] → StreamingBody.finish() done ``` -**Memory**: ~8KB chunk buffer + lol_html internal state (significantly less than 4x response size — exact savings need measurement) -**TTLB**: client receives first body bytes after first processed chunk, instead of waiting for all processing to complete. 
For a 222KB page, the savings is the entire processing time (decompression + rewriting + recompression). +**Memory**: ~8KB chunk buffer + lol_html internal state (significantly less than 4x response size) +**TTLB**: client receives first body bytes after first processed chunk, instead of waiting for all processing to complete --- @@ -450,7 +456,7 @@ brew install hey # HTTP load testing tool (auto-installed by benchmark.sh) ### WASM Guest Profiling (Flame Graphs) -`fastly compute serve --profile-guest` samples the WASM call stack every 50us and writes a Firefox Profiler-compatible JSON on exit. This shows exactly which Rust functions consume CPU time — compression, HTML rewriting, string operations, init, etc. +`fastly compute serve --profile-guest` samples the WASM call stack every 50μs and writes a Firefox Profiler-compatible JSON on exit. This shows exactly which Rust functions consume CPU time — compression, HTML rewriting, string operations, init, etc. ```bash ./scripts/profile.sh # Profile GET / (publisher proxy) @@ -486,15 +492,21 @@ The script builds, starts the profiling server, fires requests, stops the server --- -## Notes for Team +## How to Use This Document -### What's already on `feat/optimize-ts` branch (uncommitted) +**For any optimization work:** -| File | Change | -|------|--------| -| `scripts/benchmark.sh` | HTTP load testing, TTFB analysis, cold start detection, auto-install `hey` | -| `scripts/profile.sh` | WASM guest profiling via `--profile-guest`, flame graph workflow | -| `OPTIMIZATION.md` | This document | +1. Run `./scripts/benchmark.sh --save baseline` on `main` +2. Make your change on a branch +3. Rebuild: `fastly compute build` +4. Run `./scripts/benchmark.sh --save branch-name` +5. Compare: `diff benchmark-results/baseline.txt benchmark-results/branch-name.txt` +6. Run `./scripts/profile.sh` for flame graph comparison +7. 
If the numbers don't improve meaningfully, don't ship it + +--- + +## Notes for Team ### Teammate's `streaming_processor.rs` Changes diff --git a/crates/common/Cargo.toml b/crates/common/Cargo.toml index 17a0e04b..8554d654 100644 --- a/crates/common/Cargo.toml +++ b/crates/common/Cargo.toml @@ -42,6 +42,7 @@ serde_json = { workspace = true } sha2 = { workspace = true } tokio = { workspace = true } trusted-server-js = { path = "../js" } +toml = { workspace = true } url = { workspace = true } urlencoding = { workspace = true } uuid = { workspace = true } diff --git a/crates/common/src/settings.rs b/crates/common/src/settings.rs index 5963b602..69d7df91 100644 --- a/crates/common/src/settings.rs +++ b/crates/common/src/settings.rs @@ -56,7 +56,7 @@ impl Publisher { .unwrap_or_else(|| self.origin_url.clone()) } - fn normalize(&mut self) { + pub(crate) fn normalize(&mut self) { let trimmed = self.origin_url.trim_end_matches('/'); if trimmed != self.origin_url { log::warn!( diff --git a/crates/common/src/settings_data.rs b/crates/common/src/settings_data.rs index 01967add..167208ab 100644 --- a/crates/common/src/settings_data.rs +++ b/crates/common/src/settings_data.rs @@ -10,8 +10,15 @@ pub use crate::auction_config_types::AuctionConfig; const SETTINGS_DATA: &[u8] = include_bytes!("../../../target/trusted-server-out.toml"); /// Creates a new [`Settings`] instance from the embedded configuration file. -/// Loads the configuration from the embedded `trusted-server.toml` file -/// and applies any environment variable overrides. +/// +/// Deserializes directly via `toml::from_str` instead of [`Settings::from_toml`], +/// which runs the full `config` crate pipeline (env var scanning, source merging). +/// +/// This is safe because `build.rs` already calls `Settings::from_toml()` at compile +/// time — merging `trusted-server.toml` with all `TRUSTED_SERVER__*` env vars — and +/// writes the fully-resolved result to `target/trusted-server-out.toml`. 
The embedded +/// bytes are that resolved output, so re-scanning env vars at runtime is redundant. +/// See `build.rs::merge_toml()` and the `cargo:rerun-if-env-changed` directives. /// /// # Errors /// @@ -23,7 +30,12 @@ pub fn get_settings() -> Result> { message: "embedded trusted-server.toml file".to_string(), })?; - let settings = Settings::from_toml(toml_str)?; + let mut settings: Settings = + toml::from_str(toml_str).change_context(TrustedServerError::Configuration { + message: "Failed to deserialize embedded config".to_string(), + })?; + + settings.publisher.normalize(); // Validate the settings settings From e49f9f7a4621c2728c88ff954d24b685d0279776 Mon Sep 17 00:00:00 2001 From: prk-Jr Date: Thu, 19 Feb 2026 20:01:48 +0530 Subject: [PATCH 06/13] Removed blank line --- crates/common/src/publisher.rs | 1 - 1 file changed, 1 deletion(-) diff --git a/crates/common/src/publisher.rs b/crates/common/src/publisher.rs index 0794f066..fb160f3d 100644 --- a/crates/common/src/publisher.rs +++ b/crates/common/src/publisher.rs @@ -9,7 +9,6 @@ use crate::constants::{COOKIE_SYNTHETIC_ID, HEADER_X_COMPRESS_HINT, HEADER_X_SYN use crate::cookies::create_synthetic_cookie; use crate::error::TrustedServerError; use crate::integrations::IntegrationRegistry; - use crate::rsc_flight::RscFlightUrlRewriter; use crate::settings::Settings; use crate::streaming_processor::{Compression, PipelineConfig, StreamProcessor, StreamingPipeline}; From a7b5a307a11d2adcb77eaea402ba3a269d28d160 Mon Sep 17 00:00:00 2001 From: prk-Jr Date: Thu, 19 Feb 2026 23:16:59 +0530 Subject: [PATCH 07/13] Add optimization plan, WASM profiling, and benchmark tooling - OPTIMIZATION.md: profiling results, CPU breakdown, phased optimization plan covering streaming fixes, config crate elimination, and stream_to_client() architecture - scripts/profile.sh: WASM guest profiling via --profile-guest with Firefox Profiler-compatible output - scripts/benchmark.sh: TTFB analysis, cold start detection, endpoint latency 
breakdown, and load testing with save/compare support --- crates/common/Cargo.toml | 1 - crates/common/src/lib.rs | 1 - crates/common/src/settings.rs | 2 +- crates/common/src/settings_data.rs | 18 +++--------------- 4 files changed, 4 insertions(+), 18 deletions(-) diff --git a/crates/common/Cargo.toml b/crates/common/Cargo.toml index 8554d654..17a0e04b 100644 --- a/crates/common/Cargo.toml +++ b/crates/common/Cargo.toml @@ -42,7 +42,6 @@ serde_json = { workspace = true } sha2 = { workspace = true } tokio = { workspace = true } trusted-server-js = { path = "../js" } -toml = { workspace = true } url = { workspace = true } urlencoding = { workspace = true } uuid = { workspace = true } diff --git a/crates/common/src/lib.rs b/crates/common/src/lib.rs index fd6fe5e1..a01865f6 100644 --- a/crates/common/src/lib.rs +++ b/crates/common/src/lib.rs @@ -51,7 +51,6 @@ pub mod openrtb; pub mod proxy; pub mod publisher; pub mod request_signing; - pub mod rsc_flight; pub mod settings; pub mod settings_data; diff --git a/crates/common/src/settings.rs b/crates/common/src/settings.rs index 69d7df91..5963b602 100644 --- a/crates/common/src/settings.rs +++ b/crates/common/src/settings.rs @@ -56,7 +56,7 @@ impl Publisher { .unwrap_or_else(|| self.origin_url.clone()) } - pub(crate) fn normalize(&mut self) { + fn normalize(&mut self) { let trimmed = self.origin_url.trim_end_matches('/'); if trimmed != self.origin_url { log::warn!( diff --git a/crates/common/src/settings_data.rs b/crates/common/src/settings_data.rs index 167208ab..01967add 100644 --- a/crates/common/src/settings_data.rs +++ b/crates/common/src/settings_data.rs @@ -10,15 +10,8 @@ pub use crate::auction_config_types::AuctionConfig; const SETTINGS_DATA: &[u8] = include_bytes!("../../../target/trusted-server-out.toml"); /// Creates a new [`Settings`] instance from the embedded configuration file. 
-/// -/// Deserializes directly via `toml::from_str` instead of [`Settings::from_toml`], -/// which runs the full `config` crate pipeline (env var scanning, source merging). -/// -/// This is safe because `build.rs` already calls `Settings::from_toml()` at compile -/// time — merging `trusted-server.toml` with all `TRUSTED_SERVER__*` env vars — and -/// writes the fully-resolved result to `target/trusted-server-out.toml`. The embedded -/// bytes are that resolved output, so re-scanning env vars at runtime is redundant. -/// See `build.rs::merge_toml()` and the `cargo:rerun-if-env-changed` directives. +/// Loads the configuration from the embedded `trusted-server.toml` file +/// and applies any environment variable overrides. /// /// # Errors /// @@ -30,12 +23,7 @@ pub fn get_settings() -> Result> { message: "embedded trusted-server.toml file".to_string(), })?; - let mut settings: Settings = - toml::from_str(toml_str).change_context(TrustedServerError::Configuration { - message: "Failed to deserialize embedded config".to_string(), - })?; - - settings.publisher.normalize(); + let settings = Settings::from_toml(toml_str)?; // Validate the settings settings From 9d14d3f3a2cc0748d6768aaf748aebd2dc90906e Mon Sep 17 00:00:00 2001 From: prk-Jr Date: Fri, 20 Feb 2026 23:56:49 +0530 Subject: [PATCH 08/13] Introduce streaming response processing for publisher requests, including HTML and RSC Flight URL rewriting, to avoid full-body buffering --- crates/common/src/html_processor.rs | 31 ++- crates/common/src/publisher.rs | 201 +++++++++++++++++ crates/common/src/streaming_processor.rs | 264 ++++++++++------------- crates/fastly/src/main.rs | 95 +++++--- scripts/benchmark.sh | 11 +- scripts/profile.sh | 4 +- 6 files changed, 419 insertions(+), 187 deletions(-) diff --git a/crates/common/src/html_processor.rs b/crates/common/src/html_processor.rs index fb161e0c..1b705575 100644 --- a/crates/common/src/html_processor.rs +++ b/crates/common/src/html_processor.rs @@ -20,6 +20,10 @@ 
use crate::tsjs;
 
 struct HtmlWithPostProcessing {
     inner: HtmlRewriterAdapter,
     post_processors: Vec>,
+    /// Accumulated output from intermediate chunks. Only used when
+    /// `post_processors` is non-empty, because post-processors (e.g. RSC
+    /// placeholder substitution) need the complete document to operate on.
+    accumulated_output: Vec<u8>,
     origin_host: String,
     request_host: String,
     request_scheme: String,
@@ -29,12 +33,27 @@ struct HtmlWithPostProcessing {
 impl StreamProcessor for HtmlWithPostProcessing {
     fn process_chunk(&mut self, chunk: &[u8], is_last: bool) -> Result<Vec<u8>, io::Error> {
         let output = self.inner.process_chunk(chunk, is_last)?;
-        if !is_last || output.is_empty() || self.post_processors.is_empty() {
+
+        // No post-processors → stream through immediately (fast path).
+        if self.post_processors.is_empty() {
             return Ok(output);
         }
-        let Ok(output_str) = std::str::from_utf8(&output) else {
-            return Ok(output);
+        // Post-processors registered → must accumulate so they can operate on
+        // the complete document (e.g. RSC placeholder substitution).
+        self.accumulated_output.extend_from_slice(&output);
+        if !is_last {
+            return Ok(Vec::new());
+        }
+
+        // All chunks received — run post-processing on the complete output. 
+ let full_output = std::mem::take(&mut self.accumulated_output); + if full_output.is_empty() { + return Ok(full_output); + } + + let Ok(output_str) = std::str::from_utf8(&full_output) else { + return Ok(full_output); }; let ctx = IntegrationHtmlContext { @@ -50,10 +69,10 @@ impl StreamProcessor for HtmlWithPostProcessing { .iter() .any(|p| p.should_process(output_str, &ctx)) { - return Ok(output); + return Ok(full_output); } - let mut html = String::from_utf8(output).map_err(|e| { + let mut html = String::from_utf8(full_output).map_err(|e| { io::Error::other(format!( "HTML post-processing expected valid UTF-8 output: {e}" )) @@ -79,6 +98,7 @@ impl StreamProcessor for HtmlWithPostProcessing { fn reset(&mut self) { self.inner.reset(); + self.accumulated_output.clear(); self.document_state.clear(); } } @@ -462,6 +482,7 @@ pub fn create_html_processor(config: HtmlProcessorConfig) -> impl StreamProcesso HtmlWithPostProcessing { inner: HtmlRewriterAdapter::new(rewriter_settings), post_processors, + accumulated_output: Vec::new(), origin_host: config.origin_host, request_host: config.request_host, request_scheme: config.request_scheme, diff --git a/crates/common/src/publisher.rs b/crates/common/src/publisher.rs index fb160f3d..089e86aa 100644 --- a/crates/common/src/publisher.rs +++ b/crates/common/src/publisher.rs @@ -321,6 +321,207 @@ pub fn handle_publisher_request( Ok(response) } +pub enum RouteResult { + /// Response fully buffered — send via send_to_client() + Buffered(Response), + /// Response already streamed to client + Streamed, +} + +/// Streaming version of publisher request handling. +/// Uses `stream_to_client()` for text responses, falling back to buffered for errors. 
+pub fn handle_publisher_request_streaming(
+    settings: &Settings,
+    integration_registry: &IntegrationRegistry,
+    mut req: Request,
+) -> Result<RouteResult, Report<TrustedServerError>> {
+    log::debug!("Streaming: Proxying request to publisher_origin");
+
+    let request_info = RequestInfo::from_request(&req);
+    let request_host = &request_info.host;
+    let request_scheme = &request_info.scheme;
+
+    let synthetic_id = get_or_generate_synthetic_id(settings, &req)?;
+    let has_synthetic_cookie = req
+        .get_header(header::COOKIE)
+        .and_then(|h| h.to_str().ok())
+        .map(|cookies| {
+            cookies.split(';').any(|cookie| {
+                cookie
+                    .trim_start()
+                    .starts_with(&format!("{}=", COOKIE_SYNTHETIC_ID))
+            })
+        })
+        .unwrap_or(false);
+
+    let backend_name = BackendConfig::from_url(
+        &settings.publisher.origin_url,
+        settings.proxy.certificate_check,
+    )?;
+    let origin_host = settings.publisher.origin_host();
+
+    req.set_header("host", &origin_host);
+
+    let mut response = req
+        .send(&backend_name)
+        .change_context(TrustedServerError::Proxy {
+            message: "Failed to proxy request to origin".to_string(),
+        })?;
+
+    let content_type = response
+        .get_header(header::CONTENT_TYPE)
+        .map(|h| h.to_str().unwrap_or_default())
+        .unwrap_or_default()
+        .to_string();
+
+    let should_process = content_type.contains("text/")
+        || content_type.contains("application/javascript")
+        || content_type.contains("application/json");
+
+    // Gate: only stream successful (2xx), processable text responses with a
+    // known request host. Everything else falls back to the buffered return
+    // below and is sent via `send_to_client()` in main.rs — streaming an
+    // unprocessed body through `stream_to_client()` would only mean pumping
+    // bytes ourselves for no benefit. This matches the legacy path, where
+    // `process_response_streaming` is also skipped when `!should_process`.
+    let will_stream =
+        response.get_status().is_success() && should_process && !request_host.is_empty();
+
+    if !will_stream {
+        log::debug!(
+            "Falling back to buffered for response - status: {}, should_process: {}, request_host: '{}'",
+            response.get_status(),
+            should_process,
+            request_host
+        );
+        response.set_header(HEADER_X_SYNTHETIC_ID, synthetic_id.as_str());
+        if !has_synthetic_cookie {
+            response.set_header(
+                header::SET_COOKIE,
+                create_synthetic_cookie(settings, synthetic_id.as_str()),
+            );
+        }
+        return Ok(RouteResult::Buffered(response));
+    }
+
+    let content_encoding = response
+        .get_header(header::CONTENT_ENCODING)
+        .map(|h| h.to_str().unwrap_or_default())
+        .unwrap_or_default()
+        .to_lowercase();
+
+    log::debug!(
+        "Streaming response - Content-Type: {}, Content-Encoding: {}, Request Host: {}, Origin Host: {}",
+        content_type, content_encoding, request_host, origin_host
+    );
+
+    let body = response.take_body();
+    let compression = Compression::from_content_encoding(&content_encoding);
+
+    response.set_header(HEADER_X_SYNTHETIC_ID, synthetic_id.as_str());
+    if !has_synthetic_cookie {
+        response.set_header(
+            header::SET_COOKIE,
+            create_synthetic_cookie(settings, synthetic_id.as_str()),
+        );
+    }
+
+    // Add global settings headers before streaming since we commit headers
+    for (key, value) in &settings.response_headers {
+        response.set_header(key, value);
+    }
+
+    // Remove content-length since we stream and modify size
+    response.remove_header(header::CONTENT_LENGTH);
+
+    // Commit to streaming — headers (including our additions) sent NOW
+    let streaming_body = response.stream_to_client();
+    let mut buffered_streaming_body = std::io::BufWriter::with_capacity(8192, streaming_body);
+
+    let params = ProcessResponseParams {
+        content_encoding: 
&content_encoding, + origin_host: &origin_host, + origin_url: &settings.publisher.origin_url, + request_host, + request_scheme, + settings, + content_type: &content_type, + integration_registry, + }; + + let is_html = params.content_type.contains("text/html"); + let is_rsc_flight = params.content_type.contains("text/x-component"); + + let config = PipelineConfig { + input_compression: compression, + output_compression: compression, + chunk_size: 8192, + }; + + let process_result = if is_html { + match create_html_stream_processor( + params.origin_host, + params.request_host, + params.request_scheme, + params.settings, + params.integration_registry, + ) { + Ok(processor) => { + let mut pipeline = StreamingPipeline::new(config, processor); + pipeline.process(body, &mut buffered_streaming_body) + } + Err(e) => { + log::error!("Failed to create html stream processor: {:?}", e); + // We've already sent headers, we can't change the status. Just return. + return Ok(RouteResult::Streamed); + } + } + } else if is_rsc_flight { + let processor = RscFlightUrlRewriter::new( + params.origin_host, + params.origin_url, + params.request_host, + params.request_scheme, + ); + let mut pipeline = StreamingPipeline::new(config, processor); + pipeline.process(body, &mut buffered_streaming_body) + } else { + let replacer = create_url_replacer( + params.origin_host, + params.origin_url, + params.request_host, + params.request_scheme, + ); + let mut pipeline = StreamingPipeline::new(config, replacer); + pipeline.process(body, &mut buffered_streaming_body) + }; + + match process_result { + Ok(()) => match buffered_streaming_body.into_inner() { + Ok(streaming_body) => { + if let Err(e) = streaming_body.finish() { + log::error!("Failed to finish streaming_body: {:?}", e); + } else { + log::debug!("Completed streaming processing of response body"); + } + } + Err(e) => { + log::error!("Failed to flush buffered streaming body: {:?}", e.error()); + } + }, + Err(e) => { + log::error!("Streaming 
failed mid-flight: {:?}", e); + } + } + + Ok(RouteResult::Streamed) +} + #[cfg(test)] mod tests { use super::*; diff --git a/crates/common/src/streaming_processor.rs b/crates/common/src/streaming_processor.rs index cda62e6f..4cbf207d 100644 --- a/crates/common/src/streaming_processor.rs +++ b/crates/common/src/streaming_processor.rs @@ -7,7 +7,9 @@ //! - UTF-8 boundary handling use error_stack::{Report, ResultExt}; +use std::cell::RefCell; use std::io::{self, Read, Write}; +use std::rc::Rc; use crate::error::TrustedServerError; @@ -179,7 +181,7 @@ impl StreamingPipeline

{ Ok(()) } - /// Process gzip compressed stream + /// Process gzip compressed stream (streaming — no full-body buffering) fn process_gzip_to_gzip( &mut self, input: R, @@ -189,38 +191,13 @@ impl StreamingPipeline

{ use flate2::write::GzEncoder; use flate2::Compression; - // Decompress input - let mut decoder = GzDecoder::new(input); - let mut decompressed = Vec::new(); - decoder - .read_to_end(&mut decompressed) - .change_context(TrustedServerError::Proxy { - message: "Failed to decompress gzip".to_string(), - })?; - - log::info!("Decompressed size: {} bytes", decompressed.len()); - - // Process the decompressed content - let processed = self - .processor - .process_chunk(&decompressed, true) - .change_context(TrustedServerError::Proxy { - message: "Failed to process content".to_string(), - })?; - - log::info!("Processed size: {} bytes", processed.len()); + let decoder = GzDecoder::new(input); + let encoder = GzEncoder::new(output, Compression::default()); - // Recompress the output - let mut encoder = GzEncoder::new(output, Compression::default()); - encoder - .write_all(&processed) - .change_context(TrustedServerError::Proxy { - message: "Failed to write to gzip encoder".to_string(), - })?; + let encoder = self.process_through_compression(decoder, encoder)?; encoder.finish().change_context(TrustedServerError::Proxy { message: "Failed to finish gzip encoder".to_string(), })?; - Ok(()) } @@ -272,7 +249,7 @@ impl StreamingPipeline

{ self.decompress_and_process(GzDecoder::new(input), output, "gzip") } - /// Process deflate compressed stream + /// Process deflate compressed stream (streaming) fn process_deflate_to_deflate( &mut self, input: R, @@ -285,7 +262,11 @@ impl StreamingPipeline

{ let decoder = ZlibDecoder::new(input); let encoder = ZlibEncoder::new(output, Compression::default()); - self.process_through_compression(decoder, encoder) + let encoder = self.process_through_compression(decoder, encoder)?; + encoder.finish().change_context(TrustedServerError::Proxy { + message: "Failed to finish deflate encoder".to_string(), + })?; + Ok(()) } /// Process deflate compressed input to uncompressed output (decompression only) @@ -299,7 +280,7 @@ impl StreamingPipeline

{ self.decompress_and_process(ZlibDecoder::new(input), output, "deflate") } - /// Process brotli compressed stream + /// Process brotli compressed stream (streaming) fn process_brotli_to_brotli( &mut self, input: R, @@ -317,7 +298,11 @@ impl StreamingPipeline

{ }; let encoder = CompressorWriter::with_params(output, 4096, ¶ms); - self.process_through_compression(decoder, encoder) + let encoder = self.process_through_compression(decoder, encoder)?; + // CompressorWriter finalizes the brotli stream on drop. Unlike gzip/deflate, + // brotli has no checksum trailer so drop-based finalization is safe. + drop(encoder); + Ok(()) } /// Process brotli compressed input to uncompressed output (decompression only) @@ -331,12 +316,17 @@ impl StreamingPipeline

{ self.decompress_and_process(Decompressor::new(input, 4096), output, "brotli") } - /// Generic processing through compression layers + /// Generic chunk loop through compression layers. + /// + /// Returns the encoder so the caller can finalize it properly (e.g. + /// `GzEncoder::finish()`, `ZlibEncoder::finish()`). This avoids the + /// silent error swallowing that `drop(encoder)` causes — gzip/deflate + /// trailers contain checksums whose write failures must be propagated. fn process_through_compression( &mut self, mut decoder: R, mut encoder: W, - ) -> Result<(), Report<TrustedServerError>> { + ) -> Result<W, Report<TrustedServerError>> { let mut buffer = vec![0u8; self.config.chunk_size]; loop { @@ -380,94 +370,86 @@ impl StreamingPipeline

{ } } - // Flush encoder (this also finishes compression) encoder.flush().change_context(TrustedServerError::Proxy { message: "Failed to flush encoder".to_string(), })?; - // For GzEncoder and similar, we need to finish() to properly close the stream - // The flush above might not be enough - drop(encoder); + Ok(encoder) + } +} - Ok(()) +/// Output sink that writes lol_html output chunks into a shared `Rc<RefCell<Vec<u8>>>` buffer. +struct RcVecSink(Rc<RefCell<Vec<u8>>>); + +impl lol_html::OutputSink for RcVecSink { + fn handle_chunk(&mut self, chunk: &[u8]) { + self.0.borrow_mut().extend_from_slice(chunk); } } -/// Adapter to use `lol_html` `HtmlRewriter` as a `StreamProcessor` -/// Important: Due to `lol_html`'s ownership model, we must accumulate input -/// and process it all at once when the stream ends. This is a limitation -/// of the `lol_html` library's API design. +/// Adapter to use `lol_html` `HtmlRewriter` as a `StreamProcessor`. +/// +/// Uses lol_html's incremental streaming API: each incoming chunk is written to +/// the rewriter immediately, and whatever output lol_html has ready is drained +/// and returned. This avoids buffering the full document before processing begins. pub struct HtmlRewriterAdapter { - settings: lol_html::Settings<'static, 'static>, - accumulated_input: Vec<u8>, + rewriter: Option<lol_html::HtmlRewriter<'static, RcVecSink>>, + output: Rc<RefCell<Vec<u8>>>, } impl HtmlRewriterAdapter { - /// Create a new HTML rewriter adapter + /// Create a new HTML rewriter adapter. 
#[must_use] pub fn new(settings: lol_html::Settings<'static, 'static>) -> Self { + // Pre-allocate to avoid reallocation churn since lol_html writes incrementally + let output = Rc::new(RefCell::new(Vec::with_capacity(8192))); + let rewriter = lol_html::HtmlRewriter::new(settings, RcVecSink(Rc::clone(&output))); Self { - settings, - accumulated_input: Vec::new(), + rewriter: Some(rewriter), + output, } } } impl StreamProcessor for HtmlRewriterAdapter { fn process_chunk(&mut self, chunk: &[u8], is_last: bool) -> Result<Vec<u8>, io::Error> { - // Accumulate input chunks - self.accumulated_input.extend_from_slice(chunk); - - if !chunk.is_empty() { - log::debug!( - "Buffering chunk: {} bytes, total buffered: {} bytes", - chunk.len(), - self.accumulated_input.len() - ); + if let Some(rewriter) = &mut self.rewriter { + if !chunk.is_empty() { + rewriter.write(chunk).map_err(|e| { + log::error!("Failed to write HTML chunk: {}", e); + io::Error::other(format!("HTML processing failed: {}", e)) + })?; + } } - // Only process when we have all the input if is_last { - log::info!( - "Processing complete document: {} bytes", - self.accumulated_input.len() - ); - - // Process all accumulated input at once - let mut output = Vec::new(); - - // Create rewriter with output sink - let mut rewriter = lol_html::HtmlRewriter::new( - std::mem::take(&mut self.settings), - |chunk: &[u8]| { - output.extend_from_slice(chunk); - }, - ); - - // Process the entire document - rewriter.write(&self.accumulated_input).map_err(|e| { - log::error!("Failed to process HTML: {}", e); - io::Error::other(format!("HTML processing failed: {}", e)) - })?; - - // Finalize the rewriter - rewriter.end().map_err(|e| { - log::error!("Failed to finalize: {}", e); - io::Error::other(format!("HTML finalization failed: {}", e)) - })?; - - log::debug!("Output size: {} bytes", output.len()); - self.accumulated_input.clear(); - Ok(output) - } else { - // Return empty until we have all input - // This is a limitation of 
lol_html's API - Ok(Vec::new()) + if let Some(rewriter) = self.rewriter.take() { + rewriter.end().map_err(|e| { + log::error!("Failed to finalize HTML rewriter: {}", e); + io::Error::other(format!("HTML finalization failed: {}", e)) + })?; + } } + + // Drain whatever lol_html produced for this chunk and return it. + // Pre-allocate the next buffer to prevent lol_html from triggering allocations on its many small writes. + let result = std::mem::replace( + &mut *self.output.borrow_mut(), + Vec::with_capacity(std::cmp::max(chunk.len() + 1024, 8192)), + ); + log::debug!( + "HtmlRewriterAdapter::process_chunk: input={} bytes, output={} bytes, is_last={}", + chunk.len(), + result.len(), + is_last + ); + Ok(result) } fn reset(&mut self) { - self.accumulated_input.clear(); + // The rewriter is consumed after end(); a new HtmlRewriterAdapter should + // be created per document. Clear any remaining output buffer. + self.output.borrow_mut().clear(); } } @@ -534,7 +516,7 @@ mod tests { } #[test] - fn test_html_rewriter_adapter_accumulates_until_last() { + fn test_html_rewriter_adapter_streams_incrementally() { use lol_html::{element, Settings}; // Create a simple HTML rewriter that replaces text @@ -548,30 +530,32 @@ mod tests { let mut adapter = HtmlRewriterAdapter::new(settings); - // Test that intermediate chunks return empty + // Collect all output across chunks; the rewriter may emit partial output at any point. + let mut full_output = Vec::new(); + let chunk1 = b"<html>"; - let result1 = adapter - .process_chunk(chunk1, false) - .expect("should process chunk1"); - assert_eq!(result1.len(), 0, "Should return empty for non-last chunk"); + full_output.extend( + adapter + .process_chunk(chunk1, false) + .expect("should process chunk1"), + ); let chunk2 = b"<body>original</body>"; - let result2 = adapter - .process_chunk(chunk2, false) - .expect("should process chunk2"); - assert_eq!(result2.len(), 0, "Should return empty for non-last chunk"); + full_output.extend( + adapter + .process_chunk(chunk2, false) + .expect("should process chunk2"), + ); - // Test that last chunk processes everything let chunk3 = b"</html>"; - let result3 = adapter - .process_chunk(chunk3, true) - .expect("should process final chunk"); - assert!( - !result3.is_empty(), - "Should return processed content for last chunk" + full_output.extend( + adapter + .process_chunk(chunk3, true) + .expect("should process final chunk"), ); - let output = String::from_utf8(result3).expect("output should be valid UTF-8"); + assert!(!full_output.is_empty(), "Should have produced output"); + let output = String::from_utf8(full_output).expect("output should be valid UTF-8"); assert!(output.contains("replaced"), "Should have replaced content"); assert!(output.contains("</html>"), "Should have complete HTML"); } @@ -590,27 +574,23 @@ mod tests { } large_html.push_str("</body></html>"); - // Process in chunks + // Process in chunks, collecting all output. 
let chunk_size = 1024; let bytes = large_html.as_bytes(); - let mut chunks = bytes.chunks(chunk_size); - let mut last_chunk = chunks.next().unwrap_or(&[]); + let chunks: Vec<_> = bytes.chunks(chunk_size).collect(); + let last_idx = chunks.len().saturating_sub(1); - for chunk in chunks { + let mut full_output = Vec::new(); + for (i, chunk) in chunks.iter().enumerate() { + let is_last = i == last_idx; let result = adapter - .process_chunk(last_chunk, false) - .expect("should process intermediate chunk"); - assert_eq!(result.len(), 0, "Intermediate chunks should return empty"); - last_chunk = chunk; + .process_chunk(chunk, is_last) + .expect("should process chunk"); + full_output.extend(result); } - // Process last chunk - let result = adapter - .process_chunk(last_chunk, true) - .expect("should process last chunk"); - assert!(!result.is_empty(), "Last chunk should return content"); - - let output = String::from_utf8(result).expect("output should be valid UTF-8"); + assert!(!full_output.is_empty(), "Should have produced output"); + let output = String::from_utf8(full_output).expect("output should be valid UTF-8"); assert!( output.contains("Paragraph 999"), "Should contain all content" @@ -618,32 +598,22 @@ } #[test] - fn test_html_rewriter_adapter_reset() { + fn test_html_rewriter_adapter_reset_clears_output_buffer() { use lol_html::Settings; + // reset() is a no-op on the rewriter itself (a new adapter is needed per document), + // but it must clear any pending bytes in the output buffer. let settings = Settings::default(); let mut adapter = HtmlRewriterAdapter::new(settings); - // Process some content - adapter - .process_chunk(b"<html>", false) - .expect("should process html tag"); - adapter - .process_chunk(b"<body>test", false) - .expect("should process body"); + // Write a full document so the rewriter is finished. + let _ = adapter + .process_chunk(b"<html><body>test</body></html>", true) + .expect("should process complete document"); - // Reset should clear accumulated input + // reset() should not panic and should leave the buffer empty. adapter.reset(); - - // After reset, adapter should be ready for new input - let result = adapter - .process_chunk(b"
<html><body>new</body></html>", true) - .expect("should process new content after reset"); - let output = String::from_utf8(result).expect("output should be valid UTF-8"); - assert_eq!( - output, "
<html><body>new</body></html>
", - "Should only contain new input after reset" - ); + // No assertion on a subsequent process_chunk — the rewriter is consumed. } #[test] diff --git a/crates/fastly/src/main.rs b/crates/fastly/src/main.rs index 0112bd99..1babf2b2 100644 --- a/crates/fastly/src/main.rs +++ b/crates/fastly/src/main.rs @@ -12,7 +12,7 @@ use trusted_server_common::proxy::{ handle_first_party_click, handle_first_party_proxy, handle_first_party_proxy_rebuild, handle_first_party_proxy_sign, }; -use trusted_server_common::publisher::{handle_publisher_request, handle_tsjs_dynamic}; +use trusted_server_common::publisher::handle_tsjs_dynamic; use trusted_server_common::request_signing::{ handle_deactivate_key, handle_rotate_key, handle_trusted_server_discovery, handle_verify_signature, @@ -23,18 +23,22 @@ use trusted_server_common::settings_data::get_settings; mod error; use crate::error::to_error_response; -#[fastly::main] -fn main(req: Request) -> Result { +use trusted_server_common::publisher::RouteResult; + +fn main() { + fastly::init(); init_logger(); + let req = Request::from_client(); let settings = match get_settings() { Ok(s) => s, Err(e) => { log::error!("Failed to load settings: {:?}", e); - return Ok(to_error_response(&e)); + to_error_response(&e).send_to_client(); + return; } }; - log::info!("Settings {settings:?}"); + log::debug!("Settings {settings:?}"); // Build the auction orchestrator once at startup let orchestrator = build_orchestrator(&settings); @@ -43,16 +47,26 @@ fn main(req: Request) -> Result { Ok(r) => r, Err(e) => { log::error!("Failed to create integration registry: {:?}", e); - return Ok(to_error_response(&e)); + to_error_response(&e).send_to_client(); + return; } }; - futures::executor::block_on(route_request( + match futures::executor::block_on(route_request( &settings, &orchestrator, &integration_registry, req, - )) + )) { + Ok(RouteResult::Buffered(resp)) => resp.send_to_client(), + Ok(RouteResult::Streamed) => { /* already streamed */ } + Err(e) => { + 
log::error!("Request routing failed: {:?}", e); + Response::from_status(fastly::http::StatusCode::INTERNAL_SERVER_ERROR) + .with_body(format!("Internal Server Error: {}", e)) + .send_to_client(); + } + } } async fn route_request( @@ -60,20 +74,59 @@ async fn route_request( orchestrator: &AuctionOrchestrator, integration_registry: &IntegrationRegistry, req: Request, -) -> Result { - log::info!( +) -> Result { + log::debug!( "FASTLY_SERVICE_VERSION: {}", ::std::env::var("FASTLY_SERVICE_VERSION").unwrap_or_else(|_| String::new()) ); - if let Some(response) = enforce_basic_auth(settings, &req) { - return Ok(response); + if let Some(mut response) = enforce_basic_auth(settings, &req) { + for (key, value) in &settings.response_headers { + response.set_header(key, value); + } + return Ok(RouteResult::Buffered(response)); } // Get path and method for routing let path = req.get_path().to_string(); let method = req.get_method().clone(); + // Check if it's the publisher proxy fallback + let is_publisher_proxy = match (method.clone(), path.as_str()) { + (Method::GET, p) if p.starts_with("/static/tsjs=") => false, + (Method::GET, "/.well-known/trusted-server.json") => false, + (Method::POST, "/verify-signature") => false, + (Method::POST, "/admin/keys/rotate") => false, + (Method::POST, "/admin/keys/deactivate") => false, + (Method::POST, "/auction") => false, + (Method::GET, "/first-party/proxy") => false, + (Method::GET, "/first-party/click") => false, + (Method::GET, "/first-party/sign") | (Method::POST, "/first-party/sign") => false, + (Method::POST, "/first-party/proxy-rebuild") => false, + (m, p) if integration_registry.has_route(&m, p) => false, + _ => true, + }; + + if is_publisher_proxy { + log::info!( + "No known route matched for path: {}, proxying to publisher origin", + path + ); + + use trusted_server_common::publisher::handle_publisher_request_streaming; + match handle_publisher_request_streaming(settings, integration_registry, req) { + Ok(route_result) => return 
Ok(route_result), + Err(e) => { + log::error!("Failed to proxy to publisher origin: {:?}", e); + let mut err_resp = to_error_response(&e); + for (key, value) in &settings.response_headers { + err_resp.set_header(key, value); + } + return Ok(RouteResult::Buffered(err_resp)); + } + } + } + // Match known routes and handle them let result = match (method, path.as_str()) { // Serve the tsjs library @@ -112,21 +165,7 @@ async fn route_request( })) }), - // No known route matched, proxy to publisher origin as fallback - _ => { - log::info!( - "No known route matched for path: {}, proxying to publisher origin", - path - ); - - match handle_publisher_request(settings, integration_registry, req) { - Ok(response) => Ok(response), - Err(e) => { - log::error!("Failed to proxy to publisher origin: {:?}", e); - Err(e) - } - } - } + _ => unreachable!(), }; // Convert any errors to HTTP error responses @@ -136,7 +175,7 @@ async fn route_request( response.set_header(key, value); } - Ok(response) + Ok(RouteResult::Buffered(response)) } fn init_logger() { diff --git a/scripts/benchmark.sh b/scripts/benchmark.sh index daebccb3..92807ab6 100755 --- a/scripts/benchmark.sh +++ b/scripts/benchmark.sh @@ -37,6 +37,7 @@ set -euo pipefail # --- Configuration --- BASE_URL="${BENCH_URL:-http://127.0.0.1:7676}" RESULTS_DIR="$(cd "$(dirname "$0")/.." 
&& pwd)/benchmark-results" +UA="Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36" CURL_FORMAT=' { "dns_ms": %{time_namelookup}, @@ -117,7 +118,7 @@ timed_curl() { local extra_args=("$@") local result - result=$(curl -s -o /dev/null -w "$CURL_FORMAT" \ + result=$(curl -s -A "$UA" -o /dev/null -w "$CURL_FORMAT" \ -X "$method" \ ${extra_args[@]+"${extra_args[@]}"} \ "$url" \ @@ -229,19 +230,19 @@ run_load_test() { echo -e "${BOLD}GET / (publisher proxy) - ${total_requests} requests, ${concurrency} concurrent${RESET}" echo "" - hey -n "$total_requests" -c "$concurrency" -t 30 "$BASE_URL/" 2>&1 | \ + hey -U "$UA" -n "$total_requests" -c "$concurrency" -t 30 "$BASE_URL/" 2>&1 | \ grep -E "(Requests/sec|Total:|Slowest:|Fastest:|Average:|requests done)|Status code|Latency distribution" -A 20 echo "" echo -e "${BOLD}GET /static/tsjs=tsjs-unified.min.js (static) - ${total_requests} requests, ${concurrency} concurrent${RESET}" echo "" - hey -n "$total_requests" -c "$concurrency" -t 30 "$BASE_URL/static/tsjs=tsjs-unified.min.js" 2>&1 | \ + hey -U "$UA" -n "$total_requests" -c "$concurrency" -t 30 "$BASE_URL/static/tsjs=tsjs-unified.min.js" 2>&1 | \ grep -E "(Requests/sec|Total:|Slowest:|Fastest:|Average:|requests done)|Status code|Latency distribution" -A 20 echo "" echo -e "${BOLD}POST /auction - ${total_requests} requests, ${concurrency} concurrent${RESET}" echo "" - hey -n "$total_requests" -c "$concurrency" -t 30 \ + hey -U "$UA" -n "$total_requests" -c "$concurrency" -t 30 \ -m POST \ -H "Content-Type: application/json" \ -d "$AUCTION_PAYLOAD" \ @@ -263,7 +264,7 @@ run_first_byte_analysis() { for i in $(seq 1 20); do local result - result=$(curl -s -o /dev/null -w "%{time_starttransfer} %{time_total}" \ + result=$(curl -s -A "$UA" -o /dev/null -w "%{time_starttransfer} %{time_total}" \ "$BASE_URL/" --max-time 30 2>/dev/null) local ttfb total ttfb=$(echo "$result" | awk '{printf "%.2f", $1 * 1000}') diff 
--git a/scripts/profile.sh index 66cebf0d..a868ac97 100755 --- a/scripts/profile.sh +++ b/scripts/profile.sh @@ -34,7 +34,7 @@ SERVER_PID="" # Defaults ENDPOINT="/" METHOD="GET" -REQUESTS=20 +REQUESTS=100 BODY="" SKIP_BUILD=false AUTO_OPEN=false @@ -162,7 +162,7 @@ fi log_header "START PROFILING SERVER" log_info "Starting fastly compute serve --profile-guest..." -(cd "$PROJECT_ROOT" && fastly compute serve --profile-guest 2>&1) & +(cd "$PROJECT_ROOT" && set -a && source .env && set +a && fastly compute serve --profile-guest 2>&1) & SERVER_PID=$! log_info "Server PID: $SERVER_PID" From 5b93249e80cd8e2a69ff7e49bafc55eb570d24f3 Mon Sep 17 00:00:00 2001 From: prk-Jr Date: Sat, 21 Feb 2026 00:19:20 +0530 Subject: [PATCH 09/13] Update OPTIMIZATION.md with streaming architecture progress --- OPTIMIZATION.md | 2 ++ 1 file changed, 2 insertions(+) diff --git a/OPTIMIZATION.md b/OPTIMIZATION.md index 05e23247..8ee887f5 100644 --- a/OPTIMIZATION.md +++ b/OPTIMIZATION.md @@ -376,6 +376,8 @@ After implementing Phases 1-2: - No regression on static endpoints or auction - Code complexity is justified by measured improvement +**Current Status:** The streaming architecture changes (Phases 1 and 2.1) have been implemented and pushed to the `feat/optimize-html-streaming` branch. Local testing with `curl` shows a significant TTFB improvement (~0.716s buffered → ~0.256s streaming), with functional correctness verified in Fastly Compute's local testing environment (Viceroy). 
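The buffered-vs-streaming figures above come from curl's transfer timings, which `scripts/benchmark.sh` converts from seconds to milliseconds with awk. A minimal sketch of that measurement path (the `result` sample is hypothetical, chosen to mirror the ~0.256s/~0.716s numbers; the curl line is commented out so the snippet runs offline):

```shell
# Measure TTFB/TTLB with curl, then convert seconds to milliseconds the same
# way scripts/benchmark.sh does (time_starttransfer ~ TTFB, time_total ~ TTLB).
# result=$(curl -s -o /dev/null -w "%{time_starttransfer} %{time_total}" \
#   "${BENCH_URL:-http://127.0.0.1:7676}/" --max-time 30)
result="0.256 0.716"   # hypothetical sample: streaming TTFB, buffered-era total
ttfb=$(echo "$result" | awk '{printf "%.2f", $1 * 1000}')
total=$(echo "$result" | awk '{printf "%.2f", $2 * 1000}')
echo "ttfb=${ttfb}ms total=${total}ms"
```

Running several iterations and comparing the distribution before and after the streaming change is what the `--profile` mode of the benchmark script automates.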
**External testing and load testing against the staging edge network are still pending.** + --- ## Optimization Summary Table From 63a089b78281902f3ce8f3f2a454a3c428c0e558 Mon Sep 17 00:00:00 2001 From: prk-Jr Date: Sat, 21 Feb 2026 00:44:30 +0530 Subject: [PATCH 10/13] Add clippy attribute and improve streaming request handling documentation --- crates/common/src/publisher.rs | 7 ++++++- crates/common/src/streaming_processor.rs | 6 +++--- 2 files changed, 9 insertions(+), 4 deletions(-) diff --git a/crates/common/src/publisher.rs b/crates/common/src/publisher.rs index a6b9f3a0..1714e1fc 100644 --- a/crates/common/src/publisher.rs +++ b/crates/common/src/publisher.rs @@ -327,8 +327,9 @@ pub fn handle_publisher_request( Ok(response) } +#[allow(clippy::large_enum_variant)] pub enum RouteResult { - /// Response fully buffered — send via send_to_client() + /// Response fully buffered — send via `send_to_client()` Buffered(Response), /// Response already streamed to client Streamed, @@ -336,6 +337,10 @@ } /// Streaming version of publisher request handling. /// Uses `stream_to_client()` for text responses, falling back to buffered for errors. +/// +/// # Errors +/// +/// Returns an error if synthetic ID generation fails or if the backend HTTP request to the origin fails. pub fn handle_publisher_request_streaming( settings: &Settings, integration_registry: &IntegrationRegistry, diff --git a/crates/common/src/streaming_processor.rs b/crates/common/src/streaming_processor.rs index 4cbf207d..f53fbdc5 100644 --- a/crates/common/src/streaming_processor.rs +++ b/crates/common/src/streaming_processor.rs @@ -378,7 +378,7 @@ impl StreamingPipeline

{ } } -/// Output sink that writes lol_html output chunks into a shared `Rc<RefCell<Vec<u8>>>` buffer. +/// Output sink that writes `lol_html` output chunks into a shared `Rc<RefCell<Vec<u8>>>` buffer. struct RcVecSink(Rc<RefCell<Vec<u8>>>); @@ -389,8 +389,8 @@ impl lol_html::OutputSink for RcVecSink { /// Adapter to use `lol_html` `HtmlRewriter` as a `StreamProcessor`. /// -/// Uses lol_html's incremental streaming API: each incoming chunk is written to -/// the rewriter immediately, and whatever output lol_html has ready is drained +/// Uses `lol_html`'s incremental streaming API: each incoming chunk is written to +/// the rewriter immediately, and whatever output `lol_html` has ready is drained /// and returned. This avoids buffering the full document before processing begins. pub struct HtmlRewriterAdapter { rewriter: Option<lol_html::HtmlRewriter<'static, RcVecSink>>, From 6701a999d622aa8a402a1b8f8eac7e176ad18036 Mon Sep 17 00:00:00 2001 From: prk-Jr Date: Mon, 23 Feb 2026 20:39:26 +0530 Subject: [PATCH 11/13] Inject staging identification headers for streamed responses --- crates/common/src/publisher.rs | 12 +++++++++++- 1 file changed, 11 insertions(+), 1 deletion(-) diff --git a/crates/common/src/publisher.rs b/crates/common/src/publisher.rs index 1714e1fc..a20614e1 100644 --- a/crates/common/src/publisher.rs +++ b/crates/common/src/publisher.rs @@ -5,7 +5,10 @@ use fastly::{Body, Request, Response}; use crate::backend::BackendConfig; use crate::http_util::{serve_static_with_etag, RequestInfo}; -use crate::constants::{COOKIE_SYNTHETIC_ID, HEADER_X_COMPRESS_HINT, HEADER_X_SYNTHETIC_ID}; +use crate::constants::{ + COOKIE_SYNTHETIC_ID, ENV_FASTLY_IS_STAGING, ENV_FASTLY_SERVICE_VERSION, HEADER_X_COMPRESS_HINT, + HEADER_X_SYNTHETIC_ID, HEADER_X_TS_ENV, HEADER_X_TS_VERSION, +}; use crate::cookies::create_synthetic_cookie; use crate::error::TrustedServerError; use crate::integrations::IntegrationRegistry; @@ -442,6 +445,13 @@ pub fn handle_publisher_request_streaming( ); } + if let Ok(v) = 
::std::env::var(ENV_FASTLY_SERVICE_VERSION) { + response.set_header(HEADER_X_TS_VERSION, v); + } + if ::std::env::var(ENV_FASTLY_IS_STAGING).as_deref() == Ok("1") { + response.set_header(HEADER_X_TS_ENV, "staging"); + } + // Add global settings headers before streaming since we commit headers for (key, value) in &settings.response_headers { response.set_header(key, value); From b110e3fbb3e1214d8db95522fa51de5579da38b4 Mon Sep 17 00:00:00 2001 From: prk-Jr <49094961+prk-Jr@users.noreply.github.com> Date: Wed, 25 Feb 2026 21:06:08 +0530 Subject: [PATCH 12/13] Feat/optimize html streaming rsc (#376) * Optimize Next.js RSC streaming with lazy accumulation Implement lazy buffering that delays accumulation until RSC content is detected, improving streaming from 0% to 28-37% for RSC pages while maintaining 100% URL rewriting correctness. - Add needs_accumulation() trait for conditional buffering - Add 10MB memory limit for DoS protection - Create integration test suite with real Next.js fixtures - Add example Next.js app for testing Performance: RSC pages stream 28-37% (theoretical max), non-RSC 96%. 
* Preserve publisher fallback headers, centralize route classification, and always clean up live test temp files --- .gitignore | 6 +- crates/common/src/html_processor.rs | 443 +++++++- .../nextjs/fixtures/app-router-large.html | 37 + .../nextjs/fixtures/app-router-simple.html | 34 + .../nextjs/fixtures/app-router-tchunk.html | 29 + .../nextjs/fixtures/non-rsc-page.html | 38 + .../nextjs/fixtures/real-nextjs-about.html | 1 + .../nextjs/fixtures/real-nextjs-blog.html | 1 + .../nextjs/fixtures/real-nextjs-home.html | 1 + .../integrations/nextjs/html_post_process.rs | 12 +- .../integrations/nextjs/rsc_placeholders.rs | 65 +- crates/common/src/integrations/registry.rs | 20 + crates/common/src/publisher.rs | 26 +- crates/common/tests/nextjs_integration.rs | 629 ++++++++++++ crates/fastly/src/main.rs | 137 +-- examples/nextjs-rsc-app/README.md | 93 ++ examples/nextjs-rsc-app/TESTING.md | 129 +++ examples/nextjs-rsc-app/app/about/page.tsx | 72 ++ .../nextjs-rsc-app/app/blog/[slug]/page.tsx | 72 ++ examples/nextjs-rsc-app/app/layout.tsx | 37 + examples/nextjs-rsc-app/app/page.tsx | 48 + examples/nextjs-rsc-app/next-env.d.ts | 6 + examples/nextjs-rsc-app/next.config.js | 7 + examples/nextjs-rsc-app/package-lock.json | 952 ++++++++++++++++++ examples/nextjs-rsc-app/package.json | 22 + .../scripts/capture-fixtures.sh | 103 ++ examples/nextjs-rsc-app/test-live-html.sh | 198 ++++ examples/nextjs-rsc-app/test-streaming.sh | 105 ++ examples/nextjs-rsc-app/tsconfig.json | 40 + 29 files changed, 3266 insertions(+), 97 deletions(-) create mode 100644 crates/common/src/integrations/nextjs/fixtures/app-router-large.html create mode 100644 crates/common/src/integrations/nextjs/fixtures/app-router-simple.html create mode 100644 crates/common/src/integrations/nextjs/fixtures/app-router-tchunk.html create mode 100644 crates/common/src/integrations/nextjs/fixtures/non-rsc-page.html create mode 100644 crates/common/src/integrations/nextjs/fixtures/real-nextjs-about.html create mode 100644 
crates/common/src/integrations/nextjs/fixtures/real-nextjs-blog.html create mode 100644 crates/common/src/integrations/nextjs/fixtures/real-nextjs-home.html create mode 100644 crates/common/tests/nextjs_integration.rs create mode 100644 examples/nextjs-rsc-app/README.md create mode 100644 examples/nextjs-rsc-app/TESTING.md create mode 100644 examples/nextjs-rsc-app/app/about/page.tsx create mode 100644 examples/nextjs-rsc-app/app/blog/[slug]/page.tsx create mode 100644 examples/nextjs-rsc-app/app/layout.tsx create mode 100644 examples/nextjs-rsc-app/app/page.tsx create mode 100644 examples/nextjs-rsc-app/next-env.d.ts create mode 100644 examples/nextjs-rsc-app/next.config.js create mode 100644 examples/nextjs-rsc-app/package-lock.json create mode 100644 examples/nextjs-rsc-app/package.json create mode 100755 examples/nextjs-rsc-app/scripts/capture-fixtures.sh create mode 100755 examples/nextjs-rsc-app/test-live-html.sh create mode 100755 examples/nextjs-rsc-app/test-streaming.sh create mode 100644 examples/nextjs-rsc-app/tsconfig.json diff --git a/.gitignore b/.gitignore index 1bd7e773..c1a7bd47 100644 --- a/.gitignore +++ b/.gitignore @@ -23,4 +23,8 @@ src/*.html *.pem /guest-profiles -/benchmark-results/** \ No newline at end of file +/benchmark-results/** + +# Next.js example app +examples/nextjs-rsc-app/node_modules/ +examples/nextjs-rsc-app/.next/ diff --git a/crates/common/src/html_processor.rs b/crates/common/src/html_processor.rs index ace09c7b..8829cb6d 100644 --- a/crates/common/src/html_processor.rs +++ b/crates/common/src/html_processor.rs @@ -1,6 +1,32 @@ //! Simplified HTML processor that combines URL replacement and integration injection //! -//! This module provides a `StreamProcessor` implementation for HTML content. +//! This module provides a [`StreamProcessor`] implementation for HTML content. +//! +//! ## Streaming Behavior with Post-Processing +//! +//! When post-processors are registered (e.g., Next.js RSC URL rewriting), the processor +//! 
uses **lazy accumulation** to optimize streaming: +//! +//! 1. **Initial streaming**: Chunks are streamed immediately until RSC content is detected +//! 2. **Accumulation trigger**: When RSC scripts or placeholders are found, buffering begins +//! 3. **Post-processing**: At document end, accumulated HTML is processed to rewrite RSC payloads +//! +//! ### Streaming Ratios +//! +//! Observed streaming performance: +//! - **Non-RSC pages**: 96%+ streaming (minimal buffering) +//! - **RSC pages**: 28-37% streaming (depends on where RSC scripts appear in HTML) +//! - **Before optimization**: 0% streaming (everything buffered) +//! +//! The streaming ratio for RSC pages is limited by Next.js's architecture: RSC scripts +//! appear at the end of the HTML and make up 60-72% of the document. Bytes already +//! streamed before RSC detection cannot be recovered, so the post-processor's fallback +//! re-parse path handles RSC scripts in the already-streamed prefix. +//! +//! ## Memory Safety +//! +//! Accumulated output is limited to [`MAX_ACCUMULATED_HTML_BYTES`] (10MB) to prevent +//! unbounded memory growth from malicious or extremely large documents. use std::cell::Cell; use std::io; use std::rc::Rc; @@ -8,6 +34,10 @@ use std::sync::Arc; use lol_html::{element, html_content::ContentType, text, Settings as RewriterSettings}; +/// Maximum size for accumulated HTML output when post-processing is required. +/// This prevents unbounded memory growth from malicious or extremely large documents. +const MAX_ACCUMULATED_HTML_BYTES: usize = 10 * 1024 * 1024; // 10 MB + use crate::integrations::{ AttributeRewriteOutcome, IntegrationAttributeContext, IntegrationDocumentState, IntegrationHtmlContext, IntegrationHtmlPostProcessor, IntegrationRegistry, @@ -20,16 +50,37 @@ use crate::tsjs; struct HtmlWithPostProcessing { inner: HtmlRewriterAdapter, post_processors: Vec<Arc<dyn IntegrationHtmlPostProcessor>>, - /// Accumulated output from intermediate chunks. 
Only used when - /// `post_processors` is non-empty, because post-processors (e.g. RSC - /// placeholder substitution) need the complete document to operate on. + /// Accumulated output from intermediate chunks. Only populated once we + /// detect that post-processing will be needed (e.g. an RSC placeholder was + /// inserted or a fragmented RSC script was observed). Before that trigger, + /// chunks stream through immediately. accumulated_output: Vec, + /// Number of bytes already streamed to the caller before accumulation began. + /// When accumulation triggers, we cannot recover those bytes, so we must + /// fall back to the post-processor's re-parse path for any RSC scripts in + /// the already-streamed prefix. + streamed_bytes: usize, + /// Whether we are accumulating output for post-processing. + accumulating: bool, origin_host: String, request_host: String, request_scheme: String, document_state: IntegrationDocumentState, } +impl HtmlWithPostProcessing { + /// Check whether we need to start accumulating output for post-processing. + /// + /// Processors may inspect [`IntegrationDocumentState`] to lazily trigger + /// accumulation once they detect content that requires whole-document + /// post-processing. + fn needs_accumulation(&self) -> bool { + self.post_processors + .iter() + .any(|processor| processor.needs_accumulation(&self.document_state)) + } +} + impl StreamProcessor for HtmlWithPostProcessing { fn process_chunk(&mut self, chunk: &[u8], is_last: bool) -> Result, io::Error> { let output = self.inner.process_chunk(chunk, is_last)?; @@ -39,14 +90,83 @@ impl StreamProcessor for HtmlWithPostProcessing { return Ok(output); } - // Post-processors registered → must accumulate so they can operate on - // the complete document (e.g. RSC placeholder substitution). + // If we're not yet accumulating, check if we need to start. + // This allows non-RSC pages with post-processors registered to stream + // through without buffering. 
+ if !self.accumulating && self.needs_accumulation() { + self.accumulating = true; + log::debug!( + "HTML post-processing: switching to accumulation mode, streamed_bytes={}", + self.streamed_bytes + ); + } + + if !self.accumulating { + if !is_last { + self.streamed_bytes += output.len(); + return Ok(output); + } + + // Final chunk, never accumulated — check if post-processing is needed. + // This handles the rare case where RSC scripts appear only in the final + // chunk, or where fragmented scripts need the fallback re-parse path. + let ctx = IntegrationHtmlContext { + request_host: &self.request_host, + request_scheme: &self.request_scheme, + origin_host: &self.origin_host, + document_state: &self.document_state, + }; + + let Ok(output_str) = std::str::from_utf8(&output) else { + return Ok(output); + }; + + if !self + .post_processors + .iter() + .any(|p| p.should_process(output_str, &ctx)) + { + return Ok(output); + } + + // Post-processing needed on just the final chunk. + // This is only correct if no earlier chunks contained RSC content + // (which would mean they were already streamed without rewriting). + // In practice, this handles pages where RSC scripts are small + // enough to fit in the final chunk. + let mut html = String::from_utf8(output).map_err(|e| { + io::Error::other(format!( + "HTML post-processing expected valid UTF-8 output: {e}" + )) + })?; + + for processor in &self.post_processors { + if processor.should_process(&html, &ctx) { + processor.post_process(&mut html, &ctx); + } + } + + return Ok(html.into_bytes()); + } + + // Accumulating mode: buffer output for end-of-document post-processing. + // Check size limit to prevent unbounded memory growth. 
+ if self.accumulated_output.len() + output.len() > MAX_ACCUMULATED_HTML_BYTES { + return Err(io::Error::other(format!( + "HTML post-processing: accumulated output would exceed {}MB size limit \ + (current: {} bytes, chunk: {} bytes)", + MAX_ACCUMULATED_HTML_BYTES / (1024 * 1024), + self.accumulated_output.len(), + output.len() + ))); + } + self.accumulated_output.extend_from_slice(&output); if !is_last { return Ok(Vec::new()); } - // All chunks received — run post-processing on the complete output. + // All chunks received — run post-processing on the accumulated output. let full_output = std::mem::take(&mut self.accumulated_output); if full_output.is_empty() { return Ok(full_output); @@ -87,9 +207,10 @@ impl StreamProcessor for HtmlWithPostProcessing { if changed { log::debug!( - "HTML post-processing complete: origin_host={}, output_len={}", + "HTML post-processing complete: origin_host={}, output_len={}, streamed_prefix_bytes={}", self.origin_host, - html.len() + html.len(), + self.streamed_bytes, ); } @@ -99,6 +220,8 @@ impl StreamProcessor for HtmlWithPostProcessing { fn reset(&mut self) { self.inner.reset(); self.accumulated_output.clear(); + self.streamed_bytes = 0; + self.accumulating = false; self.document_state.clear(); } } @@ -485,6 +608,8 @@ pub fn create_html_processor(config: HtmlProcessorConfig) -> impl StreamProcesso inner: HtmlRewriterAdapter::new(rewriter_settings), post_processors, accumulated_output: Vec::new(), + streamed_bytes: 0, + accumulating: false, origin_host: config.origin_host, request_host: config.request_host, request_scheme: config.request_scheme, @@ -1009,4 +1134,304 @@ mod tests { .collect::() ); } + + /// E2E test: verifies that RSC pages with Next.js post-processors produce correct output + /// when processed through the full streaming pipeline, and quantifies the streaming + /// behavior (how much output is emitted before `is_last`). 
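The accumulate-with-cap flow in `process_chunk` above — stream until a trigger fires, then buffer under a hard size cap, then post-process the buffered suffix at document end — can be reduced to a minimal standalone sketch. The types and the `trigger` flag here are hypothetical simplifications, not the crate's `StreamProcessor` API, and uppercasing stands in for the real RSC rewriting:

```rust
use std::io;

/// Stand-in for MAX_ACCUMULATED_HTML_BYTES (10 MB in the real code).
const MAX: usize = 10 * 1024 * 1024;

struct LazyAccumulator {
    accumulating: bool,
    streamed_bytes: usize,
    buffer: Vec<u8>,
}

impl LazyAccumulator {
    fn new() -> Self {
        Self { accumulating: false, streamed_bytes: 0, buffer: Vec::new() }
    }

    /// `trigger` models `needs_accumulation()`: once it returns true,
    /// subsequent output is buffered instead of streamed.
    fn push(&mut self, chunk: &[u8], trigger: bool, is_last: bool) -> io::Result<Vec<u8>> {
        if !self.accumulating && trigger {
            self.accumulating = true;
        }
        if !self.accumulating {
            // Stream-through path: bytes leave immediately and cannot be
            // recovered later, which is why the re-parse fallback exists.
            self.streamed_bytes += chunk.len();
            return Ok(chunk.to_vec());
        }
        // Buffering path: enforce the hard size cap before extending.
        if self.buffer.len() + chunk.len() > MAX {
            return Err(io::Error::new(io::ErrorKind::Other, "size limit exceeded"));
        }
        self.buffer.extend_from_slice(chunk);
        if !is_last {
            return Ok(Vec::new());
        }
        // End of document: run "post-processing" on the buffered suffix.
        let mut html = std::mem::take(&mut self.buffer);
        html.make_ascii_uppercase(); // stand-in for real RSC payload rewriting
        Ok(html)
    }
}
```

Note that only the suffix observed after the trigger is post-processed; bytes streamed before it are gone, matching the `streamed_bytes` bookkeeping in the real implementation.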
+ #[test] + fn rsc_html_streams_correctly_with_post_processors() { + use crate::streaming_processor::StreamProcessor; + + // Simulate a Next.js App Router page with multiple RSC scripts, including + // a cross-script T-chunk (header in script 1, content continues in script 2). + let html = concat!( + "Next.js RSC Page", + "", + "", + "

Hello World
", + // RSC script 1: contains a T-chunk header that spans into script 2 + r#""#, + // RSC script 2: continuation of the T-chunk from script 1 + r#""#, + // Non-RSC script that must be preserved + r#""#, + "About", + "", + ); + + let mut settings = create_test_settings(); + settings + .integrations + .insert_config( + "nextjs", + &json!({ + "enabled": true, + "rewrite_attributes": ["href", "link", "url"], + }), + ) + .expect("should update nextjs config"); + let registry = + IntegrationRegistry::new(&settings).expect("should create integration registry"); + + // Verify post-processors ARE registered (this is the key precondition) + let post_processors = registry.html_post_processors(); + assert!( + !post_processors.is_empty(), + "Next.js post-processors should be registered when enabled" + ); + + let config = HtmlProcessorConfig::from_settings( + &settings, + ®istry, + "origin.example.com", + "test.example.com", + "https", + ); + let mut processor = create_html_processor(config); + + // Process in chunks to simulate streaming, tracking per-chunk output + let bytes = html.as_bytes(); + let chunk_size = 64; + let chunks: Vec<&[u8]> = bytes.chunks(chunk_size).collect(); + let last_idx = chunks.len().saturating_sub(1); + + let mut intermediate_bytes = 0usize; + let mut final_bytes = 0usize; + let mut full_output = Vec::new(); + + for (i, chunk) in chunks.iter().enumerate() { + let is_last = i == last_idx; + let result = processor + .process_chunk(chunk, is_last) + .expect("should process chunk"); + + if is_last { + final_bytes = result.len(); + } else { + intermediate_bytes += result.len(); + } + full_output.extend_from_slice(&result); + } + + let output = String::from_utf8(full_output).expect("output should be valid UTF-8"); + + // --- Correctness assertions --- + + // 1. URL rewriting in HTML attributes should work + assert!( + output.contains("test.example.com/about"), + "HTML href URLs should be rewritten. 
Got: {output}" + ); + assert!( + output.contains("test.example.com/styles.css"), + "Link href URLs should be rewritten. Got: {output}" + ); + + // 2. RSC payloads should be rewritten via post-processing + assert!( + output.contains("test.example.com/page"), + "RSC payload URLs should be rewritten. Got: {output}" + ); + + // 3. No placeholder markers should leak into the output + assert!( + !output.contains("__ts_rsc_payload_"), + "RSC placeholder markers should not appear in final output. Got: {output}" + ); + + // 4. Non-RSC scripts should be preserved + assert!( + output.contains("analytics ready"), + "Non-RSC scripts should be preserved. Got: {output}" + ); + + // 5. HTML structure should be intact + assert!( + output.contains("") || output.contains(" 0 { + intermediate_bytes as f64 / (intermediate_bytes + final_bytes) as f64 * 100.0 + } else { + 0.0 + } + ); + } + + /// E2E test: verifies that HTML pages WITHOUT RSC (no post-processors active) + /// stream incrementally — chunks are emitted before `is_last`. + #[test] + fn non_rsc_html_streams_incrementally_without_post_processors() { + use crate::streaming_processor::StreamProcessor; + + let html = concat!( + "Regular Page", + "", + "", + "
", + "Page 1", + "Page 2", + "Page 3", + "
", + "", + ); + + // No Next.js integration — post_processors will be empty + let config = create_test_config(); + let mut processor = create_html_processor(config); + + let bytes = html.as_bytes(); + let chunk_size = 64; + let chunks: Vec<&[u8]> = bytes.chunks(chunk_size).collect(); + let last_idx = chunks.len().saturating_sub(1); + + let mut intermediate_bytes = 0usize; + let mut final_bytes = 0usize; + let mut full_output = Vec::new(); + + for (i, chunk) in chunks.iter().enumerate() { + let is_last = i == last_idx; + let result = processor + .process_chunk(chunk, is_last) + .expect("should process chunk"); + + if is_last { + final_bytes = result.len(); + } else { + intermediate_bytes += result.len(); + } + full_output.extend_from_slice(&result); + } + + let output = String::from_utf8(full_output).expect("output should be valid UTF-8"); + + // Correctness: URLs should be rewritten + assert!( + output.contains("test.example.com/page1"), + "URLs should be rewritten. Got: {output}" + ); + assert!( + !output.contains("origin.example.com"), + "No origin URLs should remain. Got: {output}" + ); + + // Streaming: intermediate chunks SHOULD produce output (no post-processors) + assert!( + intermediate_bytes > 0, + "Without post-processors, intermediate chunks should emit output (got 0 bytes). \ + This confirms true streaming. Final bytes: {final_bytes}" + ); + + println!( + "Streaming behavior without post-processors: intermediate_bytes={}, final_bytes={}, total={}", + intermediate_bytes, + final_bytes, + intermediate_bytes + final_bytes + ); + println!( + " Streaming ratio: {:.1}% of bytes emitted before is_last", + intermediate_bytes as f64 / (intermediate_bytes + final_bytes) as f64 * 100.0 + ); + } + + /// E2E test: RSC Flight responses (`text/x-component`) stream correctly + /// through the pipeline with URL rewriting and T-row length recalculation. 
+ #[test] + fn rsc_flight_response_streams_with_url_rewriting() { + use crate::rsc_flight::RscFlightUrlRewriter; + use crate::streaming_processor::StreamProcessor; + + // Simulate a Flight response with mixed row types + let t_content = r#"{"url":"https://origin.example.com/dashboard"}"#; + let flight_response = format!( + "0:[\"https://origin.example.com/page\"]\n\ + 1:T{:x},{}\ + 2:[\"ok\"]\n", + t_content.len(), + t_content, + ); + + let mut processor = RscFlightUrlRewriter::new( + "origin.example.com", + "https://origin.example.com", + "test.example.com", + "https", + ); + + // Process in small chunks to exercise cross-chunk state handling + let bytes = flight_response.as_bytes(); + let chunk_size = 11; // intentionally misaligned with row boundaries + let chunks: Vec<&[u8]> = bytes.chunks(chunk_size).collect(); + let last_idx = chunks.len().saturating_sub(1); + + let mut intermediate_bytes = 0usize; + let mut full_output = Vec::new(); + + for (i, chunk) in chunks.iter().enumerate() { + let is_last = i == last_idx; + let result = processor + .process_chunk(chunk, is_last) + .expect("should process flight chunk"); + + if !is_last { + intermediate_bytes += result.len(); + } + full_output.extend_from_slice(&result); + } + + let output = String::from_utf8(full_output).expect("output should be valid UTF-8"); + + // URLs should be rewritten + assert!( + output.contains("test.example.com/page"), + "Newline row URLs should be rewritten. Got: {output}" + ); + assert!( + output.contains("test.example.com/dashboard"), + "T-row URLs should be rewritten. Got: {output}" + ); + + // T-row length should be recalculated + let rewritten_t_content = r#"{"url":"https://test.example.com/dashboard"}"#; + let expected_len_hex = format!("{:x}", rewritten_t_content.len()); + assert!( + output.contains(&format!(":T{expected_len_hex},")), + "T-row length should be recalculated. 
Got: {output}" + ); + + // No origin URLs should remain + assert!( + !output.contains("origin.example.com"), + "No origin URLs should remain. Got: {output}" + ); + + // Flight rewriter should stream incrementally + assert!( + intermediate_bytes > 0, + "RSC Flight rewriter should emit output for intermediate chunks (got 0 bytes)" + ); + + // Trailing row should be preserved + assert!( + output.contains("2:[\"ok\"]\n"), + "Trailing rows should be preserved. Got: {output}" + ); + } } diff --git a/crates/common/src/integrations/nextjs/fixtures/app-router-large.html b/crates/common/src/integrations/nextjs/fixtures/app-router-large.html new file mode 100644 index 00000000..944609d2 --- /dev/null +++ b/crates/common/src/integrations/nextjs/fixtures/app-router-large.html @@ -0,0 +1,37 @@ + + + + + + Blog Post - Next.js RSC Test App + + + + + +
+
+

Blog Post: hello-world

+
Published on the blog
+
Hero image for hello-world
+

Paragraph 1: This content references https://origin.example.com/article/1 and includes links to https://origin.example.com/category/tech.

+

Paragraph 2: This content references https://origin.example.com/article/2 and includes links to https://origin.example.com/category/tech.

+

Paragraph 3: This content references https://origin.example.com/article/3 and includes links to https://origin.example.com/category/tech.

+

Paragraph 4: This content references https://origin.example.com/article/4 and includes links to https://origin.example.com/category/tech.

+

Paragraph 5: This content references https://origin.example.com/article/5 and includes links to https://origin.example.com/category/tech.

+ + +
+
+ + + + + + + + + + + + diff --git a/crates/common/src/integrations/nextjs/fixtures/app-router-simple.html b/crates/common/src/integrations/nextjs/fixtures/app-router-simple.html new file mode 100644 index 00000000..2d631860 --- /dev/null +++ b/crates/common/src/integrations/nextjs/fixtures/app-router-simple.html @@ -0,0 +1,34 @@ + + + + + + Next.js RSC Test App + + + + + + + +
+
+

Welcome to the Test App

+

Visit our getting started guide.

+ + Hero +
+
+ + + + + + + + + diff --git a/crates/common/src/integrations/nextjs/fixtures/app-router-tchunk.html b/crates/common/src/integrations/nextjs/fixtures/app-router-tchunk.html new file mode 100644 index 00000000..981b131c --- /dev/null +++ b/crates/common/src/integrations/nextjs/fixtures/app-router-tchunk.html @@ -0,0 +1,29 @@ + + + + + + About Us - Next.js RSC Test App + + + + +
+
+

About Us

+

We are building at origin.example.com.

+
+

Our Team

+
Alice Johnson

Alice Johnson

Engineering Lead

+
Bob Smith

Bob Smith

Product Manager

+
+
+
+ + + + + + + + diff --git a/crates/common/src/integrations/nextjs/fixtures/non-rsc-page.html b/crates/common/src/integrations/nextjs/fixtures/non-rsc-page.html new file mode 100644 index 00000000..8997cd86 --- /dev/null +++ b/crates/common/src/integrations/nextjs/fixtures/non-rsc-page.html @@ -0,0 +1,38 @@ + + + + + + Static Page - No RSC + + + + + +
+

Welcome

+

This is a static page without any React Server Components.

+

It contains regular HTML with URLs that should be rewritten:

+ + Banner +
+ + +
+
+ + + + + diff --git a/crates/common/src/integrations/nextjs/fixtures/real-nextjs-about.html b/crates/common/src/integrations/nextjs/fixtures/real-nextjs-about.html new file mode 100644 index 00000000..9b30d187 --- /dev/null +++ b/crates/common/src/integrations/nextjs/fixtures/real-nextjs-about.html @@ -0,0 +1 @@ +Next.js RSC Test App

About Us

We are building at origin.example.com.

Our Team

Alice Johnson

Alice Johnson

Engineering Lead

Bob Smith

Bob Smith

Product Manager

Resources

\ No newline at end of file diff --git a/crates/common/src/integrations/nextjs/fixtures/real-nextjs-blog.html b/crates/common/src/integrations/nextjs/fixtures/real-nextjs-blog.html new file mode 100644 index 00000000..607d894f --- /dev/null +++ b/crates/common/src/integrations/nextjs/fixtures/real-nextjs-blog.html @@ -0,0 +1 @@ +Next.js RSC Test App

Blog Post: hello-world

Published on the blog
Hero image for hello-world

Paragraph 1: This content references https://origin.example.com/article/1 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-1.

Paragraph 2: This content references https://origin.example.com/article/2 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-2.

Paragraph 3: This content references https://origin.example.com/article/3 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-3.

Paragraph 4: This content references https://origin.example.com/article/4 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-4.

Paragraph 5: This content references https://origin.example.com/article/5 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-5.

Paragraph 6: This content references https://origin.example.com/article/6 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-6.

Paragraph 7: This content references https://origin.example.com/article/7 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-7.

Paragraph 8: This content references https://origin.example.com/article/8 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-8.

Paragraph 9: This content references https://origin.example.com/article/9 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-9.

Paragraph 10: This content references https://origin.example.com/article/10 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-10.

Paragraph 11: This content references https://origin.example.com/article/11 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-11.

Paragraph 12: This content references https://origin.example.com/article/12 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-12.

Paragraph 13: This content references https://origin.example.com/article/13 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-13.

Paragraph 14: This content references https://origin.example.com/article/14 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-14.

Paragraph 15: This content references https://origin.example.com/article/15 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-15.

Paragraph 16: This content references https://origin.example.com/article/16 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-16.

Paragraph 17: This content references https://origin.example.com/article/17 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-17.

Paragraph 18: This content references https://origin.example.com/article/18 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-18.

Paragraph 19: This content references https://origin.example.com/article/19 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-19.

Paragraph 20: This content references https://origin.example.com/article/20 and includes links to https://origin.example.com/category/tech and https://origin.example.com/author/staff. For more information, visit https://origin.example.com/resources/guide-20.

\ No newline at end of file diff --git a/crates/common/src/integrations/nextjs/fixtures/real-nextjs-home.html b/crates/common/src/integrations/nextjs/fixtures/real-nextjs-home.html new file mode 100644 index 00000000..9782dddc --- /dev/null +++ b/crates/common/src/integrations/nextjs/fixtures/real-nextjs-home.html @@ -0,0 +1 @@ +Next.js RSC Test App

Welcome to the Test App

Visit our getting started guide.

Hero
\ No newline at end of file diff --git a/crates/common/src/integrations/nextjs/html_post_process.rs b/crates/common/src/integrations/nextjs/html_post_process.rs index c85bf517..e9ea7af4 100644 --- a/crates/common/src/integrations/nextjs/html_post_process.rs +++ b/crates/common/src/integrations/nextjs/html_post_process.rs @@ -9,7 +9,8 @@ use crate::integrations::{IntegrationHtmlContext, IntegrationHtmlPostProcessor}; use super::rsc::rewrite_rsc_scripts_combined_with_limit; use super::rsc_placeholders::{ - NextJsRscPostProcessState, RSC_PAYLOAD_PLACEHOLDER_PREFIX, RSC_PAYLOAD_PLACEHOLDER_SUFFIX, + needs_post_processing, NextJsRscPostProcessState, RSC_PAYLOAD_PLACEHOLDER_PREFIX, + RSC_PAYLOAD_PLACEHOLDER_SUFFIX, }; use super::shared::find_rsc_push_payload_range; use super::{NextJsIntegrationConfig, NEXTJS_INTEGRATION_ID}; @@ -29,6 +30,15 @@ impl IntegrationHtmlPostProcessor for NextJsHtmlPostProcessor { NEXTJS_INTEGRATION_ID } + fn needs_accumulation( + &self, + document_state: &crate::integrations::IntegrationDocumentState, + ) -> bool { + self.config.enabled + && !self.config.rewrite_attributes.is_empty() + && needs_post_processing(document_state) + } + fn should_process(&self, html: &str, ctx: &IntegrationHtmlContext<'_>) -> bool { if !self.config.enabled || self.config.rewrite_attributes.is_empty() { return false; diff --git a/crates/common/src/integrations/nextjs/rsc_placeholders.rs b/crates/common/src/integrations/nextjs/rsc_placeholders.rs index 1aa0b391..8ab9a03e 100644 --- a/crates/common/src/integrations/nextjs/rsc_placeholders.rs +++ b/crates/common/src/integrations/nextjs/rsc_placeholders.rs @@ -18,6 +18,14 @@ pub(super) const RSC_PAYLOAD_PLACEHOLDER_SUFFIX: &str = "__"; #[derive(Default)] pub(super) struct NextJsRscPostProcessState { pub(super) payloads: Vec, + /// Set to `true` when a fragmented script was observed during the streaming + /// pass (i.e. `lol_html` delivered script text in multiple chunks). 
The + /// placeholder rewriter cannot process fragmented scripts, so the + /// post-processor's fallback re-parse path must handle them. This flag + /// ensures accumulation is triggered even when no payloads were captured + /// via placeholders. For non-RSC scripts the post-processor's + /// `should_process` check will return false, so the only cost is buffering. + pub(super) saw_fragmented_script: bool, } impl NextJsRscPostProcessState { @@ -26,6 +34,31 @@ impl NextJsRscPostProcessState { } } +/// Returns `true` if the streaming pass detected RSC content that requires +/// post-processing. +/// +/// This covers two scenarios: +/// 1. Unfragmented RSC scripts whose payloads were captured as placeholders. +/// 2. Fragmented RSC scripts (script text split across `lol_html` chunks) +/// that the placeholder rewriter could not process — the post-processor's +/// fallback re-parse path will handle these. +/// +/// Used by `HtmlWithPostProcessing` to decide whether to start +/// accumulating output for post-processing. +#[must_use] +pub(super) fn needs_post_processing( + document_state: &crate::integrations::IntegrationDocumentState, +) -> bool { + document_state + .get::>(NEXTJS_INTEGRATION_ID) + .is_some_and(|state| { + let guard = state + .lock() + .unwrap_or_else(std::sync::PoisonError::into_inner); + !guard.payloads.is_empty() || guard.saw_fragmented_script + }) +} + fn rsc_payload_placeholder(index: usize) -> String { format!("{RSC_PAYLOAD_PLACEHOLDER_PREFIX}{index}{RSC_PAYLOAD_PLACEHOLDER_SUFFIX}") } @@ -58,8 +91,20 @@ impl IntegrationScriptRewriter for NextJsRscPlaceholderRewriter { // Fragmented scripts are handled by the post-processor which re-parses the final HTML. // This avoids corrupting non-RSC scripts that happen to be fragmented during streaming. if !ctx.is_last_in_text_node { - // Script is fragmented - skip placeholder processing. - // The post-processor will handle RSC scripts at end-of-document. 
+ // Script is fragmented — skip placeholder processing but flag it so + // that `HtmlWithPostProcessing` knows to accumulate output for the + // post-processor's fallback re-parse path. We flag any fragmented + // script (not just those containing `__next_f`) because the RSC + // marker can itself be split across chunk boundaries. + let state = ctx + .document_state + .get_or_insert_with(NEXTJS_INTEGRATION_ID, || { + Mutex::new(NextJsRscPostProcessState::default()) + }); + let mut guard = state + .lock() + .unwrap_or_else(std::sync::PoisonError::into_inner); + guard.saw_fragmented_script = true; return ScriptRewriteAction::keep(); } @@ -183,12 +228,18 @@ mod tests { "Final chunk of fragmented script should be kept" ); - // No payloads should be stored - post-processor will handle this + // No payloads should be stored - post-processor will handle this via re-parse + let stored = state + .get::>(NEXTJS_INTEGRATION_ID) + .expect("RSC state should be created for fragmented RSC scripts"); + let guard = stored.lock().expect("should lock Next.js RSC state"); + assert!( + guard.payloads.is_empty(), + "No payloads should be captured for fragmented scripts" + ); assert!( - state - .get::>(NEXTJS_INTEGRATION_ID) - .is_none(), - "No RSC state should be created for fragmented scripts" + guard.saw_fragmented_script, + "Fragmented scripts should set the saw_fragmented_script flag" ); } diff --git a/crates/common/src/integrations/registry.rs b/crates/common/src/integrations/registry.rs index 07fec408..2540c2fc 100644 --- a/crates/common/src/integrations/registry.rs +++ b/crates/common/src/integrations/registry.rs @@ -364,6 +364,15 @@ pub trait IntegrationHtmlPostProcessor: Send + Sync { /// Identifier for logging/diagnostics. fn integration_id(&self) -> &'static str; + /// Return `true` when this processor requires buffering of subsequent + /// streamed output so [`Self::post_process`] can run against complete HTML. 
+ /// + /// Defaults to `true` for correctness: processors that do not override this + /// method will continue to receive whole-document HTML as before. + fn needs_accumulation(&self, _document_state: &IntegrationDocumentState) -> bool { + true + } + /// Fast preflight check to decide whether post-processing should run for this document. /// /// Implementations should keep this cheap (e.g., a substring check) because it may run on @@ -945,6 +954,17 @@ mod tests { ); } + #[test] + fn default_html_post_processor_needs_accumulation_is_true() { + let processor = NoopHtmlPostProcessor; + let document_state = IntegrationDocumentState::default(); + + assert!( + processor.needs_accumulation(&document_state), + "Default `needs_accumulation` should be true for post-processing correctness" + ); + } + #[test] fn test_exact_route_matching() { let routes = vec![( diff --git a/crates/common/src/publisher.rs b/crates/common/src/publisher.rs index 831b4267..9b442942 100644 --- a/crates/common/src/publisher.rs +++ b/crates/common/src/publisher.rs @@ -170,6 +170,18 @@ fn create_html_stream_processor( Ok(create_html_processor(config)) } +fn apply_standard_response_headers(settings: &Settings, response: &mut Response) { + if let Ok(v) = ::std::env::var(ENV_FASTLY_SERVICE_VERSION) { + response.set_header(HEADER_X_TS_VERSION, v); + } + if ::std::env::var(ENV_FASTLY_IS_STAGING).as_deref() == Ok("1") { + response.set_header(HEADER_X_TS_ENV, "staging"); + } + for (key, value) in &settings.response_headers { + response.set_header(key, value); + } +} + /// Proxies requests to the publisher's origin server. 
/// /// This function forwards incoming requests to the configured origin URL, @@ -384,6 +396,7 @@ pub fn handle_publisher_request_streaming( ); response.set_header(HEADER_X_SYNTHETIC_ID, synthetic_id.as_str()); set_synthetic_cookie(settings, &mut response, synthetic_id.as_str()); + apply_standard_response_headers(settings, &mut response); return Ok(RouteResult::Buffered(response)); } @@ -403,18 +416,7 @@ pub fn handle_publisher_request_streaming( response.set_header(HEADER_X_SYNTHETIC_ID, synthetic_id.as_str()); set_synthetic_cookie(settings, &mut response, synthetic_id.as_str()); - - if let Ok(v) = ::std::env::var(ENV_FASTLY_SERVICE_VERSION) { - response.set_header(HEADER_X_TS_VERSION, v); - } - if ::std::env::var(ENV_FASTLY_IS_STAGING).as_deref() == Ok("1") { - response.set_header(HEADER_X_TS_ENV, "staging"); - } - - // Add global settings headers before streaming since we commit headers - for (key, value) in &settings.response_headers { - response.set_header(key, value); - } + apply_standard_response_headers(settings, &mut response); // Remove content-length since we stream and modify size response.remove_header(header::CONTENT_LENGTH); diff --git a/crates/common/tests/nextjs_integration.rs b/crates/common/tests/nextjs_integration.rs new file mode 100644 index 00000000..16e1845b --- /dev/null +++ b/crates/common/tests/nextjs_integration.rs @@ -0,0 +1,629 @@ +//! Fixture-driven integration tests for Next.js RSC URL rewriting. +//! +//! These tests exercise the full streaming pipeline against realistic HTML +//! fixtures captured from a Next.js App Router application. Each fixture is +//! processed with multiple chunk sizes to exercise both the placeholder path +//! (unfragmented scripts) and the fallback re-parse path (fragmented scripts). 
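The per-chunk measurement pattern these fixture tests rely on — split the input at a fixed chunk size, feed each chunk with an `is_last` flag, and tally bytes emitted before the final chunk (the numerator of the streaming ratio) — can be sketched generically. The `process` closure here is a hypothetical stand-in, not the crate's `StreamProcessor` trait:

```rust
/// Drive `process` over fixed-size chunks of `input`, returning
/// (bytes emitted before the last chunk, bytes emitted on the last chunk).
fn drive_chunks<F>(input: &[u8], chunk_size: usize, mut process: F) -> (usize, usize)
where
    F: FnMut(&[u8], bool) -> Vec<u8>,
{
    let chunks: Vec<&[u8]> = input.chunks(chunk_size).collect();
    let last = chunks.len().saturating_sub(1);
    let (mut intermediate, mut final_bytes) = (0usize, 0usize);
    for (i, chunk) in chunks.iter().enumerate() {
        let out = process(chunk, i == last);
        if i == last {
            final_bytes = out.len();
        } else {
            intermediate += out.len();
        }
    }
    (intermediate, final_bytes)
}
```

With a pass-through closure, `intermediate + final_bytes` equals the input length; a fully buffering processor instead reports `intermediate == 0`, which is exactly the distinction the fixture tests assert on.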
+ +#![allow(clippy::print_stdout)] + +use std::io::Cursor; + +use trusted_server_common::html_processor::{create_html_processor, HtmlProcessorConfig}; +use trusted_server_common::integrations::IntegrationRegistry; +use trusted_server_common::settings::Settings; +use trusted_server_common::streaming_processor::{ + Compression, PipelineConfig, StreamProcessor, StreamingPipeline, +}; + +// --------------------------------------------------------------------------- +// Fixtures +// --------------------------------------------------------------------------- + +const FIXTURE_SIMPLE: &str = + include_str!("../src/integrations/nextjs/fixtures/app-router-simple.html"); +const FIXTURE_TCHUNK: &str = + include_str!("../src/integrations/nextjs/fixtures/app-router-tchunk.html"); +const FIXTURE_LARGE: &str = + include_str!("../src/integrations/nextjs/fixtures/app-router-large.html"); +const FIXTURE_NON_RSC: &str = include_str!("../src/integrations/nextjs/fixtures/non-rsc-page.html"); + +// --------------------------------------------------------------------------- +// Test helpers +// --------------------------------------------------------------------------- + +const ORIGIN_HOST: &str = "origin.example.com"; +const PROXY_HOST: &str = "proxy.example.com"; +const SCHEME: &str = "https"; + +/// Small chunk size to maximize script fragmentation and exercise cross-chunk state handling. +/// With 32-64 byte chunks, `lol_html` frequently fragments script text nodes, forcing the +/// fallback re-parse path for RSC placeholder substitution. +const CHUNK_SIZE_SMALL: usize = 32; + +/// Medium chunk size - typical for network reads. Balances between fragmentation +/// and realistic streaming behavior. +const CHUNK_SIZE_MEDIUM: usize = 256; + +/// Large chunk size - can fit small to medium HTML documents in a single chunk. +/// Tests the placeholder path (unfragmented scripts) vs fallback re-parse path. 
+const CHUNK_SIZE_LARGE: usize = 8192; + +fn create_nextjs_settings() -> Settings { + let toml = r#" + [[handlers]] + path = "^/secure" + username = "user" + password = "pass" + + [publisher] + domain = "test-publisher.com" + cookie_domain = ".test-publisher.com" + origin_backend = "publisher_origin" + origin_url = "https://origin.example.com" + proxy_secret = "unit-test-proxy-secret" + + [integrations.prebid] + enabled = false + + [integrations.nextjs] + enabled = true + rewrite_attributes = ["href", "link", "url"] + + [synthetic] + counter_store = "test-counter-store" + opid_store = "test-opid-store" + secret_key = "test-secret-key" + template = "{{client_ip}}:{{user_agent}}" + + [request_signing] + config_store_id = "test-config-store-id" + secret_store_id = "test-secret-store-id" + + [[backends]] + name = "publisher_origin" + target = "https://origin.example.com" + "#; + Settings::from_toml(toml).expect("test settings should parse") +} + +fn create_non_rsc_settings() -> Settings { + let toml = r#" + [[handlers]] + path = "^/secure" + username = "user" + password = "pass" + + [publisher] + domain = "test-publisher.com" + cookie_domain = ".test-publisher.com" + origin_backend = "publisher_origin" + origin_url = "https://origin.example.com" + proxy_secret = "unit-test-proxy-secret" + + [integrations.prebid] + enabled = false + + [integrations.nextjs] + enabled = false + + [synthetic] + counter_store = "test-counter-store" + opid_store = "test-opid-store" + secret_key = "test-secret-key" + template = "{{client_ip}}:{{user_agent}}" + + [request_signing] + config_store_id = "test-config-store-id" + secret_store_id = "test-secret-store-id" + + [[backends]] + name = "publisher_origin" + target = "https://origin.example.com" + "#; + Settings::from_toml(toml).expect("test settings should parse") +} + +struct FixtureTestResult { + output: String, + intermediate_bytes: usize, + final_bytes: usize, +} + +impl FixtureTestResult { + fn total_bytes(&self) -> usize { + 
self.intermediate_bytes + self.final_bytes + } + + fn streaming_ratio(&self) -> f64 { + let total = self.total_bytes(); + if total == 0 { + 0.0 + } else { + self.intermediate_bytes as f64 / total as f64 + } + } +} + +/// Process a fixture through the full streaming pipeline and return results. +fn run_pipeline_test(fixture: &str, chunk_size: usize, settings: &Settings) -> FixtureTestResult { + let registry = IntegrationRegistry::new(settings).expect("should create registry"); + let config = + HtmlProcessorConfig::from_settings(settings, ®istry, ORIGIN_HOST, PROXY_HOST, SCHEME); + let processor = create_html_processor(config); + + let pipeline_config = PipelineConfig { + input_compression: Compression::None, + output_compression: Compression::None, + chunk_size, + }; + let mut pipeline = StreamingPipeline::new(pipeline_config, processor); + let mut output = Vec::new(); + pipeline + .process(Cursor::new(fixture.as_bytes()), &mut output) + .expect("pipeline should process fixture"); + + let output_str = String::from_utf8(output).expect("output should be valid UTF-8"); + + // StreamingPipeline doesn't expose per-chunk metrics, so we use a + // chunk-level processor to measure streaming behavior. + FixtureTestResult { + output: output_str, + intermediate_bytes: 0, + final_bytes: 0, + } +} + +/// Process a fixture chunk-by-chunk using the raw `StreamProcessor` interface +/// to measure streaming behavior. 
+fn run_chunked_test(fixture: &str, chunk_size: usize, settings: &Settings) -> FixtureTestResult { + let registry = IntegrationRegistry::new(settings).expect("should create registry"); + let config = + HtmlProcessorConfig::from_settings(settings, ®istry, ORIGIN_HOST, PROXY_HOST, SCHEME); + let mut processor = create_html_processor(config); + + let bytes = fixture.as_bytes(); + let chunks: Vec<&[u8]> = bytes.chunks(chunk_size).collect(); + let last_idx = chunks.len().saturating_sub(1); + + let mut intermediate_bytes = 0usize; + let mut final_bytes = 0usize; + let mut full_output = Vec::new(); + + for (i, chunk) in chunks.iter().enumerate() { + let is_last = i == last_idx; + let result = processor + .process_chunk(chunk, is_last) + .expect("should process chunk"); + + if is_last { + final_bytes = result.len(); + } else { + intermediate_bytes += result.len(); + } + full_output.extend_from_slice(&result); + } + + let output = String::from_utf8(full_output).expect("output should be valid UTF-8"); + + FixtureTestResult { + output, + intermediate_bytes, + final_bytes, + } +} + +/// Shared correctness assertions for RSC fixtures. +fn assert_rsc_correctness(result: &FixtureTestResult, fixture_name: &str) { + // All origin URLs should be rewritten + assert!( + result.output.contains(PROXY_HOST), + "[{fixture_name}] Output should contain proxy host. 
 Got:\n{}",
        &result.output[..result.output.len().min(500)]
    );

    // No RSC placeholder markers should leak
    assert!(
        !result.output.contains("__ts_rsc_payload_"),
        "[{fixture_name}] No RSC placeholder markers should appear in output"
    );

    // HTML structure should be intact
    assert!(
        result.output.contains("</html>"),
        "[{fixture_name}] HTML closing tag should be present"
    );

    // RSC scripts should still be present (even if content is rewritten)
    assert!(
        result.output.contains("__next_f"),
        "[{fixture_name}] RSC scripts should be preserved in output"
    );
}

fn assert_non_rsc_correctness(result: &FixtureTestResult, fixture_name: &str) {
    assert!(
        result.output.contains(PROXY_HOST),
        "[{fixture_name}] Output should contain proxy host"
    );
    assert!(
        result.output.contains("</html>"),
        "[{fixture_name}] HTML closing tag should be present"
    );
}

#[test]
fn non_rsc_page_streams_without_nextjs() {
    let settings = create_non_rsc_settings();

    let result = run_chunked_test(FIXTURE_NON_RSC, CHUNK_SIZE_MEDIUM, &settings);
    assert_non_rsc_correctness(&result, "non-rsc/nextjs-disabled/256");

    assert!(
        result.intermediate_bytes > 0,
        "Non-RSC pages should stream incrementally (got 0 intermediate bytes). \
            Final bytes: {}",
        result.final_bytes
    );

    println!(
        "non-rsc streaming ratio: {:.1}%",
        result.streaming_ratio() * 100.0
    );
}

#[test]
fn non_rsc_page_streams_with_nextjs_enabled() {
    // Even with Next.js enabled, non-RSC pages with unfragmented scripts should
    // stream because the lazy accumulation fix only triggers for RSC content.
    let settings = create_nextjs_settings();

    // Use a chunk size that produces multiple chunks for the ~1KB fixture,
    // but is large enough that the small analytics scripts (~30 bytes each)
    // won't be fragmented by lol_html.
    let result = run_chunked_test(FIXTURE_NON_RSC, CHUNK_SIZE_MEDIUM, &settings);
    assert_non_rsc_correctness(&result, "non-rsc/nextjs-enabled/256");

    assert!(
        result.intermediate_bytes > 0,
        "Non-RSC pages should stream even when Next.js is enabled \
            (got 0 intermediate bytes). 
Final bytes: {}", + result.final_bytes + ); + + println!( + "non-rsc with nextjs enabled streaming ratio: {:.1}%", + result.streaming_ratio() * 100.0 + ); +} + +// =========================================================================== +// Tests: URL rewriting completeness across fixtures +// =========================================================================== + +#[test] +fn all_fixtures_rewrite_html_attribute_urls() { + let settings = create_nextjs_settings(); + + for (name, fixture) in [ + ("simple", FIXTURE_SIMPLE), + ("tchunk", FIXTURE_TCHUNK), + ("large", FIXTURE_LARGE), + ] { + let result = run_pipeline_test(fixture, 8192, &settings); + + // href attributes should be rewritten + assert!( + !result.output.contains("href=\"https://origin.example.com"), + "[{name}] href attributes should be rewritten to proxy host" + ); + + // src attributes should be rewritten + assert!( + !result.output.contains("src=\"https://origin.example.com"), + "[{name}] src attributes should be rewritten to proxy host" + ); + } +} + +// =========================================================================== +// Tests: Real Next.js output (captured from the example app) +// =========================================================================== +// These fixtures are actual HTML responses from a Next.js 15 App Router app, +// not hand-crafted. They exercise the full complexity of real RSC payloads. 
+

const REAL_HOME: &str = include_str!("../src/integrations/nextjs/fixtures/real-nextjs-home.html");
const REAL_ABOUT: &str = include_str!("../src/integrations/nextjs/fixtures/real-nextjs-about.html");
const REAL_BLOG: &str = include_str!("../src/integrations/nextjs/fixtures/real-nextjs-blog.html");

#[test]
fn real_nextjs_home_pipeline() {
    let settings = create_nextjs_settings();
    for chunk_size in [32, 64, 256, 8192] {
        let result = run_pipeline_test(REAL_HOME, chunk_size, &settings);

        assert!(
            result.output.contains(PROXY_HOST),
            "[real-home/chunk={chunk_size}] Output should contain proxy host"
        );
        assert!(
            !result.output.contains("__ts_rsc_payload_"),
            "[real-home/chunk={chunk_size}] No placeholder markers should leak"
        );
        assert!(
            result.output.contains("</html>"),
            "[real-home/chunk={chunk_size}] HTML should be complete"
        );
    }
}

#[test]
fn real_nextjs_rsc_payloads_rewritten() {
    let settings = create_nextjs_settings();

    for (name, fixture) in [
        ("real-home", REAL_HOME),
        ("real-about", REAL_ABOUT),
        ("real-blog", REAL_BLOG),
    ] {
        for chunk_size in [64, 8192] {
            let result = run_pipeline_test(fixture, chunk_size, &settings);

            // Count origin URLs that remain inside <script> content (RSC payloads)
            let rsc_origin_count = result
                .output
                .match_indices(ORIGIN_HOST)
                .map(|(pos, _)| pos)
                .filter(|pos| {
                    let before = &result.output[..*pos];
                    let last_script_open = before.rfind("<script");
                    let last_script_close = before.rfind("</script>");
                    match (last_script_open, last_script_close) {
                        (Some(open), Some(close)) => open > close, // inside a script
                        (Some(_), None) => true, // inside first script
                        _ => false,
                    }
                })
                .count();

            println!(
                "[{name}/chunk={chunk_size}] RSC payload origin URLs remaining: {rsc_origin_count}"
            );

            // RSC payloads should be rewritten (origin URLs replaced with proxy URLs)
            assert_eq!(
                rsc_origin_count, 0,
                "[{name}/chunk={chunk_size}] All origin URLs in RSC payloads should be rewritten \
                    to proxy host. Found {rsc_origin_count} remaining." 
+            );
        }
    }
}

#[test]
fn real_nextjs_streaming_behavior() {
    let settings = create_nextjs_settings();

    for (name, fixture) in [
        ("real-home", REAL_HOME),
        ("real-about", REAL_ABOUT),
        ("real-blog", REAL_BLOG),
    ] {
        // Small chunks to see streaming behavior
        let result = run_chunked_test(fixture, 64, &settings);

        println!(
            "[{name}] streaming: {:.1}% ({} intermediate, {} final)",
            result.streaming_ratio() * 100.0,
            result.intermediate_bytes,
            result.final_bytes
        );

        // Correctness should hold regardless of chunk size
        assert!(
            result.output.contains(PROXY_HOST),
            "[{name}] Output should contain proxy host with 64-byte chunks"
        );
        assert!(
            result.output.contains("<script"),
            "[{name}] Script tags should be preserved with 64-byte chunks"
        );
    }
}
diff --git a/crates/fastly/src/main.rs b/crates/fastly/src/main.rs
--- a/crates/fastly/src/main.rs
+++ b/crates/fastly/src/main.rs
+#[derive(PartialEq)]
+enum RouteTarget {
+    TsjsDynamic,
+    Discovery,
+    VerifySignature,
+    RotateKey,
+    DeactivateKey,
+    Auction,
+    FirstPartyProxy,
+    FirstPartyClick,
+    FirstPartySign,
+    FirstPartyProxyRebuild,
+    Integration,
+    PublisherProxy,
+}
+
+fn classify_route(
+    method: &Method,
+    path: &str,
+    integration_registry: &IntegrationRegistry,
+) -> RouteTarget {
    match (method.clone(), path) {
        (Method::GET, p) if p.starts_with("/static/tsjs=") => RouteTarget::TsjsDynamic,
        (Method::GET, "/.well-known/trusted-server.json") => RouteTarget::Discovery,
        (Method::POST, "/verify-signature") => RouteTarget::VerifySignature,
        (Method::POST, "/admin/keys/rotate") => RouteTarget::RotateKey,
        (Method::POST, "/admin/keys/deactivate") => RouteTarget::DeactivateKey,
        (Method::POST, "/auction") => RouteTarget::Auction,
        (Method::GET, "/first-party/proxy") => RouteTarget::FirstPartyProxy,
        (Method::GET, "/first-party/click") => RouteTarget::FirstPartyClick,
        (Method::GET, "/first-party/sign") | (Method::POST, "/first-party/sign") => {
            RouteTarget::FirstPartySign
        }
        (Method::POST, "/first-party/proxy-rebuild") => RouteTarget::FirstPartyProxyRebuild,
        (m, p) if integration_registry.has_route(&m, p) => RouteTarget::Integration,
        _ => RouteTarget::PublisherProxy,
    }
}

fn apply_standard_response_headers(response: &mut Response, settings: &Settings) {
    if let Ok(v) = ::std::env::var(ENV_FASTLY_SERVICE_VERSION) {
        response.set_header(HEADER_X_TS_VERSION, v);
    }
    if ::std::env::var(ENV_FASTLY_IS_STAGING).as_deref() == Ok("1") {
        response.set_header(HEADER_X_TS_ENV, "staging");
    }
    for (key, value) in 
&settings.response_headers { + response.set_header(key, value); + } +} + fn main() { fastly::init(); init_logger(); @@ -84,33 +135,15 @@ async fn route_request( ); if let Some(mut response) = enforce_basic_auth(settings, &req) { - for (key, value) in &settings.response_headers { - response.set_header(key, value); - } + apply_standard_response_headers(&mut response, settings); return Ok(RouteResult::Buffered(response)); } // Get path and method for routing let path = req.get_path().to_string(); let method = req.get_method().clone(); - - // Check if it's the publisher proxy fallback - let is_publisher_proxy = match (method.clone(), path.as_str()) { - (Method::GET, p) if p.starts_with("/static/tsjs=") => false, - (Method::GET, "/.well-known/trusted-server.json") => false, - (Method::POST, "/verify-signature") => false, - (Method::POST, "/admin/keys/rotate") => false, - (Method::POST, "/admin/keys/deactivate") => false, - (Method::POST, "/auction") => false, - (Method::GET, "/first-party/proxy") => false, - (Method::GET, "/first-party/click") => false, - (Method::GET, "/first-party/sign") | (Method::POST, "/first-party/sign") => false, - (Method::POST, "/first-party/proxy-rebuild") => false, - (m, p) if integration_registry.has_route(&m, p) => false, - _ => true, - }; - - if is_publisher_proxy { + let target = classify_route(&method, &path, integration_registry); + if target == RouteTarget::PublisherProxy { log::info!( "No known route matched for path: {}, proxying to publisher origin", path @@ -122,70 +155,40 @@ async fn route_request( Err(e) => { log::error!("Failed to proxy to publisher origin: {:?}", e); let mut err_resp = to_error_response(&e); - for (key, value) in &settings.response_headers { - err_resp.set_header(key, value); - } + apply_standard_response_headers(&mut err_resp, settings); return Ok(RouteResult::Buffered(err_resp)); } } } // Match known routes and handle them - let result = match (method, path.as_str()) { - // Serve the tsjs library - 
(Method::GET, path) if path.starts_with("/static/tsjs=") => { - handle_tsjs_dynamic(&req, integration_registry) - } - - // Discovery endpoint for trusted-server capabilities and JWKS - (Method::GET, "/.well-known/trusted-server.json") => { - handle_trusted_server_discovery(settings, req) - } - - // Signature verification endpoint - (Method::POST, "/verify-signature") => handle_verify_signature(settings, req), - - // Key rotation admin endpoints - (Method::POST, "/admin/keys/rotate") => handle_rotate_key(settings, req), - (Method::POST, "/admin/keys/deactivate") => handle_deactivate_key(settings, req), - - // Unified auction endpoint (returns creative HTML inline) - (Method::POST, "/auction") => handle_auction(settings, orchestrator, req).await, - - // tsjs endpoints - (Method::GET, "/first-party/proxy") => handle_first_party_proxy(settings, req).await, - (Method::GET, "/first-party/click") => handle_first_party_click(settings, req).await, - (Method::GET, "/first-party/sign") | (Method::POST, "/first-party/sign") => { - handle_first_party_proxy_sign(settings, req).await - } - (Method::POST, "/first-party/proxy-rebuild") => { + let result = match target { + RouteTarget::TsjsDynamic => handle_tsjs_dynamic(&req, integration_registry), + RouteTarget::Discovery => handle_trusted_server_discovery(settings, req), + RouteTarget::VerifySignature => handle_verify_signature(settings, req), + RouteTarget::RotateKey => handle_rotate_key(settings, req), + RouteTarget::DeactivateKey => handle_deactivate_key(settings, req), + RouteTarget::Auction => handle_auction(settings, orchestrator, req).await, + RouteTarget::FirstPartyProxy => handle_first_party_proxy(settings, req).await, + RouteTarget::FirstPartyClick => handle_first_party_click(settings, req).await, + RouteTarget::FirstPartySign => handle_first_party_proxy_sign(settings, req).await, + RouteTarget::FirstPartyProxyRebuild => { handle_first_party_proxy_rebuild(settings, req).await } - (m, path) if 
integration_registry.has_route(&m, path) => integration_registry - .handle_proxy(&m, path, settings, req) + RouteTarget::Integration => integration_registry + .handle_proxy(&method, &path, settings, req) .await .unwrap_or_else(|| { Err(Report::new(TrustedServerError::BadRequest { message: format!("Unknown integration route: {path}"), })) }), - - _ => unreachable!(), + RouteTarget::PublisherProxy => unreachable!(), }; // Convert any errors to HTTP error responses let mut response = result.unwrap_or_else(|e| to_error_response(&e)); - - if let Ok(v) = ::std::env::var(ENV_FASTLY_SERVICE_VERSION) { - response.set_header(HEADER_X_TS_VERSION, v); - } - if ::std::env::var(ENV_FASTLY_IS_STAGING).as_deref() == Ok("1") { - response.set_header(HEADER_X_TS_ENV, "staging"); - } - - for (key, value) in &settings.response_headers { - response.set_header(key, value); - } + apply_standard_response_headers(&mut response, settings); Ok(RouteResult::Buffered(response)) } diff --git a/examples/nextjs-rsc-app/README.md b/examples/nextjs-rsc-app/README.md new file mode 100644 index 00000000..834aedb4 --- /dev/null +++ b/examples/nextjs-rsc-app/README.md @@ -0,0 +1,93 @@ +# Next.js RSC Test App + +Minimal Next.js 15 App Router application for testing Trusted Server's RSC +(React Server Components) URL rewriting integration. + +## Purpose + +This app generates realistic RSC Flight payloads containing +`origin.example.com` URLs. 
These payloads exercise every rewriting path in the +Trusted Server HTML processor: + +| Route | RSC Pattern | Rewriting Path | +|-------|------------|----------------| +| `/` | Simple JSON URLs in `__next_f.push` | Placeholder substitution | +| `/about` | HTML content with URLs (T-chunks) | T-chunk length recalculation | +| `/blog/hello-world` | Large payload spanning multiple scripts | Cross-script T-chunk handling | + +## Quick Start + +```bash +npm install +npm run dev +# Visit http://localhost:3099 +``` + +## Testing RSC Streaming + +### Quick Test with Live HTML + +Test with HTML from your **currently running** server: + +```bash +# Terminal 1: Start dev server +npm run dev + +# Terminal 2: Test live HTML +./test-live-html.sh # Test home page +./test-live-html.sh http://localhost:3099/about # Test specific route +``` + +This fetches fresh HTML from your server and processes it through the trusted-server pipeline. Perfect for rapid iteration during development. + +### Full E2E Test + +Run a complete end-to-end test (builds production server): + +```bash +./test-streaming.sh +``` + +This script: +1. Builds and starts the Next.js production server +2. Fetches HTML from all routes +3. Verifies RSC content is present +4. Runs Rust integration tests +5. Shows streaming metrics for each route + +**Expected Results:** +- ✅ RSC payloads contain `origin.example.com` URLs before processing +- ✅ After processing through trusted-server pipeline: **0 origin URLs remain in RSC payloads** +- ✅ Streaming ratios: 20-40% for RSC pages (vs 0% before the fix) +- ✅ Non-RSC pages stream at 96%+ + +📖 See [TESTING.md](./TESTING.md) for detailed testing documentation. 
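
The pass/fail criterion above — zero `origin.example.com` URLs left after processing — boils down to a grep count. Here is a minimal, self-contained sketch of that check (the sample HTML is inlined as an assumption; in practice you would pipe in the processed output from `./test-live-html.sh`):

```shell
# Sample of already-rewritten output: every URL points at the proxy host.
html='<a href="https://proxy.example.com/page">link</a><script>self.__next_f.push([1,"https://proxy.example.com/img.png"])</script>'

# grep -c prints the number of matching lines; `|| true` keeps the pipeline
# from failing when the count is zero (grep exits non-zero on no match).
count=$(printf '%s' "$html" | grep -c 'origin\.example\.com' || true)

echo "origin URLs remaining: $count"   # -> origin URLs remaining: 0
```

A non-zero count after processing means some RSC payload escaped rewriting.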
+

## Capturing Fixtures

To regenerate the HTML fixtures used by Rust integration tests:

```bash
npm ci
npm run capture-fixtures
```

After `npm ci` installs dependencies, the `capture-fixtures` script builds the
app, starts `next start`, captures HTML from each route, validates that RSC
payloads are present, and saves the output to
`crates/common/src/integrations/nextjs/fixtures/`.

## How It Works

Each page component includes URLs with the `origin.example.com` hostname. When
Next.js renders these as RSC Flight data (inlined `