diff --git a/.config/nextest.toml b/.config/nextest.toml
index 386ef0f..642ce83 100644
--- a/.config/nextest.toml
+++ b/.config/nextest.toml
@@ -11,8 +11,23 @@ leak-timeout = "1s"
 filter = 'test(server::tests::) | binary(client_server)'
 test-group = 'serial-sd-port'
 
+# bare_metal_e2e tests share static channel pools declared via
+# `define_static_channels!` — pool slots are not reclaimed until the
+# process exits, so parallel tests exhaust the pools. Run serially.
+[[profile.default.overrides]]
+filter = 'binary(bare_metal_e2e)'
+test-group = 'serial-static-pools'
+
+# static_channels_alloc_witness tests share a counting global allocator
+# and static channel pools. The internal MEASURE_LOCK serializes allocation
+# measurement, but pool exhaustion still requires serial execution.
+[[profile.default.overrides]]
+filter = 'binary(static_channels_alloc_witness)'
+test-group = 'serial-static-pools'
+
 [test-groups]
 serial-sd-port = { max-threads = 1 }
+serial-static-pools = { max-threads = 1 }
 
 [profile.default.junit]  # Output the junit coverage for tools
 path = "junit.xml"
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index fa278bd..671c115 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -65,6 +65,22 @@ jobs:
         with:
           tool: cargo-llvm-cov, cargo-nextest
       - run: cargo test --no-default-features
+      - name: Build matrix — partial feature subsets
+        run: |
+          cargo build --no-default-features --features bare_metal
+          cargo build --no-default-features --features embassy_channels
+          cargo build --no-default-features --features client
+          cargo build --no-default-features --features server
+          cargo build --no-default-features --features client,server
+      - name: Doc — partial feature subsets (catch unresolved intra-doc links)
+        env:
+          RUSTDOCFLAGS: -D warnings
+        run: |
+          cargo doc --no-deps --no-default-features --features client
+          cargo doc --no-deps --no-default-features --features server,bare_metal
+          cargo doc --no-deps --all-features
+      - name: No-alloc witness (explicit gate)
+        run: cargo test --features client,bare_metal --test no_alloc_witness
       - run: cargo llvm-cov nextest --all-features --lcov --output-path ./target/lcov.info
       - name: Upload Coverage report
         uses: codecov/codecov-action@v5
diff --git a/.gitignore b/.gitignore
index 93edde4..1daa9fa 100644
--- a/.gitignore
+++ b/.gitignore
@@ -1,7 +1,6 @@
-.DS_Store
-
-/target
 
+.claude/
 CLAUDE.md
-
+.DS_Store
 lcov.info
+/target
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 128fece..c39d428 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,11 +1,56 @@
 # Changelog
 
-## [Unreleased]
+## [0.8.0]
+
+### Added
+
+- **`client::Error::Capacity(&'static str)`** — new variant returned when a fixed-capacity internal structure is full. Current tags: `"unicast_sockets"`, `"udp_buffer"`, `"pending_responses"`, `"request_queue"`. Because `client::Error` is not `#[non_exhaustive]`, this is a breaking change for downstream crates that match the enum exhaustively.
+- **`client::Error::Transport(crate::transport::TransportError)`** — new variant surfacing failures from the pluggable transport backend (`#[from]`-converted, displays transparently). Same exhaustive-match caveat as above.
+- **`client::Error::Shutdown`** — new variant returned by every `Client` method when the control channel is closed (run-loop future was dropped, cancelled, or exited). Replaces the previous `.unwrap()`-on-closed-channel panic path.
+- **`server::SubscribeError`** — new public enum (`SubscribersPerGroupFull`, `EventGroupsFull`) returned by `SubscriptionManager::subscribe` and `EventPublisher::register_subscriber` when a bounded capacity rejects a subscription. Re-exported from `server::mod`.
+- **`Client::new_with_loopback(interface, multicast_loopback)`** — constructor that exposes the previously-internal `multicast_loopback` knob for same-host integration tests.
+- **`Client::new_with_spawner_and_loopback(interface, multicast_loopback, spawner)`** — executor-agnostic constructor that accepts a caller-supplied `Spawner` impl. Bare-metal callers swap `TokioSpawner` for their own task pool.
+- **`Client::new_with_deps_local`** — constructor for single-threaded / `!Send` executors. Accepts a `LocalSpawner` instead of `Spawner` and relaxes the `Send` bound on the transport socket.
+- **`transport::Spawner` trait** (re-exported as `simple_someip::Spawner`) — executor-agnostic task-spawn abstraction. `tokio_transport::TokioSpawner` is the default `std + tokio` impl.
+- **`transport::LocalSpawner` trait** — single-threaded task-spawn abstraction for `!Send` futures. Enables use on runtimes like `tokio::LocalSet` or embassy's single-threaded executor.
+- **`transport::TransportSocket` / `TransportFactory` / `Timer` traits** — executor-agnostic UDP transport abstraction. Default `tokio_transport::TokioTransport` / `TokioSocket` / `TokioTimer` impls available behind the `client-tokio` / `server-tokio` features.
+- **`bare_metal` cargo feature** — activates embassy-sync as the channel backend and enables the `static_channels` module, `AtomicInterfaceHandle`, and `StaticE2EHandle` types. The heap-backed `EmbassySyncChannels` factory is separately gated by the `embassy_channels` feature (which implies `bare_metal`). See `examples/bare_metal_client/` and `examples/bare_metal_server/` for runnable integration examples. Validate with `cargo build -p bare_metal_client` / `cargo build -p bare_metal_server`, NOT `cargo build --workspace` (workspace builds may unify features and mask regressions).
+- **`SubscriptionManager::subscribe` returning a `Result`** — see "Changed" below; the regression test list now exercises the major-version mismatch path explicitly.
 
 ### Changed
 
-- **`std` is now the default feature** — the crate enables `std` (with `thiserror` and `tracing`) by default. Users targeting `no_std` environments must set `default-features = false` in their `Cargo.toml`.
-- **`thiserror` and `tracing` use `default-features = false`** — both dependencies are always included but their `std` features are only enabled when the crate's `std` feature is active. This removes the need for `#[cfg(feature = "std")]` gating on error types and logging macros.
+- **Breaking: `Client::new(interface)` return shape** — previously returned `(Client, ClientUpdates)`; now returns `(Client, ClientUpdates, impl Future<Output = ()> + Send + 'static)`. The third element is the run-loop future, which the caller MUST drive (typically via `tokio::spawn`) for any `Client` method to make progress. Migration: change destructuring to a 3-tuple and spawn or otherwise actively poll the future.
+- **Breaking: `Server::start_announcing` removed → `Server::announcement_loop`** — the new method returns `Result<impl Future<Output = ()> + Send + 'static, Error>` (annotated `#[must_use]`). Spawn the returned future to fire announcements; calling and dropping the future is a silent no-op.
+- **Breaking: `Client::start_sd_announcements` renamed to `Client::sd_announcements_loop`** — same semantic shift as `announcement_loop`: returns an `impl Future` instead of spawning internally, so the caller drives execution.
+- **Breaking: `Client::reboot_flag(&self)` now returns `Result<protocol::sd::RebootFlag, Error>`** — previously returned the bare flag and could panic if the run-loop had exited. All other public `Client` methods migrated to the same `Err(Error::Shutdown)` policy in this release; `reboot_flag` is now consistent.
+- **Breaking: `server::SubscriptionManager::subscribe` signature change** — now returns `Result<(), server::SubscribeError>` instead of `()`. Previously, capacity rejections were silently dropped with only a `warn!` log, which let the server emit a `SubscribeAck` for a subscription that had not been recorded. Callers must now handle the `Err` path (the server's own SD loop emits `SubscribeNack` on `Err`).
+- **Breaking: `server::EventPublisher::register_subscriber` signature change** — now returns `Result<(), server::SubscribeError>` instead of `()`, surfacing the same capacity-rejection signal to externally managed subscription dispatchers.
+- **Breaking: `Server::unicast_local_addr` return type changed** — previously returned `Result<std::net::SocketAddr, std::io::Error>`; now returns `Result<std::net::SocketAddr, server::Error>`. Callers that pattern-matched on `std::io::Error` must update to `server::Error::Transport(e)` and access the inner `TransportError` from there.
+- **Breaking: default features changed `default = []` → `default = ["std"]`** — previously `embedded-io/std`, `thiserror/std`, and `tracing/std` were always-on; they are now gated behind the new `std` feature. Downstream consumers building with `default-features = false` who relied on the implicit `std` propagation must add `features = ["std"]` (or one of `client` / `server`, which both imply `std`).
+- **Breaking: `Client::new` type signature now `Client::<M, R, I, C>::new`** — the `Client` struct gained three additional type parameters for the executor traits (`R: TransportFactory`, `I: InterfaceHandle`, `C: ChannelFactory`). The tokio-default convenience constructor is now gated behind the `client-tokio` feature (was `client`). Migration: add `features = ["client-tokio"]` to continue using `Client::new`; trait-surface consumers use `Client::new_with_deps`.
+- **Breaking: `Server::new` type signature now `Server::<R, S, F, Tm>::new`** — the `Server` struct gained type parameters for the pluggable backends. The tokio-default convenience constructor is now gated behind the `server-tokio` feature (was `server`). Migration: add `features = ["server-tokio"]` to continue using `Server::new`; trait-surface consumers use `Server::new_with_deps`.
+- **Breaking: `SubscriptionHandle` trait redesigned** — the previous `get_subscribers(&self, …) -> impl Future<Output = Vec<Subscriber>>` method has been replaced with `for_each_subscriber(&self, …, f: FnMut)` visitor pattern. This allows `EventPublisher::publish_event` to copy subscriber addresses into a stack buffer (`heapless::Vec<_, 16>`) instead of allocating per-event. Implementors of custom `SubscriptionHandle` must migrate.
+- **Breaking: `SubscriptionHandle` RPITIT futures no longer `+ Send`** — the `subscribe`, `unsubscribe`, and `for_each_subscriber` methods now return `impl Future<…>` without a `+ Send` bound. This enables single-threaded lock-free implementations on bare-metal targets, but means `SubscriptionHandle` trait objects cannot be held across `.await` points in multi-threaded executors. Direct usage with the default `Arc<RwLock<SubscriptionManager>>` is unaffected.
+- New optional dependency `dep:futures` (default-features-off) for `futures::select!` + `FusedFuture` plumbing — pulled in transitively by both `client` and `server` features.
+- `client::Error::Transport` adopts `#[error(transparent)]` Display delegation (the previous wrapping with `{:?}` debug-formatted the inner `TransportError`); user-facing error strings are now stable.
+- Subscribe-NACK reason strings normalized to `snake_case` for log consistency: `wrong_service_id`, `wrong_instance_id`, `wrong_major_version`, `no_endpoint_in_options`, `subscribers_per_group_full`, `event_groups_full`. Wire format is unchanged (NACK is signalled by `TTL=0`).
+
+### Fixed
+
+- **`server::EventPublisher::publish_event` no longer silently sends UNPROTECTED payloads on E2E protect failure** — counter exhaustion / key-lookup races etc. now surface as `Err(Error::E2e(_))` rather than logging and falling through (which had been emitting an unprotected message claiming an E2E-protected channel).
+- **SD `Subscribe` with mismatched `major_version` is now NACKed** — previously an Ack would be returned and the subscription registered, leaving the application stack to silently mis-decode incompatible-version traffic.
+- **`SocketManager::send` no longer panics on a dropped response oneshot** — user-supplied `Spawner` made this path reachable; failures now return `Err(Error::SocketClosedUnexpectedly)`.
+- **`client::Inner` request-queue overflow no longer drops control messages silently** — full queue now invokes `reject_with_capacity("request_queue")` on the rejected message, so callers see a typed `Err(Error::Capacity("request_queue"))` instead of a `RecvError` mapped to `Error::Shutdown`.
+- **Per-socket recv-error hot loop bounded** — `SocketManager`'s socket loop now closes after `MAX_CONSECUTIVE_RECV_ERRORS = 16` consecutive `recv_from` failures rather than spinning indefinitely on a permanently broken fd.
+- **`Client::send` fails fast on oversize messages** — pre-encode size check returns `Err(Error::Capacity("udp_buffer"))` for messages whose `required_size()` exceeds `UDP_BUFFER_SIZE`. Mirrors the existing `EventPublisher::publish_event` capacity guard.
+
+### Notes
+
+- **Crate version bumped to 0.8.0** — reflects the breaking changes above. Downstream `Cargo.toml` snippets in `README.md` were updated accordingly.
+
+### Test runner
+
+- `tests/client_server.rs` integration tests share the SD multicast port (30490) via `SO_REUSEPORT` and rely on Linux's reuseport hashing for traffic delivery. Under cargo's default parallel test runner cross-test Subscribe deliveries flake. The crate's `.config/nextest.toml` serializes `client_server` via the `serial-sd-port` test-group, so `cargo nextest run` (used by CI) gives stable results. For the legacy harness, pass `--test-threads=1`: `cargo test --test client_server -- --test-threads=1`.
 
 
 ## [0.6.0](https://github.com/luminartech/simple_someip/compare/v0.5.3...v0.6.0) - 2026-04-20
diff --git a/Cargo.lock b/Cargo.lock
index 3fd7af0..25f4daa 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -2,6 +2,24 @@
 # It is not intended for manual editing.
 version = 4
 
+[[package]]
+name = "bare_metal_client"
+version = "0.0.0"
+dependencies = [
+ "critical-section",
+ "simple-someip",
+ "tokio",
+]
+
+[[package]]
+name = "bare_metal_server"
+version = "0.0.0"
+dependencies = [
+ "critical-section",
+ "simple-someip",
+ "tokio",
+]
+
 [[package]]
 name = "byteorder"
 version = "1.5.0"
@@ -39,23 +57,134 @@ version = "2.4.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "19d374276b40fb8bbdee95aef7c7fa6b5316ec764510eb64b8dd0e2ed0d7e7f5"
 
+[[package]]
+name = "critical-section"
+version = "1.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "790eea4361631c5e7d22598ecd5723ff611904e3344ce8720784c93e3d83d40b"
+
 [[package]]
 name = "discovery_client"
 version = "0.0.0"
 dependencies = [
- "embedded-io",
+ "embedded-io 0.7.1",
  "simple-someip",
  "tokio",
  "tracing",
  "tracing-subscriber",
 ]
 
+[[package]]
+name = "embassy-sync"
+version = "0.6.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8d2c8cdff05a7a51ba0087489ea44b0b1d97a296ca6b1d6d1a33ea7423d34049"
+dependencies = [
+ "cfg-if",
+ "critical-section",
+ "embedded-io-async",
+ "futures-sink",
+ "futures-util",
+ "heapless 0.8.0",
+]
+
+[[package]]
+name = "embedded-io"
+version = "0.6.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "edd0f118536f44f5ccd48bcb8b111bdc3de888b58c74639dfb034a357d0f206d"
+
 [[package]]
 name = "embedded-io"
 version = "0.7.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "9eb1aa714776b75c7e67e1da744b81a129b3ff919c8712b5e1b32252c1f07cc7"
 
+[[package]]
+name = "embedded-io-async"
+version = "0.6.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3ff09972d4073aa8c299395be75161d582e7629cd663171d62af73c8d50dba3f"
+dependencies = [
+ "embedded-io 0.6.1",
+]
+
+[[package]]
+name = "futures"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8b147ee9d1f6d097cef9ce628cd2ee62288d963e16fb287bd9286455b241382d"
+dependencies = [
+ "futures-channel",
+ "futures-core",
+ "futures-io",
+ "futures-sink",
+ "futures-task",
+ "futures-util",
+]
+
+[[package]]
+name = "futures-channel"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "07bbe89c50d7a535e539b8c17bc0b49bdb77747034daa8087407d655f3f7cc1d"
+dependencies = [
+ "futures-core",
+ "futures-sink",
+]
+
+[[package]]
+name = "futures-core"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7e3450815272ef58cec6d564423f6e755e25379b217b0bc688e295ba24df6b1d"
+
+[[package]]
+name = "futures-io"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cecba35d7ad927e23624b22ad55235f2239cfa44fd10428eecbeba6d6a717718"
+
+[[package]]
+name = "futures-macro"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e835b70203e41293343137df5c0664546da5745f82ec9b84d40be8336958447b"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn",
+]
+
+[[package]]
+name = "futures-sink"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c39754e157331b013978ec91992bde1ac089843443c49cbc7f46150b0fad0893"
+
+[[package]]
+name = "futures-task"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "037711b3d59c33004d3856fbdc83b99d4ff37a24768fa1be9ce3538a1cde4393"
+
+[[package]]
+name = "futures-util"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "389ca41296e6190b48053de0321d02a77f32f8a5d2461dd38762c0593805c6d6"
+dependencies = [
+ "futures-channel",
+ "futures-core",
+ "futures-io",
+ "futures-macro",
+ "futures-sink",
+ "futures-task",
+ "memchr",
+ "pin-project-lite",
+ "slab",
+]
+
 [[package]]
 name = "hash32"
 version = "0.3.1"
@@ -65,6 +194,16 @@ dependencies = [
  "byteorder",
 ]
 
+[[package]]
+name = "heapless"
+version = "0.8.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0bfb9eb618601c89945a70e254898da93b13be0388091d42117462b265bb3fad"
+dependencies = [
+ "hash32",
+ "stable_deref_trait",
+]
+
 [[package]]
 name = "heapless"
 version = "0.9.2"
@@ -93,6 +232,12 @@ version = "0.4.29"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "5e5032e24019045c762d3c0f28f5b6b8bbf38563a65908389bf7978758920897"
 
+[[package]]
+name = "memchr"
+version = "2.8.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f8ca58f447f06ed17d5fc4043ce1b10dd205e060fb3ce5b979b8ed8e59ff3f79"
+
 [[package]]
 name = "mio"
 version = "1.2.0"
@@ -154,11 +299,14 @@ dependencies = [
 
 [[package]]
 name = "simple-someip"
-version = "0.7.0"
+version = "0.8.0"
 dependencies = [
  "crc",
- "embedded-io",
- "heapless",
+ "critical-section",
+ "embassy-sync",
+ "embedded-io 0.7.1",
+ "futures",
+ "heapless 0.9.2",
  "socket2 0.5.10",
  "thiserror",
  "tokio",
@@ -166,6 +314,12 @@ dependencies = [
  "tracing-subscriber",
 ]
 
+[[package]]
+name = "slab"
+version = "0.4.12"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0c790de23124f9ab44544d7ac05d60440adc586479ce501c1d6d7da3cd8c9cf5"
+
 [[package]]
 name = "smallvec"
 version = "1.15.1"
diff --git a/Cargo.toml b/Cargo.toml
index 45bde7f..bb25e8f 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -1,9 +1,15 @@
 [workspace]
-members = [".", "examples/discovery_client", "examples/client_server"]
+members = [
+    ".",
+    "examples/bare_metal_client",
+    "examples/bare_metal_server",
+    "examples/client_server",
+    "examples/discovery_client",
+]
 
 [package]
 name = "simple-someip"
-version = "0.7.0"
+version = "0.8.0"
 edition = "2024"
 license = "MIT OR Apache-2.0"
 description = "A lightweight SOME/IP serialization and communication library"
@@ -11,7 +17,21 @@ repository = "https://github.com/luminartech/simple_someip"
 
 [dependencies]
 crc = "3.4"
+# embassy-sync provides no_std-compatible bounded channels used as the
+# channel backend when the `bare_metal` feature is active. The
+# `critical-section` and `portable-atomic` deps ship with embassy-sync and
+# are satisfiable on the Infineon AURIX TriCore target (HighTec toolchain)
+# per the bare_metal_plan_v2 TriCore delta.
+embassy-sync = { version = "0.6", optional = true }
 embedded-io = { version = "0.7" }
+# `futures` pulls in `futures-util` which provides the executor-agnostic
+# `select!` macro and `FutureExt::fuse` / `pin_mut!` helpers — used by
+# the client/server event loops in place of `tokio::select!`. Default
+# features disabled so we only pull in the parts we use.
+futures = { version = "0.3", default-features = false, features = [
+    "async-await",
+    "std",
+], optional = true }
 heapless = "0.9"
 socket2 = { version = "0.5", optional = true, features = ["all"] }
 thiserror = { version = "2", default-features = false }
@@ -25,15 +45,82 @@ tokio = { version = "1", default-features = false, features = [
 tracing = { version = "0.1", default-features = false }
 
 [dev-dependencies]
-tokio = { version = "1", features = ["rt-multi-thread"] }
+# `critical-section/std` provides a host-platform impl so integration
+# tests that exercise `EmbassySyncChannels` (which depends on
+# `embassy-sync`'s critical-section calls) can link on host. This is
+# test-only; firmware builds supply their own platform impl.
+critical-section = { version = "1", features = ["std"] }
+tokio = { version = "1", features = ["rt-multi-thread", "macros", "time"] }
 tracing-subscriber = "0.3"
 
 [features]
 default = ["std"]
 std = ["embedded-io/std", "thiserror/std", "tracing/std"]
-client = ["std", "dep:tokio", "dep:socket2"]
-server = ["std", "dep:tokio", "dep:socket2"]
+# Feature split: `client` exposes the protocol/trait-surface client
+# (no tokio, no socket2); `client-tokio` layers the tokio + socket2
+# convenience defaults on top. Consumers of the bare-metal trait surface
+# enable `client` only (and supply their own `Spawner` / `Timer` /
+# `ChannelFactory` / `TransportFactory` impls). Consumers who want the
+# `Client::new` shortcut (defaulting to `TokioSpawner` / `TokioTimer` /
+# `TokioChannels` / `TokioTransport`) enable `client-tokio`.
+client = ["std", "dep:futures"]
+client-tokio = ["client", "dep:tokio", "dep:socket2"]
+# Feature split (matches the client side): `server` exposes the
+# trait-surface server (no tokio, no socket2). The engine itself uses
+# `futures::select!` so `dep:futures` lives here. `server-tokio` adds
+# the tokio + socket2 convenience defaults (`Server::new`,
+# `Server::new_with_loopback`, `Server::new_passive`), bringing
+# `Arc<Mutex<E2ERegistry>>` / `Arc<RwLock<SubscriptionManager>>` /
+# / `TokioTransport` / `TokioTimer` defaults into scope.
+server = ["std", "dep:futures"]
+server-tokio = ["server", "dep:tokio", "dep:socket2"]
+# Marks a build as intended for bare-metal / no_std consumption.
+# Activates embassy-sync as the channel backend, the `static_channels`
+# module, `AtomicInterfaceHandle`, and `StaticE2EHandle`.
+#
+# **To demonstrate the bare-metal trait surface, use the
+# `examples/bare_metal_client` / `examples/bare_metal_server` workspace
+# members directly:** `cargo build -p bare_metal_client`. Those workspace
+# members depend on `simple-someip` with `default-features = false,
+# features = ["bare_metal", "client"]` / `["bare_metal", "server"]`,
+# so they exercise the actual bare-metal configuration.
+#
+# Enabling `bare_metal` on its own does NOT make the crate
+# bare-metal-complete: the `client` and `server` feature paths still
+# require a user-provided `Spawner` impl and `TransportFactory` impl.
+# With `bare_metal` enabled, `static_channels` and `define_static_channels!`
+# are available as the no-alloc `ChannelFactory` impl.
+bare_metal = ["dep:embassy-sync"]
+# Heap-backed embassy-sync channel backend (`EmbassySyncChannels`).
+# Implies `bare_metal` and pulls in `alloc` for `Arc<Channel<...>>`.
+# Useful for tests or early prototypes before sizing static pools.
+embassy_channels = ["bare_metal"]
 
 [[test]]
 name = "client_server"
-required-features = ["client", "server"]
+required-features = ["client-tokio", "server-tokio"]
+
+[[test]]
+name = "bare_metal_client"
+required-features = ["client", "bare_metal"]
+
+[[test]]
+name = "bare_metal_client_local"
+required-features = ["client", "bare_metal"]
+
+[[test]]
+name = "static_channels_alloc_witness"
+required-features = ["client", "bare_metal"]
+
+[[test]]
+name = "no_alloc_witness"
+required-features = ["client", "bare_metal"]
+harness = false
+
+[[test]]
+name = "bare_metal_server"
+required-features = ["server", "bare_metal"]
+
+[[test]]
+name = "bare_metal_e2e"
+required-features = ["client", "server", "bare_metal"]
diff --git a/README.md b/README.md
index 1f827a3..a8ef040 100644
--- a/README.md
+++ b/README.md
@@ -10,9 +10,10 @@ The library supports both `std` and `no_std` environments, making it suitable fo
 
 ## Features
 
-- **`no_std` compatible** — the `protocol`, `traits`, and `e2e` modules work without the standard library
+- **`no_std` compatible** — `protocol`, `traits`, `transport`, and `e2e` modules work without the standard library
 - **Service Discovery** — SD entry/option encoding and decoding via fixed-capacity `heapless` collections (no heap allocation)
 - **End-to-End protection** — Profile 4 (CRC-32) and Profile 5 (CRC-16) with zero-allocation APIs
+- **Executor-agnostic transport traits** — `TransportSocket`, `TransportFactory`, `Timer`, `Spawner` (default `tokio` impls behind feature gates)
 - **Async client and server** — tokio-based, gated behind optional feature flags
 - **`embedded-io`** traits for serialization — abstracts over `std::io::Read`/`Write`
 
@@ -20,9 +21,11 @@ The library supports both `std` and `no_std` environments, making it suitable fo
 
 - `protocol` — Wire format layer: SOME/IP header, `MessageId`, `MessageType`, `ReturnCode`, SD entries/options
 - `traits` — `WireFormat` and `PayloadWireFormat` traits for custom message types
+- `transport` — Executor-agnostic UDP socket / factory / timer / spawner traits (no_std-compatible)
 - `e2e` — End-to-End protection profiles (always available, no heap allocation)
-- `client` — High-level async tokio client (requires `feature = "client"`)
-- `server` — Async tokio server with SD announcements and event publishing (requires `feature = "server"`)
+- `tokio_transport` — Default `std + tokio` impls of the transport traits (requires `feature = "client-tokio"` or `feature = "server-tokio"`)
+- `client` — High-level async client trait surface (requires `feature = "client"`; add `client-tokio` for the `Client::new` convenience constructor)
+- `server` — Async server with SD announcements and event publishing (requires `feature = "server"`; add `server-tokio` for the `Server::new` convenience constructor)
 
 ## Usage
 
@@ -31,19 +34,19 @@ Add to your `Cargo.toml`:
 ```toml
 [dependencies]
 # Default — includes std, thiserror, and tracing
-simple-someip = "0.5"
+simple-someip = "0.8"
 
-# no_std only (protocol/E2E/traits, no heap allocation)
-simple-someip = { version = "0.5", default-features = false }
+# no_std only (protocol/transport/E2E/traits, no heap allocation)
+simple-someip = { version = "0.8", default-features = false }
 
-# Client only
-simple-someip = { version = "0.5", features = ["client"] }
+# Client only (with tokio convenience constructors)
+simple-someip = { version = "0.8", features = ["client-tokio"] }
 
-# Server only
-simple-someip = { version = "0.5", features = ["server"] }
+# Server only (with tokio convenience constructors)
+simple-someip = { version = "0.8", features = ["server-tokio"] }
 
 # Both client and server
-simple-someip = { version = "0.5", features = ["client", "server"] }
+simple-someip = { version = "0.8", features = ["client-tokio", "server-tokio"] }
 ```
 
 ### Feature flags
@@ -51,13 +54,19 @@ simple-someip = { version = "0.5", features = ["client", "server"] }
 | Feature | Default | Description |
 |---------|---------|-------------|
 | `std` | **yes** | Enables `thiserror`, `tracing`, and `embedded-io/std` |
-| `client` | no | Async tokio client; implies `std` + tokio + socket2 |
-| `server` | no | Async tokio server; implies `std` + tokio + socket2 |
+| `client` | no | Client trait surface; implies `std` + futures (no tokio) |
+| `client-tokio` | no | Adds `Client::new` / `TokioSpawner` / `TokioTransport` defaults; implies `client` + tokio + socket2 |
+| `server` | no | Server trait surface; implies `std` + futures (no tokio) |
+| `server-tokio` | no | Adds `Server::new` / `TokioTimer` / `TokioTransport` defaults; implies `server` + tokio + socket2 |
+| `bare_metal` | no | Activates embassy-sync, no-alloc `static_channels` module, `AtomicInterfaceHandle`, and `StaticE2EHandle`. See `examples/bare_metal_client` and `examples/bare_metal_server`; verify with `cargo build -p bare_metal_client` (NOT `cargo build --workspace`, which can unify features). |
+| `embassy_channels` | no | Heap-backed `EmbassySyncChannels` (implies `bare_metal` + `alloc`). Useful for tests before sizing static pools. |
 
-By default the crate enables `std`. To use in a `no_std` environment (e.g., embedded targets), disable default features with `default-features = false`. In that mode only the `protocol`, `traits`, and `e2e` modules are available, and the crate compiles in `no_std` mode. Most applications only need one of `client` or `server`.
+By default the crate enables `std`. To use in a `no_std` environment (e.g., embedded targets), disable default features with `default-features = false`. In that mode the `protocol`, `traits`, `transport`, and `e2e` modules are available; `client` / `server` (and their `tokio_transport` backend) are not. Most applications only need one of `client` or `server`.
 
 ## Quick Start
 
+These examples require the `client-tokio` and `server-tokio` features respectively.
+
 ### Client
 
 ```rust
@@ -66,9 +75,17 @@ use std::net::Ipv4Addr;
 
 #[tokio::main]
 async fn main() {
-    // Client::new returns a (Client, ClientUpdates) pair.
-    // Client is Clone-able and can be shared across tasks.
-    let (client, mut updates) = Client::<RawPayload>::new(Ipv4Addr::new(192, 168, 1, 100));
+    // Client::new returns a Clone-able handle, an update stream, and
+    // the run-loop future. The future must be actively driven — either
+    // spawned on the runtime as shown below, or awaited alongside your
+    // own work in a `tokio::select!`. If the future is never polled,
+    // Client method calls that send commands over the control channel
+    // will hang indefinitely waiting on their oneshot response.
+    // `Error::Shutdown` is returned only once the run-loop future has
+    // been dropped or its task cancelled.
+    let (client, mut updates, run) =
+        Client::<RawPayload, _, _, _>::new(Ipv4Addr::new(192, 168, 1, 100));
+    let _run_task = tokio::spawn(run);
 
     // Bind the SD multicast socket to discover services
     client.bind_discovery().await.unwrap();
@@ -95,12 +112,18 @@ use std::net::Ipv4Addr;
 async fn main() -> Result<(), Box<dyn std::error::Error>> {
     let config = ServerConfig::new(Ipv4Addr::new(192, 168, 1, 200), 30500, 0x1234, 1);
     let mut server = Server::new(config).await?;
-    server.start_announcing()?;
+    let announce_handle = tokio::spawn(server.announcement_loop()?);
 
     let publisher = server.publisher();
-    tokio::spawn(async move { server.run().await });
+    let run_handle = tokio::spawn(async move { server.run().await });
+
+    // Publish events to subscribers, e.g.:
+    // publisher.publish_event(0x1234, 1, 0x01, &message).await?;
 
-    // Publish events to subscribers...
+    tokio::select! {
+        res = announce_handle => eprintln!("announcement loop exited unexpectedly: {res:?}"),
+        res = run_handle      => eprintln!("server run loop exited: {res:?}"),
+    }
     Ok(())
 }
 ```
diff --git a/examples/bare_metal_client/Cargo.toml b/examples/bare_metal_client/Cargo.toml
new file mode 100644
index 0000000..844497a
--- /dev/null
+++ b/examples/bare_metal_client/Cargo.toml
@@ -0,0 +1,17 @@
+[package]
+name = "bare_metal_client"
+version = "0.0.0"
+edition = "2024"
+publish = false
+
+# `simple-someip` is compiled with `default-features = false,
+# features = ["client", "bare_metal"]` — no tokio, no socket2 pulled in
+# by the crate itself. The example binary adds tokio only for its own
+# executor and mock driver; real firmware would use embassy_executor or
+# a similar bare-metal async runtime instead.
+[dependencies]
+simple-someip = { path = "../..", default-features = false, features = ["client", "bare_metal"] }
+tokio = { version = "1", features = ["macros", "rt-multi-thread", "time"] }
+# Provides the host platform critical-section implementation required by
+# embassy-sync (pulled in via simple-someip's bare_metal feature).
+critical-section = { version = "1", features = ["std"] }
diff --git a/examples/bare_metal_client/src/main.rs b/examples/bare_metal_client/src/main.rs
new file mode 100644
index 0000000..db910fb
--- /dev/null
+++ b/examples/bare_metal_client/src/main.rs
@@ -0,0 +1,305 @@
+//! Host-side demonstration of [`Client::new_with_deps`] with a
+//! static-pool no-alloc [`ChannelFactory`].
+//!
+//! # What this example shows
+//!
+//! `simple-someip` is compiled with
+//! `default-features = false, features = ["client", "bare_metal"]` —
+//! no tokio, no socket2 pulled in by *the crate itself*. The example
+//! binary adds tokio only for its own executor and mock driver; real
+//! firmware would use `embassy_executor` (or any bare-metal async
+//! runtime) instead.
+//!
+//! Building or running this example in isolation proves that the
+//! bare-metal API compiles under exactly the feature set a firmware
+//! consumer would use:
+//!
+//! ```text
+//! cargo build -p bare_metal_client
+//! cargo run  -p bare_metal_client
+//! ```
+//!
+//! # Patterns demonstrated
+//!
+//! | Pattern | This example | Firmware replacement |
+//! |---------|-------------|----------------------|
+//! | Channel factory | `BareMetalChannels` via `define_static_channels!` | same macro, sized to your HWM |
+//! | Transport | `MockFactory` / `MockSocket` | `embassy_net`, smoltcp, custom Ethernet ISR |
+//! | Timer | `MockTimer` using `tokio::time::sleep` | `embassy_time::Timer::after` |
+//! | Task spawner | `TokioBackedSpawner` | `embassy_executor::Spawner` |
+//! | Lock handles | `Arc<Mutex<_>>` / `Arc<RwLock<_>>` | stack-allocated handles (see below) |
+//!
+//! # What is not yet demonstrated
+//!
+//! The `E2ERegistry` and interface handles still use heap-allocated
+//! `Arc<Mutex<_>>` / `Arc<RwLock<_>>` wrappers. A future verification
+//! pass will replace these with stack-allocated alternatives and confirm
+//! zero heap allocation after `Client::new_with_deps` returns.
+//!
+//! [`Client::new_with_deps`]: simple_someip::Client::new_with_deps
+//! [`ChannelFactory`]: simple_someip::transport::ChannelFactory
+
+use core::future::Future;
+use core::net::{Ipv4Addr, SocketAddrV4};
+use core::pin::Pin;
+use core::task::{Context, Poll};
+use core::time::Duration;
+
+use std::collections::VecDeque;
+use std::sync::{Arc, Mutex};
+
+use simple_someip::client::Error as ClientError;
+use simple_someip::client::{ClientUpdate, ControlMessage, ReceivedMessage, SendMessage};
+use simple_someip::define_static_channels;
+use simple_someip::e2e::E2ERegistry;
+use simple_someip::protocol::sd::RebootFlag;
+use simple_someip::transport::{
+    ReceivedDatagram, SocketOptions, Spawner, Timer, TransportError, TransportFactory,
+    TransportSocket,
+};
+use simple_someip::{Client, ClientDeps, RawPayload};
+
+// ── Static-pool channel factory ───────────────────────────────────────
+//
+// Pool sizes are sized to a modest single-service workload. Production
+// firmware should size each pool to the workload's high-water mark
+// (maximum concurrent in-flight requests / subscriptions).
+
+define_static_channels! {
+    name: BareMetalChannels,
+    oneshot: [
+        (Result<(), ClientError>, 8),
+        (Result<RawPayload, ClientError>, 4),
+        (Result<RebootFlag, ClientError>, 4),
+    ],
+    bounded: [
+        ((ControlMessage<RawPayload, BareMetalChannels>, 4), 1),
+        ((SendMessage<RawPayload, BareMetalChannels>, 16), 4),
+        ((Result<ReceivedMessage<RawPayload>, ClientError>, 16), 4),
+    ],
+    unbounded: [
+        (ClientUpdate<RawPayload>, 1),
+    ],
+}
+
+// ── Mock transport ────────────────────────────────────────────────────
+//
+// Two queues simulate the network. A real firmware transport drives
+// these from a network driver ISR instead of an in-process VecDeque.
+
+#[derive(Default)]
+struct MockPipe {
+    sent: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound_waker: Mutex<Option<core::task::Waker>>,
+}
+
+#[derive(Clone)]
+struct MockFactory {
+    pipe: Arc<MockPipe>,
+    next_port: Arc<Mutex<u16>>,
+}
+
+impl TransportFactory for MockFactory {
+    type Socket = MockSocket;
+    type BindFuture<'a> =
+        core::pin::Pin<Box<dyn Future<Output = Result<Self::Socket, TransportError>> + Send + 'a>>;
+
+    fn bind<'a>(&'a self, addr: SocketAddrV4, _options: &'a SocketOptions) -> Self::BindFuture<'a> {
+        let pipe = Arc::clone(&self.pipe);
+        let port = if addr.port() == 0 {
+            let mut p = self.next_port.lock().unwrap();
+            *p = p.saturating_add(1);
+            30000u16.saturating_add(*p)
+        } else {
+            addr.port()
+        };
+        let local = SocketAddrV4::new(*addr.ip(), port);
+        Box::pin(async move { Ok(MockSocket { pipe, local }) })
+    }
+}
+
+struct MockSocket {
+    pipe: Arc<MockPipe>,
+    local: SocketAddrV4,
+}
+
+struct MockSendFut {
+    pipe: Arc<MockPipe>,
+    bytes: Option<Vec<u8>>,
+    target: SocketAddrV4,
+}
+
+impl Future for MockSendFut {
+    type Output = Result<(), TransportError>;
+
+    fn poll(self: Pin<&mut Self>, _cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        if let Some(bytes) = me.bytes.take() {
+            me.pipe.sent.lock().unwrap().push_back((bytes, me.target));
+        }
+        Poll::Ready(Ok(()))
+    }
+}
+
+struct MockRecvFut<'a> {
+    pipe: Arc<MockPipe>,
+    buf: &'a mut [u8],
+}
+
+impl Future for MockRecvFut<'_> {
+    type Output = Result<ReceivedDatagram, TransportError>;
+
+    #[allow(clippy::single_match_else)]
+    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        match me.pipe.inbound.lock().unwrap().pop_front() {
+            Some((bytes, source)) => {
+                let n = bytes.len().min(me.buf.len());
+                me.buf[..n].copy_from_slice(&bytes[..n]);
+                Poll::Ready(Ok(ReceivedDatagram {
+                    bytes_received: n,
+                    source,
+                    truncated: n < bytes.len(),
+                }))
+            }
+            // No datagram — register the waker on the pipe and park.
+            // A real bare-metal impl registers the waker on the network
+            // driver's RX-ready interrupt instead.
+            None => {
+                *me.pipe.inbound_waker.lock().unwrap() = Some(cx.waker().clone());
+                if let Some((bytes, source)) = me.pipe.inbound.lock().unwrap().pop_front() {
+                    let n = bytes.len().min(me.buf.len());
+                    me.buf[..n].copy_from_slice(&bytes[..n]);
+                    return Poll::Ready(Ok(ReceivedDatagram {
+                        bytes_received: n,
+                        source,
+                        truncated: n < bytes.len(),
+                    }));
+                }
+                Poll::Pending
+            }
+        }
+    }
+}
+
+impl TransportSocket for MockSocket {
+    type SendFuture<'a> = MockSendFut;
+    type RecvFuture<'a> = MockRecvFut<'a>;
+
+    fn send_to<'a>(&'a self, buf: &'a [u8], target: SocketAddrV4) -> MockSendFut {
+        MockSendFut {
+            pipe: Arc::clone(&self.pipe),
+            bytes: Some(buf.to_vec()),
+            target,
+        }
+    }
+
+    fn recv_from<'a>(&'a self, buf: &'a mut [u8]) -> MockRecvFut<'a> {
+        MockRecvFut {
+            pipe: Arc::clone(&self.pipe),
+            buf,
+        }
+    }
+
+    fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+        Ok(self.local)
+    }
+
+    fn join_multicast_v4(&self, _group: Ipv4Addr, _iface: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+
+    fn leave_multicast_v4(&self, _group: Ipv4Addr, _iface: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+}
+
+// ── Mock Timer ────────────────────────────────────────────────────────
+//
+// Honors `duration` per the `Timer` trait contract (MAY overshoot, MUST
+// NOT undershoot). Real firmware replaces this with e.g.
+// `embassy_time::Timer::after(d).await`.
+
+struct MockTimer;
+
+impl Timer for MockTimer {
+    type SleepFuture<'a> = core::pin::Pin<Box<dyn Future<Output = ()> + Send + 'a>>;
+    fn sleep(&self, duration: Duration) -> Self::SleepFuture<'_> {
+        Box::pin(async move {
+            tokio::time::sleep(duration).await;
+        })
+    }
+}
+
+// ── Spawner ───────────────────────────────────────────────────────────
+//
+// Wraps tokio::spawn for this example. Real firmware wraps
+// `embassy_executor::Spawner::spawn` or equivalent. The Spawner trait
+// contract requires submitted futures to be polled to completion —
+// never drop them without polling.
+
+struct TokioBackedSpawner;
+
+impl Spawner for TokioBackedSpawner {
+    fn spawn(&self, future: impl Future<Output = ()> + Send + 'static) {
+        drop(tokio::spawn(future));
+    }
+}
+
+// ── Main ──────────────────────────────────────────────────────────────
+
+#[tokio::main]
+async fn main() {
+    let pipe = Arc::new(MockPipe::default());
+    let factory = MockFactory {
+        pipe: Arc::clone(&pipe),
+        next_port: Arc::new(Mutex::new(0)),
+    };
+
+    // std Arc/Mutex/RwLock are sufficient here — they implement the
+    // E2ERegistryHandle / InterfaceHandle lock-handle traits and are
+    // gated by `feature = "std"`, not by `client-tokio`. A future
+    // no-alloc port replaces these with stack-allocated handles.
+    let e2e: Arc<Mutex<E2ERegistry>> = Arc::new(Mutex::new(E2ERegistry::new()));
+    let iface: Arc<std::sync::RwLock<Ipv4Addr>> =
+        Arc::new(std::sync::RwLock::new(Ipv4Addr::LOCALHOST));
+
+    let (client, _updates, run_fut) = Client::<
+        RawPayload,
+        Arc<Mutex<E2ERegistry>>,
+        Arc<std::sync::RwLock<Ipv4Addr>>,
+        BareMetalChannels,
+    >::new_with_deps(
+        ClientDeps {
+            factory,
+            spawner: TokioBackedSpawner,
+            timer: MockTimer,
+            e2e_registry: e2e,
+            interface: iface,
+        },
+        false, // multicast_loopback
+    );
+    // `_updates` is a `ClientUpdates` receiver. In production, poll it
+    // for `ClientUpdate` events: discovery changes, unicast replies,
+    // reboot notifications, and errors.
+
+    // The run future is Send + 'static, so it can be handed to any
+    // executor — tokio here, embassy_executor on real firmware.
+    let run_handle = tokio::spawn(run_fut);
+
+    // Client is live. Sanity-check the interface address.
+    assert_eq!(client.interface(), Ipv4Addr::LOCALHOST);
+
+    // Tear down: drop client first (closes the control channel), then
+    // abort and await cancellation.
+    drop(client);
+    run_handle.abort();
+    let _ = run_handle.await;
+
+    println!(
+        "bare-metal example: Client::new_with_deps with BareMetalChannels (define_static_channels!) \
+         compiled and ran successfully under features=[client, bare_metal] — \
+         no tokio / socket2 from simple-someip itself."
+    );
+}
diff --git a/examples/bare_metal_server/Cargo.toml b/examples/bare_metal_server/Cargo.toml
new file mode 100644
index 0000000..4847af6
--- /dev/null
+++ b/examples/bare_metal_server/Cargo.toml
@@ -0,0 +1,17 @@
+[package]
+name = "bare_metal_server"
+version = "0.0.0"
+edition = "2024"
+publish = false
+
+# `simple-someip` is compiled with `default-features = false,
+# features = ["server", "bare_metal"]` — no tokio, no socket2 pulled in
+# by the crate itself. The example binary adds tokio only for its own
+# executor and mock driver; real firmware would use embassy_executor or
+# a similar bare-metal async runtime instead.
+[dependencies]
+simple-someip = { path = "../..", default-features = false, features = ["server", "bare_metal"] }
+tokio = { version = "1", features = ["macros", "rt-multi-thread", "time"] }
+# Provides the host platform critical-section implementation required by
+# embassy-sync (pulled in via simple-someip's bare_metal feature).
+critical-section = { version = "1", features = ["std"] }
diff --git a/examples/bare_metal_server/src/main.rs b/examples/bare_metal_server/src/main.rs
new file mode 100644
index 0000000..db0037f
--- /dev/null
+++ b/examples/bare_metal_server/src/main.rs
@@ -0,0 +1,347 @@
+//! Host-side demonstration of [`Server::new_with_deps`] on a no-tokio,
+//! no-socket2 build.
+//!
+//! # What this example shows
+//!
+//! `simple-someip` is compiled with
+//! `default-features = false, features = ["server", "bare_metal"]` —
+//! no tokio, no socket2 pulled in by *the crate itself*. The example
+//! binary adds tokio only for its own executor and mock driver; real
+//! firmware would use `embassy_executor` (or any bare-metal async
+//! runtime) instead.
+//!
+//! Building or running this example in isolation proves that the
+//! bare-metal server API compiles under exactly the feature set a
+//! firmware consumer would use:
+//!
+//! ```text
+//! cargo build -p bare_metal_server
+//! cargo run  -p bare_metal_server
+//! ```
+//!
+//! # Patterns demonstrated
+//!
+//! | Pattern | This example | Firmware replacement |
+//! |---------|-------------|----------------------|
+//! | Transport | `MockFactory` / `MockSocket` | `embassy_net`, smoltcp, custom Ethernet ISR |
+//! | Timer | `MockTimer` using `tokio::time::sleep` | `embassy_time::Timer::after` |
+//! | Subscription table | `MockSubscriptions` | `heapless`-backed table behind a CS mutex |
+//! | Lock handle | `Arc<Mutex<E2ERegistry>>` | stack-allocated handle (see below) |
+//!
+//! # What is not yet demonstrated
+//!
+//! The `E2ERegistry` handle still uses a heap-allocated `Arc<Mutex<_>>`.
+//! A future verification pass will replace this with a stack-allocated
+//! alternative and confirm zero heap allocation after
+//! `Server::new_with_deps` returns.
+//!
+//! [`Server::new_with_deps`]: simple_someip::Server::new_with_deps
+
+use core::future::Future;
+use core::net::{Ipv4Addr, SocketAddrV4};
+use core::pin::Pin;
+use core::task::{Context, Poll};
+use core::time::Duration;
+
+use std::collections::VecDeque;
+use std::sync::{Arc, Mutex};
+use std::vec::Vec;
+
+use simple_someip::e2e::E2ERegistry;
+use simple_someip::server::{ServerConfig, SubscribeError, Subscriber, SubscriptionHandle};
+use simple_someip::transport::{
+    ReceivedDatagram, SocketOptions, Timer, TransportError, TransportFactory, TransportSocket,
+};
+use simple_someip::{Server, ServerDeps};
+
+// ── Mock transport ────────────────────────────────────────────────────
+//
+// Two queues simulate the network. A real firmware transport drives
+// these from a network driver ISR instead of an in-process VecDeque.
+
+#[derive(Default)]
+struct MockPipe {
+    sent: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound_waker: Mutex<Option<core::task::Waker>>,
+}
+
+#[derive(Clone)]
+struct MockFactory {
+    pipe: Arc<MockPipe>,
+    next_port: Arc<Mutex<u16>>,
+}
+
+impl TransportFactory for MockFactory {
+    type Socket = MockSocket;
+    type BindFuture<'a> =
+        core::pin::Pin<Box<dyn Future<Output = Result<Self::Socket, TransportError>> + Send + 'a>>;
+
+    fn bind<'a>(&'a self, addr: SocketAddrV4, _options: &'a SocketOptions) -> Self::BindFuture<'a> {
+        let pipe = Arc::clone(&self.pipe);
+        let port = if addr.port() == 0 {
+            let mut p = self.next_port.lock().unwrap();
+            *p = p.saturating_add(1);
+            40000u16.saturating_add(*p)
+        } else {
+            addr.port()
+        };
+        let local = SocketAddrV4::new(*addr.ip(), port);
+        Box::pin(async move { Ok(MockSocket { pipe, local }) })
+    }
+}
+
+struct MockSocket {
+    pipe: Arc<MockPipe>,
+    local: SocketAddrV4,
+}
+
+struct MockSendFut {
+    pipe: Arc<MockPipe>,
+    bytes: Option<Vec<u8>>,
+    target: SocketAddrV4,
+}
+
+impl Future for MockSendFut {
+    type Output = Result<(), TransportError>;
+
+    fn poll(self: Pin<&mut Self>, _cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        if let Some(bytes) = me.bytes.take() {
+            me.pipe.sent.lock().unwrap().push_back((bytes, me.target));
+        }
+        Poll::Ready(Ok(()))
+    }
+}
+
+struct MockRecvFut<'a> {
+    pipe: Arc<MockPipe>,
+    buf: &'a mut [u8],
+}
+
+impl Future for MockRecvFut<'_> {
+    type Output = Result<ReceivedDatagram, TransportError>;
+
+    #[allow(clippy::single_match_else)]
+    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        match me.pipe.inbound.lock().unwrap().pop_front() {
+            Some((bytes, source)) => {
+                let n = bytes.len().min(me.buf.len());
+                me.buf[..n].copy_from_slice(&bytes[..n]);
+                Poll::Ready(Ok(ReceivedDatagram {
+                    bytes_received: n,
+                    source,
+                    truncated: n < bytes.len(),
+                }))
+            }
+            // No datagram — register the waker on the pipe and park.
+            // A real bare-metal impl registers the waker on the network
+            // driver's RX-ready interrupt instead.
+            None => {
+                *me.pipe.inbound_waker.lock().unwrap() = Some(cx.waker().clone());
+                if let Some((bytes, source)) = me.pipe.inbound.lock().unwrap().pop_front() {
+                    let n = bytes.len().min(me.buf.len());
+                    me.buf[..n].copy_from_slice(&bytes[..n]);
+                    return Poll::Ready(Ok(ReceivedDatagram {
+                        bytes_received: n,
+                        source,
+                        truncated: n < bytes.len(),
+                    }));
+                }
+                Poll::Pending
+            }
+        }
+    }
+}
+
+impl TransportSocket for MockSocket {
+    type SendFuture<'a> = MockSendFut;
+    type RecvFuture<'a> = MockRecvFut<'a>;
+
+    fn send_to<'a>(&'a self, buf: &'a [u8], target: SocketAddrV4) -> MockSendFut {
+        MockSendFut {
+            pipe: Arc::clone(&self.pipe),
+            bytes: Some(buf.to_vec()),
+            target,
+        }
+    }
+
+    fn recv_from<'a>(&'a self, buf: &'a mut [u8]) -> MockRecvFut<'a> {
+        MockRecvFut {
+            pipe: Arc::clone(&self.pipe),
+            buf,
+        }
+    }
+
+    fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+        Ok(self.local)
+    }
+
+    fn join_multicast_v4(&self, _group: Ipv4Addr, _iface: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+
+    fn leave_multicast_v4(&self, _group: Ipv4Addr, _iface: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+}
+
+// ── Mock Timer ────────────────────────────────────────────────────────
+//
+// Honors `duration` per the `Timer` trait contract. Real
+// firmware replaces this with e.g. `embassy_time::Timer::after(d).await`.
+
+#[derive(Clone)]
+struct MockTimer;
+
+impl Timer for MockTimer {
+    type SleepFuture<'a> = core::pin::Pin<Box<dyn Future<Output = ()> + Send + 'a>>;
+    fn sleep(&self, duration: Duration) -> Self::SleepFuture<'_> {
+        Box::pin(async move {
+            tokio::time::sleep(duration).await;
+        })
+    }
+}
+
+// ── Mock SubscriptionHandle ───────────────────────────────────────────
+//
+// On `server-tokio`, `Arc<RwLock<SubscriptionManager>>` is the built-in
+// impl. Bare-metal callers supply their own. A real firmware impl would
+// back this with a `critical_section::Mutex<RefCell<_>>` or
+// `spin::Mutex<_>` over a `heapless`-backed table; here we use
+// `std::sync::Mutex` over a `Vec` because the example runs on the host.
+// The trait impl itself is the portable pattern — only the concurrency
+// primitive and storage type change on firmware.
+
+type SubKey = (u16, u16, u16, SocketAddrV4);
+
+#[derive(Clone, Default)]
+struct MockSubscriptions(Arc<Mutex<Vec<SubKey>>>);
+
+impl SubscriptionHandle for MockSubscriptions {
+    fn subscribe(
+        &self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        subscriber_addr: SocketAddrV4,
+    ) -> impl Future<Output = Result<(), SubscribeError>> + '_ {
+        let inner = Arc::clone(&self.0);
+        async move {
+            let mut guard = inner.lock().unwrap();
+            let key = (service_id, instance_id, event_group_id, subscriber_addr);
+            if !guard.contains(&key) {
+                guard.push(key);
+            }
+            Ok(())
+        }
+    }
+
+    fn unsubscribe(
+        &self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        subscriber_addr: SocketAddrV4,
+    ) -> impl Future<Output = ()> + '_ {
+        let inner = Arc::clone(&self.0);
+        async move {
+            inner
+                .lock()
+                .unwrap()
+                .retain(|e| *e != (service_id, instance_id, event_group_id, subscriber_addr));
+        }
+    }
+
+    fn for_each_subscriber<'a, F>(
+        &'a self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        mut f: F,
+    ) -> impl Future<Output = usize> + 'a
+    where
+        F: FnMut(&Subscriber) + 'a,
+    {
+        let inner = Arc::clone(&self.0);
+        async move {
+            let guard = inner.lock().unwrap();
+            let mut count = 0;
+            for (s, i, e, addr) in guard.iter() {
+                if *s == service_id && *i == instance_id && *e == event_group_id {
+                    let sub = Subscriber::new(*addr, *s, *i, *e);
+                    f(&sub);
+                    count += 1;
+                }
+            }
+            count
+        }
+    }
+}
+
+// ── Main ──────────────────────────────────────────────────────────────
+
+// current_thread matches a single-core bare-metal executor; yields are
+// fully sequential, which lets the assertion below observe the first
+// SD announcement reliably.
+#[tokio::main(flavor = "current_thread")]
+async fn main() {
+    let pipe = Arc::new(MockPipe::default());
+    let factory = MockFactory {
+        pipe: Arc::clone(&pipe),
+        next_port: Arc::new(Mutex::new(0)),
+    };
+
+    // std Arc/Mutex implements E2ERegistryHandle and is gated by
+    // `feature = "std"`, not `server-tokio`. A future no-alloc port
+    // replaces this with a stack-allocated handle.
+    let e2e: Arc<Mutex<E2ERegistry>> = Arc::new(Mutex::new(E2ERegistry::new()));
+    let subs = MockSubscriptions::default();
+
+    // service_id=0x1234, instance_id=1, bound to LOCALHOST:30490.
+    let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 30490, 0x1234, 1);
+
+    let server = Server::<
+        Arc<Mutex<E2ERegistry>>,
+        MockSubscriptions,
+        MockFactory,
+        MockTimer,
+    >::new_with_deps(
+        ServerDeps { factory, timer: MockTimer, e2e_registry: e2e, subscriptions: subs },
+        config,
+        false, // multicast_loopback
+    )
+    .await
+    .expect("Server::new_with_deps failed");
+
+    // The announcement loop periodically multicasts SD OfferService
+    // entries so clients on the network can discover this service.
+    // It is Send + 'static and can be handed to any executor.
+    let announce_handle = tokio::spawn(
+        server
+            .announcement_loop()
+            .expect("non-passive server must have an announcement loop"),
+    );
+
+    // Yield twice: the announcement loop fires its first SD offer on the
+    // first poll before the inter-announcement timer starts.
+    tokio::task::yield_now().await;
+    tokio::task::yield_now().await;
+
+    // Verify the server actually sent at least one SD announcement.
+    let sent = pipe.sent.lock().unwrap().len();
+    assert!(
+        sent > 0,
+        "server should have multicast at least one SD OfferService"
+    );
+
+    announce_handle.abort();
+    let _ = announce_handle.await;
+
+    println!(
+        "bare-metal server example: Server::new_with_deps compiled and ran successfully \
+         under features=[server, bare_metal] — no tokio / socket2 from simple-someip itself. \
+         SD announcements sent: {sent}."
+    );
+}
diff --git a/examples/client_server/Cargo.toml b/examples/client_server/Cargo.toml
index 9d4495f..d4f8aa5 100644
--- a/examples/client_server/Cargo.toml
+++ b/examples/client_server/Cargo.toml
@@ -5,7 +5,7 @@ edition = "2024"
 publish = false
 
 [dependencies]
-simple-someip = { path = "../..", features = ["client", "server"] }
+simple-someip = { path = "../..", features = ["client-tokio", "server-tokio"] }
 tokio = { version = "1", features = ["macros", "rt-multi-thread", "time"] }
 tracing = "0.1"
 tracing-subscriber = "0.3"
diff --git a/examples/client_server/src/main.rs b/examples/client_server/src/main.rs
index 82771d0..d873b79 100644
--- a/examples/client_server/src/main.rs
+++ b/examples/client_server/src/main.rs
@@ -1,4 +1,4 @@
-//! Client+Server hybrid example using `start_sd_announcements`.
+//! Client+Server hybrid example using `Client::sd_announcements_loop`.
 //!
 //! Demonstrates how to run a SOME/IP application that is simultaneously:
 //! - A **client** subscribing to a remote service's events
@@ -10,8 +10,8 @@
 //! This ensures remote nodes see a single coherent network identity for
 //! multicast announcements.
 //!
-//! The server's built-in `start_announcing()` is NOT used — instead, the
-//! client's `start_sd_announcements()` handles periodic multicast
+//! The server's built-in `announcement_loop()` is NOT used — instead, the
+//! client's `sd_announcements_loop()` handles periodic multicast
 //! announcements. The server's `run()` loop still handles unicast SD
 //! traffic (e.g. `SubscribeAck`/`SubscribeNack` responses) on its own
 //! socket, which is necessary for subscription management.
@@ -106,7 +106,8 @@ async fn main() -> Result<(), Box<dyn std::error::Error>> {
 
     // ── Create the client (handles discovery, subscriptions, SD socket) ──
 
-    let (client, mut updates) = simple_someip::Client::<Payload>::new(interface);
+    let (client, mut updates, run_fut) = simple_someip::Client::<Payload, _, _, _>::new(interface);
+    let _run_handle = tokio::spawn(run_fut);
     client.bind_discovery().await?;
     info!("Client discovery bound");
 
@@ -115,23 +116,27 @@ async fn main() -> Result<(), Box<dyn std::error::Error>> {
     let config = ServerConfig {
         interface,
         local_port: MY_SERVER_PORT,
-        service_id: MY_SERVER_SERVICE_ID,
-        instance_id: MY_SERVER_INSTANCE_ID,
         major_version: 1,
         minor_version: 0,
         ttl: 3,
+        ..ServerConfig::new(
+            interface,
+            MY_SERVER_PORT,
+            MY_SERVER_SERVICE_ID,
+            MY_SERVER_INSTANCE_ID,
+        )
     };
 
     let mut server = Server::new(config).await?;
     info!("Server bound on port {MY_SERVER_PORT}");
 
-    // NOTE: We intentionally do NOT call server.start_announcing().
-    // The client's start_sd_announcements handles all SD traffic.
+    // NOTE: We intentionally do NOT spawn server.announcement_loop().
+    // The client's sd_announcements_loop handles all SD traffic.
 
     let _publisher = server.publisher();
 
     // Spawn the server event loop (handles incoming subscriptions).
-    tokio::spawn(async move {
+    let _server_handle = tokio::spawn(async move {
         if let Err(e) = server.run().await {
             error!("Server error: {e}");
         }
@@ -140,7 +145,8 @@ async fn main() -> Result<(), Box<dyn std::error::Error>> {
     // ── Start combined SD announcements from the client socket ───────────
 
     let sd_header = build_sd_header(interface);
-    let _announce_handle = client.start_sd_announcements(sd_header, Duration::from_secs(1));
+    let _announce_handle =
+        tokio::spawn(client.sd_announcements_loop(sd_header, Duration::from_secs(1)));
     info!("Started combined Find+Offer SD announcements (1s interval)");
 
     // ── Main event loop ─────────────────────────────────────────────────
diff --git a/examples/discovery_client/Cargo.toml b/examples/discovery_client/Cargo.toml
index 7ccb1e4..51a9cd3 100644
--- a/examples/discovery_client/Cargo.toml
+++ b/examples/discovery_client/Cargo.toml
@@ -6,7 +6,7 @@ publish = false
 
 [dependencies]
 embedded-io = "0.7"
-simple-someip = { path = "../..", features = ["client"] }
+simple-someip = { path = "../..", features = ["client-tokio"] }
 tokio = { version = "1", features = ["macros", "rt-multi-thread"] }
 tracing = "0.1"
 tracing-subscriber = "0.3"
diff --git a/examples/discovery_client/src/main.rs b/examples/discovery_client/src/main.rs
index 41b90fc..4c3fcb0 100644
--- a/examples/discovery_client/src/main.rs
+++ b/examples/discovery_client/src/main.rs
@@ -287,7 +287,8 @@ async fn main() -> Result<(), Error> {
 
     info!("Starting discovery client on interface {interface}");
 
-    let (client, mut updates) = simple_someip::Client::<Payload>::new(interface);
+    let (client, mut updates, run_fut) = simple_someip::Client::<Payload, _, _, _>::new(interface);
+    let _run_handle = tokio::spawn(run_fut);
     client.bind_discovery().await.unwrap();
 
     let mut state = DiscoveryState::new();
diff --git a/src/client/bind_dispatch.rs b/src/client/bind_dispatch.rs
new file mode 100644
index 0000000..39d8977
--- /dev/null
+++ b/src/client/bind_dispatch.rs
@@ -0,0 +1,172 @@
+//! Spawner-agnostic bind dispatch for the `Client` run-loop.
+//!
+//! `Inner` needs to bind two kinds of UDP sockets — the SD multicast
+//! socket and per-port unicast sockets — and submit each socket's I/O
+//! loop to a task spawner. Multi-threaded executors (tokio default)
+//! require the spawned future to be `Send`; single-threaded executors
+//! (embassy with `task-arena = 0`, tokio's `LocalSet`) accept `!Send`
+//! futures via [`crate::LocalSpawner`].
+//!
+//! Rather than duplicating `Inner::run_future` for the two cases, we
+//! abstract the bind-and-spawn step behind [`BindDispatch`]. `Inner` is
+//! generic over a single `D: BindDispatch` field; the public
+//! [`Client::new_with_deps`](super::Client::new_with_deps) constructs a
+//! [`SpawnerDispatch`] and
+//! [`Client::new_with_deps_local`](super::Client::new_with_deps_local)
+//! constructs a [`LocalSpawnerDispatch`].
+//!
+//! The trait is intentionally crate-private — third parties extend the
+//! public surface by implementing [`crate::Spawner`] or
+//! [`crate::LocalSpawner`], not by writing their own `BindDispatch`.
+
+use core::future::Future;
+use core::net::Ipv4Addr;
+
+use super::error::Error;
+use super::socket_manager::SocketManager;
+use crate::traits::PayloadWireFormat;
+use crate::transport::{
+    ChannelFactory, E2ERegistryHandle, LocalSpawner, Spawner, TransportFactory, TransportSocket,
+};
+
+/// Crate-private bind-and-spawn abstraction shared by Send and `!Send`
+/// `Client` construction paths.
+pub(super) trait BindDispatch<MD, C, R>
+where
+    MD: PayloadWireFormat + Clone + core::fmt::Debug + Send + 'static,
+    C: ChannelFactory,
+    R: E2ERegistryHandle,
+    Result<super::socket_manager::ReceivedMessage<MD>, Error>:
+        crate::transport::BoundedPooled<C, 16>,
+    super::socket_manager::SendMessage<MD, C>: crate::transport::BoundedPooled<C, 16>,
+    Result<(), Error>: crate::transport::OneshotPooled<C>,
+{
+    /// Bind a discovery socket and submit its I/O loop to the
+    /// configured task executor.
+    fn bind_discovery(
+        &self,
+        interface: Ipv4Addr,
+        e2e_registry: R,
+        session_id: u16,
+        session_has_wrapped: bool,
+        multicast_loopback: bool,
+    ) -> impl Future<Output = Result<SocketManager<MD, C>, Error>> + '_;
+
+    /// Bind a unicast socket on `port` (0 = ephemeral) and submit its
+    /// I/O loop.
+    fn bind_unicast(
+        &self,
+        port: u16,
+        e2e_registry: R,
+    ) -> impl Future<Output = Result<SocketManager<MD, C>, Error>> + '_;
+}
+
+/// `BindDispatch` for the multi-threaded path: requires a
+/// [`Spawner`] and a `Send + Sync` transport socket.
+pub(super) struct SpawnerDispatch<F, S> {
+    pub factory: F,
+    pub spawner: S,
+}
+
+impl<MD, C, R, F, S> BindDispatch<MD, C, R> for SpawnerDispatch<F, S>
+where
+    MD: PayloadWireFormat + Clone + core::fmt::Debug + Send + 'static,
+    C: ChannelFactory,
+    R: E2ERegistryHandle,
+    F: TransportFactory + Send + Sync + 'static,
+    F::Socket: Send + Sync + 'static,
+    for<'a> F::BindFuture<'a>: Send,
+    for<'a> <F::Socket as TransportSocket>::SendFuture<'a>: Send,
+    for<'a> <F::Socket as TransportSocket>::RecvFuture<'a>: Send,
+    S: Spawner + Send + Sync + 'static,
+    Result<super::socket_manager::ReceivedMessage<MD>, Error>:
+        crate::transport::BoundedPooled<C, 16>,
+    super::socket_manager::SendMessage<MD, C>: crate::transport::BoundedPooled<C, 16>,
+    Result<(), Error>: crate::transport::OneshotPooled<C>,
+{
+    fn bind_discovery(
+        &self,
+        interface: Ipv4Addr,
+        e2e_registry: R,
+        session_id: u16,
+        session_has_wrapped: bool,
+        multicast_loopback: bool,
+    ) -> impl Future<Output = Result<SocketManager<MD, C>, Error>> + '_ {
+        SocketManager::<MD, C>::bind_discovery_seeded_with_transport(
+            &self.factory,
+            &self.spawner,
+            interface,
+            e2e_registry,
+            session_id,
+            session_has_wrapped,
+            multicast_loopback,
+        )
+    }
+
+    fn bind_unicast(
+        &self,
+        port: u16,
+        e2e_registry: R,
+    ) -> impl Future<Output = Result<SocketManager<MD, C>, Error>> + '_ {
+        SocketManager::<MD, C>::bind_with_transport(
+            &self.factory,
+            &self.spawner,
+            port,
+            e2e_registry,
+        )
+    }
+}
+
+/// `BindDispatch` for the single-threaded path: requires a
+/// [`LocalSpawner`] and `'static` transport socket. The socket and its
+/// GAT futures are not required to be `Send`.
+pub(super) struct LocalSpawnerDispatch<F, S> {
+    pub factory: F,
+    pub spawner: S,
+}
+
+impl<MD, C, R, F, S> BindDispatch<MD, C, R> for LocalSpawnerDispatch<F, S>
+where
+    MD: PayloadWireFormat + Clone + core::fmt::Debug + Send + 'static,
+    C: ChannelFactory,
+    R: E2ERegistryHandle,
+    F: TransportFactory + 'static,
+    F::Socket: 'static,
+    S: LocalSpawner + 'static,
+    Result<super::socket_manager::ReceivedMessage<MD>, Error>:
+        crate::transport::BoundedPooled<C, 16>,
+    super::socket_manager::SendMessage<MD, C>: crate::transport::BoundedPooled<C, 16>,
+    Result<(), Error>: crate::transport::OneshotPooled<C>,
+{
+    fn bind_discovery(
+        &self,
+        interface: Ipv4Addr,
+        e2e_registry: R,
+        session_id: u16,
+        session_has_wrapped: bool,
+        multicast_loopback: bool,
+    ) -> impl Future<Output = Result<SocketManager<MD, C>, Error>> + '_ {
+        SocketManager::<MD, C>::bind_discovery_seeded_with_transport_local(
+            &self.factory,
+            &self.spawner,
+            interface,
+            e2e_registry,
+            session_id,
+            session_has_wrapped,
+            multicast_loopback,
+        )
+    }
+
+    fn bind_unicast(
+        &self,
+        port: u16,
+        e2e_registry: R,
+    ) -> impl Future<Output = Result<SocketManager<MD, C>, Error>> + '_ {
+        SocketManager::<MD, C>::bind_with_transport_local(
+            &self.factory,
+            &self.spawner,
+            port,
+            e2e_registry,
+        )
+    }
+}
diff --git a/src/client/error.rs b/src/client/error.rs
index 64af381..8ad9564 100644
--- a/src/client/error.rs
+++ b/src/client/error.rs
@@ -1,14 +1,21 @@
 use thiserror::Error;
 
 /// Errors that can occur during SOME/IP client operations.
+///
+/// # Stability
+///
+/// This enum is **not** marked `#[non_exhaustive]`, so downstream crates
+/// may currently match it exhaustively. That convenience comes with a
+/// real cost: **any new variant added here is a breaking change** and
+/// must be flagged in the changelog and reflected in the next `SemVer`
+/// bump (pre-1.0, a minor bump is sufficient, but it still requires a
+/// release-notes entry). The same is true of renaming or restructuring
+/// existing variants.
 #[derive(Error, Debug)]
 pub enum Error {
     /// A SOME/IP protocol-level error.
     #[error(transparent)]
     Protocol(#[from] crate::protocol::Error),
-    /// An I/O error from the underlying network transport.
-    #[error(transparent)]
-    Io(#[from] std::io::Error),
     /// Received a discovery message that was not expected.
     #[error("Unexpected discovery message: {0:?}")]
     UnexpectedDiscoveryMessage(crate::protocol::Header),
@@ -24,4 +31,119 @@ pub enum Error {
     /// An E2E protection or checking error occurred.
     #[error(transparent)]
     E2e(#[from] crate::e2e::Error),
+    /// A fixed-capacity internal structure is full. The argument is a
+    /// lowercase `snake_case` tag naming the resource; grep the crate for
+    /// the tag to find the compile-time constant that governs it.
+    ///
+    /// Current tags:
+    /// - `"unicast_sockets"` — bound by `UNICAST_SOCKETS_CAP`. The
+    ///   client cannot bind a new ephemeral / requested-port unicast
+    ///   socket because the per-client cap is exhausted.
+    /// - `"udp_buffer"` — bound by [`crate::UDP_BUFFER_SIZE`]. A
+    ///   `Client::send` was rejected because the encoded message
+    ///   exceeds the application-level UDP cap. **Note:** with E2E
+    ///   protect configured for the destination key, the post-protect
+    ///   payload may add up to the protect profile's overhead bytes
+    ///   (Profile 1: 4, Profile 4: 16). The pre-encode check uses the
+    ///   raw size; the post-protect re-check inside the spawned send
+    ///   loop produces this error if the protected datagram would
+    ///   overflow the cap.
+    /// - `"pending_responses"` — bound by `PENDING_RESPONSES_CAP`. A
+    ///   request was enqueued but the in-flight response table is
+    ///   full; the request was dropped.
+    /// - `"request_queue"` — bound by `REQUEST_QUEUE_CAP`. The
+    ///   client's internal control-message queue overflowed during a
+    ///   multi-pass `push_front` re-enqueue (e.g. an auto-bind path).
+    ///   Public callers normally hit the bounded(4) control channel
+    ///   first and either backpressure or fail with `Shutdown`; this
+    ///   tag fires only in the narrow re-enqueue overflow window.
+    /// - `"service_registry"` — bound by `SERVICE_REGISTRY_CAP`. A
+    ///   new `(service_id, instance_id)` endpoint cannot be registered
+    ///   because the registry is full.
+    #[error("internal capacity exceeded: {0}")]
+    Capacity(&'static str),
+    /// An error surfaced by the pluggable transport backend (see
+    /// [`crate::transport::TransportError`]).
+    #[error(transparent)]
+    Transport(#[from] crate::transport::TransportError),
+    /// The client's internal run-loop future has exited — either because
+    /// the caller dropped it before or during polling, the executor
+    /// cancelled its task, or it returned. All public `Client` methods
+    /// that enqueue a control message or await its response return
+    /// this variant when the control channel is closed, rather than
+    /// panicking on `.unwrap()` of the send / recv result. Treat it as
+    /// a caller-side lifecycle error: the `Client` handle has outlived
+    /// its driver and further calls on it cannot make progress.
+    #[error("client run loop is no longer running")]
+    Shutdown,
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::transport::TransportError;
+    use std::format;
+
+    #[test]
+    fn transport_variant_displays_via_inner_display_not_debug() {
+        // Regression guard: previously `{0:?}` leaked debug formatting
+        // (e.g. `AddressInUse`) into user-facing error messages. The
+        // `#[error(transparent)]` form delegates fully to the inner
+        // `TransportError`'s Display impl.
+        let err = Error::Transport(TransportError::AddressInUse);
+        let displayed = format!("{err}");
+
+        // No debug-format artifacts: no braces (`AddressInUse` is a unit
+        // variant, but struct-like variants would debug-format with
+        // braces), no quote-wrapping, no raw variant name from debug.
+        assert!(
+            !displayed.contains('{'),
+            "unexpected `{{` in Display output: {displayed:?}"
+        );
+        assert!(
+            !displayed.contains('}'),
+            "unexpected `}}` in Display output: {displayed:?}"
+        );
+        assert!(
+            !displayed.contains('"'),
+            "unexpected `\"` in Display output: {displayed:?}"
+        );
+
+        // `transparent` delegates to the inner Display verbatim.
+        let inner = format!("{}", TransportError::AddressInUse);
+        assert_eq!(displayed, inner);
+        assert_eq!(displayed, "address in use");
+    }
+
+    #[test]
+    fn capacity_variant_includes_tag_in_display() {
+        let err = Error::Capacity("request_queue");
+        let displayed = format!("{err}");
+        assert!(
+            displayed.contains("request_queue"),
+            "Capacity display must include the tag: {displayed:?}"
+        );
+    }
+
+    #[test]
+    fn shutdown_variant_display() {
+        let err = Error::Shutdown;
+        let displayed = format!("{err}");
+        assert!(
+            !displayed.is_empty(),
+            "Shutdown must have a non-empty display message"
+        );
+    }
+
+    #[test]
+    fn simple_variants_display_without_panicking() {
+        for err in [
+            Error::SocketClosedUnexpectedly,
+            Error::UnicastSocketNotBound,
+            Error::ServiceNotFound,
+            Error::Shutdown,
+        ] {
+            let _ = format!("{err}");
+        }
+    }
 }
diff --git a/src/client/inner.rs b/src/client/inner.rs
index 412c6c6..b6c6674 100644
--- a/src/client/inner.rs
+++ b/src/client/inner.rs
@@ -1,59 +1,70 @@
-use std::{
-    borrow::ToOwned,
-    collections::{HashMap, VecDeque},
-    future,
-    net::{Ipv4Addr, SocketAddr, SocketAddrV4},
-    sync::{Arc, Mutex},
-    task::Poll,
-};
-use tokio::{
-    select,
-    sync::{
-        mpsc::{self, Receiver, Sender},
-        oneshot,
-    },
-};
+use core::future;
+use core::net::{Ipv4Addr, SocketAddr, SocketAddrV4};
+use core::task::Poll;
+use futures::{FutureExt, pin_mut, select};
+use heapless::{Deque, index_map::FnvIndexMap};
+use std::borrow::ToOwned;
+#[cfg(all(test, feature = "client-tokio"))]
+use std::sync::{Arc, Mutex};
 use tracing::{debug, error, info, trace, warn};
 
+#[cfg(all(test, feature = "client-tokio"))]
+use crate::e2e::E2ERegistry;
+#[cfg(all(test, feature = "client-tokio"))]
+use crate::tokio_transport::{TokioChannels, TokioSpawner, TokioTimer, TokioTransport};
 use crate::{
+    Timer,
     client::{
         ClientUpdate, DiscoveryMessage,
         service_registry::{ServiceEndpointInfo, ServiceInstanceId, ServiceRegistry},
         session::{SessionTracker, SessionVerdict, TransportKind},
         socket_manager::{ReceivedMessage, SocketManager},
     },
-    e2e::E2ERegistry,
     protocol::{self, Message},
     traits::PayloadWireFormat,
+    transport::{ChannelFactory, E2ERegistryHandle, MpscRecv, OneshotSend, UnboundedSend},
 };
 
 use super::error::Error;
 
-pub(super) enum ControlMessage<P: PayloadWireFormat> {
-    SetInterface(Ipv4Addr, oneshot::Sender<Result<(), Error>>),
-    BindDiscovery(oneshot::Sender<Result<(), Error>>),
-    UnbindDiscovery(oneshot::Sender<Result<(), Error>>),
+/// Max depth of the internal control-message queue. Each entry is one
+/// in-flight `ControlMessage`. Must be generous enough to absorb bursts
+/// from `Client` callers between event-loop ticks.
+const REQUEST_QUEUE_CAP: usize = 32;
+
+/// Max number of outstanding unicast request-response pairs. Each entry is
+/// a `request_id` awaiting a reply. Must be a power of two.
+const PENDING_RESPONSES_CAP: usize = 64;
+
+/// Max number of bound unicast sockets tracked by port. Must be a power of
+/// two.
+const UNICAST_SOCKETS_CAP: usize = 8;
+
+pub enum ControlMessage<P: PayloadWireFormat + 'static, C: ChannelFactory> {
+    SetInterface(Ipv4Addr, C::OneshotSender<Result<(), Error>>),
+    BindDiscovery(C::OneshotSender<Result<(), Error>>),
+    UnbindDiscovery(C::OneshotSender<Result<(), Error>>),
     SendSD(
         SocketAddrV4,
         P::SdHeader,
-        oneshot::Sender<Result<(), Error>>,
+        C::OneshotSender<Result<(), Error>>,
     ),
     AddEndpoint(
         u16,
         u16,
         SocketAddrV4,
         u16,
-        oneshot::Sender<Result<(), Error>>,
+        C::OneshotSender<Result<(), Error>>,
     ),
-    RemoveEndpoint(u16, u16, oneshot::Sender<Result<(), Error>>),
+    RemoveEndpoint(u16, u16, C::OneshotSender<Result<(), Error>>),
     SendToService {
         service_id: u16,
         instance_id: u16,
         message: Message<P>,
         /// Fires when the UDP send completes (or errors on lookup/bind).
-        send_complete: oneshot::Sender<Result<(), Error>>,
+        send_complete: C::OneshotSender<Result<(), Error>>,
         /// Fires when a matching unicast response arrives.
-        response: oneshot::Sender<Result<P, Error>>,
+        response: C::OneshotSender<Result<P, Error>>,
     },
     Subscribe {
         service_id: u16,
@@ -62,18 +73,18 @@ pub(super) enum ControlMessage<P: PayloadWireFormat> {
         ttl: u32,
         event_group_id: u16,
         client_port: u16,
-        response: oneshot::Sender<Result<(), Error>>,
+        response: C::OneshotSender<Result<(), Error>>,
     },
-    QueryRebootFlag(oneshot::Sender<crate::protocol::sd::RebootFlag>),
+    QueryRebootFlag(C::OneshotSender<Result<crate::protocol::sd::RebootFlag, Error>>),
     /// Test-only: force `sd_session_has_wrapped` to simulate the state a
     /// long-running client reaches after its SD session counter wraps past
     /// `0xFFFF`, without actually sending 65k SD messages. Fires the
     /// accompanying oneshot once the mutation is applied.
-    #[cfg(test)]
-    ForceSdSessionWrappedForTest(bool, oneshot::Sender<()>),
+    #[cfg(all(test, feature = "client-tokio"))]
+    ForceSdSessionWrappedForTest(bool, C::OneshotSender<Result<(), Error>>),
 }
 
-impl<P: PayloadWireFormat> std::fmt::Debug for ControlMessage<P> {
+impl<P: PayloadWireFormat + 'static, C: ChannelFactory> std::fmt::Debug for ControlMessage<P, C> {
     fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
         match self {
             Self::SetInterface(addr, _) => f.debug_tuple("SetInterface").field(addr).finish(),
@@ -117,7 +128,7 @@ impl<P: PayloadWireFormat> std::fmt::Debug for ControlMessage<P> {
                 .field("event_group_id", event_group_id)
                 .finish_non_exhaustive(),
             Self::QueryRebootFlag(_) => f.write_str("QueryRebootFlag"),
-            #[cfg(test)]
+            #[cfg(all(test, feature = "client-tokio"))]
             Self::ForceSdSessionWrappedForTest(b, _) => f
                 .debug_tuple("ForceSdSessionWrappedForTest")
                 .field(b)
@@ -126,45 +137,58 @@ impl<P: PayloadWireFormat> std::fmt::Debug for ControlMessage<P> {
     }
 }
 
-impl<P: PayloadWireFormat> ControlMessage<P> {
-    pub fn set_interface(interface: Ipv4Addr) -> (oneshot::Receiver<Result<(), Error>>, Self) {
-        let (sender, receiver) = oneshot::channel();
+impl<P, C> ControlMessage<P, C>
+where
+    P: PayloadWireFormat + Send + 'static,
+    C: ChannelFactory,
+    Result<(), Error>: crate::transport::OneshotPooled<C>,
+    Result<P, Error>: crate::transport::OneshotPooled<C>,
+    Result<crate::protocol::sd::RebootFlag, Error>: crate::transport::OneshotPooled<C>,
+{
+    #[must_use]
+    pub fn set_interface(interface: Ipv4Addr) -> (C::OneshotReceiver<Result<(), Error>>, Self) {
+        let (sender, receiver) = C::oneshot();
         (receiver, Self::SetInterface(interface, sender))
     }
-    pub fn bind_discovery() -> (oneshot::Receiver<Result<(), Error>>, Self) {
-        let (sender, receiver) = oneshot::channel();
+    #[must_use]
+    pub fn bind_discovery() -> (C::OneshotReceiver<Result<(), Error>>, Self) {
+        let (sender, receiver) = C::oneshot();
         (receiver, Self::BindDiscovery(sender))
     }
-    pub fn unbind_discovery() -> (oneshot::Receiver<Result<(), Error>>, Self) {
-        let (sender, receiver) = oneshot::channel();
+    #[must_use]
+    pub fn unbind_discovery() -> (C::OneshotReceiver<Result<(), Error>>, Self) {
+        let (sender, receiver) = C::oneshot();
         (receiver, Self::UnbindDiscovery(sender))
     }
 
+    #[must_use]
     pub fn send_sd(
         socket_addr: SocketAddrV4,
         header: P::SdHeader,
-    ) -> (oneshot::Receiver<Result<(), Error>>, Self) {
-        let (sender, receiver) = oneshot::channel();
+    ) -> (C::OneshotReceiver<Result<(), Error>>, Self) {
+        let (sender, receiver) = C::oneshot();
         (receiver, Self::SendSD(socket_addr, header, sender))
     }
+    #[must_use]
     pub fn add_endpoint(
         service_id: u16,
         instance_id: u16,
         addr: SocketAddrV4,
         local_port: u16,
-    ) -> (oneshot::Receiver<Result<(), Error>>, Self) {
-        let (sender, receiver) = oneshot::channel();
+    ) -> (C::OneshotReceiver<Result<(), Error>>, Self) {
+        let (sender, receiver) = C::oneshot();
         (
             receiver,
             Self::AddEndpoint(service_id, instance_id, addr, local_port, sender),
         )
     }
 
+    #[must_use]
     pub fn remove_endpoint(
         service_id: u16,
         instance_id: u16,
-    ) -> (oneshot::Receiver<Result<(), Error>>, Self) {
-        let (sender, receiver) = oneshot::channel();
+    ) -> (C::OneshotReceiver<Result<(), Error>>, Self) {
+        let (sender, receiver) = C::oneshot();
         (
             receiver,
             Self::RemoveEndpoint(service_id, instance_id, sender),
@@ -172,17 +196,18 @@ impl<P: PayloadWireFormat> ControlMessage<P> {
     }
 
     #[allow(clippy::type_complexity)]
+    #[must_use]
     pub fn send_to_service(
         service_id: u16,
         instance_id: u16,
         message: Message<P>,
     ) -> (
-        oneshot::Receiver<Result<(), Error>>,
-        oneshot::Receiver<Result<P, Error>>,
+        C::OneshotReceiver<Result<(), Error>>,
+        C::OneshotReceiver<Result<P, Error>>,
         Self,
     ) {
-        let (send_complete_tx, send_complete_rx) = oneshot::channel();
-        let (response_tx, response_rx) = oneshot::channel();
+        let (send_complete_tx, send_complete_rx) = C::oneshot();
+        let (response_tx, response_rx) = C::oneshot();
         (
             send_complete_rx,
             response_rx,
@@ -196,6 +221,7 @@ impl<P: PayloadWireFormat> ControlMessage<P> {
         )
     }
 
+    #[must_use]
     pub fn subscribe(
         service_id: u16,
         instance_id: u16,
@@ -203,8 +229,8 @@ impl<P: PayloadWireFormat> ControlMessage<P> {
         ttl: u32,
         event_group_id: u16,
         client_port: u16,
-    ) -> (oneshot::Receiver<Result<(), Error>>, Self) {
-        let (sender, receiver) = oneshot::channel();
+    ) -> (C::OneshotReceiver<Result<(), Error>>, Self) {
+        let (sender, receiver) = C::oneshot();
         (
             receiver,
             Self::Subscribe {
@@ -219,37 +245,91 @@ impl<P: PayloadWireFormat> ControlMessage<P> {
         )
     }
 
-    pub fn query_reboot_flag() -> (oneshot::Receiver<crate::protocol::sd::RebootFlag>, Self) {
-        let (sender, receiver) = oneshot::channel();
+    #[must_use]
+    pub fn query_reboot_flag() -> (
+        C::OneshotReceiver<Result<crate::protocol::sd::RebootFlag, Error>>,
+        Self,
+    ) {
+        let (sender, receiver) = C::oneshot();
         (receiver, Self::QueryRebootFlag(sender))
     }
 
-    #[cfg(test)]
-    pub fn force_sd_session_wrapped_for_test(wrapped: bool) -> (oneshot::Receiver<()>, Self) {
-        let (sender, receiver) = oneshot::channel();
+    #[cfg(all(test, feature = "client-tokio"))]
+    #[must_use]
+    pub fn force_sd_session_wrapped_for_test(
+        wrapped: bool,
+    ) -> (C::OneshotReceiver<Result<(), Error>>, Self) {
+        let (sender, receiver) = C::oneshot();
         (
             receiver,
             Self::ForceSdSessionWrappedForTest(wrapped, sender),
         )
     }
+
+    /// Consume this message and notify its oneshot senders with
+    /// `Error::Capacity(structure_name)` instead of silently dropping them.
+    ///
+    /// Dropping the senders would let the awaiting `oneshot::Receiver`s
+    /// resolve to `RecvError`, which the public APIs currently `.unwrap()`
+    /// — that would panic callers under load. Delivering an explicit
+    /// `Err(Error::Capacity(..))` turns a would-be panic into a normal
+    /// `Result` with a stable, descriptive error.
+    fn reject_with_capacity(self, structure_name: &'static str) {
+        match self {
+            Self::SetInterface(_, response)
+            | Self::BindDiscovery(response)
+            | Self::UnbindDiscovery(response)
+            | Self::SendSD(_, _, response)
+            | Self::AddEndpoint(_, _, _, _, response)
+            | Self::RemoveEndpoint(_, _, response)
+            | Self::Subscribe { response, .. } => {
+                let _ = response.send(Err(Error::Capacity(structure_name)));
+            }
+            Self::SendToService {
+                send_complete,
+                response,
+                ..
+            } => {
+                let _ = send_complete.send(Err(Error::Capacity(structure_name)));
+                let _ = response.send(Err(Error::Capacity(structure_name)));
+            }
+            Self::QueryRebootFlag(response) => {
+                let _ = response.send(Err(Error::Capacity(structure_name)));
+            }
+            #[cfg(all(test, feature = "client-tokio"))]
+            Self::ForceSdSessionWrappedForTest(_, response) => {
+                let _ = response.send(Err(Error::Capacity(structure_name)));
+            }
+        }
+    }
 }
 
-pub(super) struct Inner<PayloadDefinitions: PayloadWireFormat> {
+pub(super) struct Inner<
+    PayloadDefinitions: PayloadWireFormat + 'static,
+    Tm: Timer,
+    R: E2ERegistryHandle,
+    C: ChannelFactory,
+    D,
+> {
     /// MPSC Receiver used to receive control messages from outer client
-    control_receiver: Receiver<ControlMessage<PayloadDefinitions>>,
+    control_receiver: C::BoundedReceiver<ControlMessage<PayloadDefinitions, C>, 4>,
     /// Queue of pending control messages to process
-    request_queue: VecDeque<ControlMessage<PayloadDefinitions>>,
+    request_queue: Deque<ControlMessage<PayloadDefinitions, C>, REQUEST_QUEUE_CAP>,
     /// Pending request-responses keyed by `request_id` (`client_id` << 16 | `session_counter`).
     /// Set by `SendToService`, cleared when a matching unicast arrives.
-    pending_responses: HashMap<u32, oneshot::Sender<Result<PayloadDefinitions, Error>>>,
+    pending_responses: FnvIndexMap<
+        u32,
+        C::OneshotSender<Result<PayloadDefinitions, Error>>,
+        PENDING_RESPONSES_CAP,
+    >,
     /// Unbounded sender used to send updates to outer client
-    update_sender: mpsc::UnboundedSender<ClientUpdate<PayloadDefinitions>>,
+    update_sender: C::UnboundedSender<ClientUpdate<PayloadDefinitions>>,
     /// Target interface for sockets
     interface: Ipv4Addr,
     /// Socket manager for service discovery if bound
-    discovery_socket: Option<SocketManager<PayloadDefinitions>>,
+    discovery_socket: Option<SocketManager<PayloadDefinitions, C>>,
     /// Socket managers for unicast messages, keyed by local port
-    unicast_sockets: HashMap<u16, SocketManager<PayloadDefinitions>>,
+    unicast_sockets: FnvIndexMap<u16, SocketManager<PayloadDefinitions, C>, UNICAST_SOCKETS_CAP>,
     /// Per-sender SD session state for reboot detection
     session_tracker: SessionTracker,
     /// Registry of known service endpoints (auto-populated from SD + manual)
@@ -265,14 +345,27 @@ pub(super) struct Inner<PayloadDefinitions: PayloadWireFormat> {
     sd_session_id: u16,
     sd_session_has_wrapped: bool,
     /// Shared E2E registry for runtime E2E configuration
-    e2e_registry: Arc<Mutex<E2ERegistry>>,
+    e2e_registry: R,
     /// Enable multicast loopback on SD sockets for same-host testing
     multicast_loopback: bool,
+    /// Bind dispatch — abstracts the bind-and-spawn step over either a
+    /// [`Spawner`](crate::transport::Spawner) (Send-required) or a
+    /// [`LocalSpawner`](crate::transport::LocalSpawner) (single-task)
+    /// path. Holds the [`TransportFactory`](crate::transport::TransportFactory)
+    /// and the spawner internally; see
+    /// [`crate::client::bind_dispatch`] for the two impls.
+    dispatch: D,
+    /// Async sleep primitive used by the run-loop's idle tick and any
+    /// future periodic-emission paths. On `client-tokio` builds this is
+    /// [`TokioTimer`] (which wraps `tokio::time::sleep`).
+    timer: Tm,
     /// Phantom data to represent the generic message definitions
-    phantom: std::marker::PhantomData<PayloadDefinitions>,
+    phantom: core::marker::PhantomData<PayloadDefinitions>,
 }
 
-impl<PayloadDefinitions: PayloadWireFormat> std::fmt::Debug for Inner<PayloadDefinitions> {
+impl<P: PayloadWireFormat, Tm: Timer, R: E2ERegistryHandle, C: ChannelFactory, D> std::fmt::Debug
+    for Inner<P, Tm, R, C, D>
+{
     fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
         f.debug_struct("Inner")
             .field("interface", &self.interface)
@@ -284,29 +377,59 @@ impl<PayloadDefinitions: PayloadWireFormat> std::fmt::Debug for Inner<PayloadDef
     }
 }
 
-impl<PayloadDefinitions> Inner<PayloadDefinitions>
+impl<PayloadDefinitions, Tm, R, C, D> Inner<PayloadDefinitions, Tm, R, C, D>
 where
-    PayloadDefinitions: PayloadWireFormat + Clone + std::fmt::Debug + 'static,
+    PayloadDefinitions: PayloadWireFormat + Clone + std::fmt::Debug + Send + 'static,
+    Tm: Timer + 'static,
+    R: E2ERegistryHandle,
+    C: ChannelFactory,
+    D: crate::client::bind_dispatch::BindDispatch<PayloadDefinitions, C, R> + 'static,
+    // Channel-bound bundle (see comment in `client::mod`).
+    Result<(), Error>: crate::transport::OneshotPooled<C>,
+    Result<PayloadDefinitions, Error>: crate::transport::OneshotPooled<C>,
+    Result<crate::protocol::sd::RebootFlag, Error>: crate::transport::OneshotPooled<C>,
+    ControlMessage<PayloadDefinitions, C>: crate::transport::BoundedPooled<C, 4>,
+    super::socket_manager::SendMessage<PayloadDefinitions, C>:
+        crate::transport::BoundedPooled<C, 16>,
+    Result<super::socket_manager::ReceivedMessage<PayloadDefinitions>, Error>:
+        crate::transport::BoundedPooled<C, 16>,
+    super::ClientUpdate<PayloadDefinitions>: crate::transport::UnboundedPooled<C>,
 {
-    pub fn spawn(
+    /// Construct an `Inner` and return the control/update channels plus
+    /// the run-loop future.
+    ///
+    /// The dispatch is one of [`SpawnerDispatch`] (Send-required) or
+    /// [`LocalSpawnerDispatch`] (single-task) — the
+    /// `Client::new_with_deps` / `Client::new_with_deps_local` public
+    /// constructors pick the right one. The returned future inherits
+    /// the dispatch's auto-trait set: `Send` if the dispatch is
+    /// Send-aware and all dependencies are `Send`, `!Send` otherwise.
+    ///
+    /// [`SpawnerDispatch`]: super::bind_dispatch::SpawnerDispatch
+    /// [`LocalSpawnerDispatch`]: super::bind_dispatch::LocalSpawnerDispatch
+    #[allow(clippy::type_complexity)]
+    pub fn build(
         interface: Ipv4Addr,
-        e2e_registry: Arc<Mutex<E2ERegistry>>,
+        e2e_registry: R,
         multicast_loopback: bool,
+        dispatch: D,
+        timer: Tm,
     ) -> (
-        Sender<ControlMessage<PayloadDefinitions>>,
-        mpsc::UnboundedReceiver<ClientUpdate<PayloadDefinitions>>,
+        C::BoundedSender<ControlMessage<PayloadDefinitions, C>, 4>,
+        C::UnboundedReceiver<ClientUpdate<PayloadDefinitions>>,
+        impl core::future::Future<Output = ()> + 'static,
     ) {
         info!("Initializing SOME/IP Client");
-        let (control_sender, control_receiver) = mpsc::channel(4);
-        let (update_sender, update_receiver) = mpsc::unbounded_channel();
+        let (control_sender, control_receiver) = C::bounded::<_, 4>();
+        let (update_sender, update_receiver) = C::unbounded();
         let inner = Self {
             control_receiver,
-            request_queue: VecDeque::new(),
-            pending_responses: HashMap::new(),
+            request_queue: Deque::new(),
+            pending_responses: FnvIndexMap::new(),
             update_sender,
             interface,
             discovery_socket: None,
-            unicast_sockets: HashMap::new(),
+            unicast_sockets: FnvIndexMap::new(),
             session_tracker: SessionTracker::default(),
             service_registry: ServiceRegistry::default(),
             run: true,
@@ -316,23 +439,27 @@ where
             sd_session_has_wrapped: false,
             e2e_registry,
             multicast_loopback,
-            phantom: std::marker::PhantomData,
+            dispatch,
+            timer,
+            phantom: core::marker::PhantomData,
         };
-        inner.run();
-        (control_sender, update_receiver)
+        (control_sender, update_receiver, inner.run_future())
     }
 
-    fn bind_discovery(&mut self) -> Result<(), Error> {
+    async fn bind_discovery(&mut self) -> Result<(), Error> {
         if self.discovery_socket.is_some() {
             Ok(())
         } else {
-            let socket = SocketManager::bind_discovery_seeded(
-                self.interface,
-                Arc::clone(&self.e2e_registry),
-                self.sd_session_id,
-                self.sd_session_has_wrapped,
-                self.multicast_loopback,
-            )?;
+            let socket = self
+                .dispatch
+                .bind_discovery(
+                    self.interface,
+                    self.e2e_registry.clone(),
+                    self.sd_session_id,
+                    self.sd_session_has_wrapped,
+                    self.multicast_loopback,
+                )
+                .await?;
             self.discovery_socket = Some(socket);
             Ok(())
         }
@@ -353,21 +480,93 @@ where
         self.interface = interface;
     }
 
-    fn bind_unicast(&mut self, port: u16) -> Result<u16, Error> {
+    async fn bind_unicast(&mut self, port: u16) -> Result<u16, Error> {
         if port != 0
             && let Some(socket) = self.unicast_sockets.get(&port)
         {
             return Ok(socket.port());
         }
-        let unicast_socket = SocketManager::bind(port, Arc::clone(&self.e2e_registry))?;
+        // Check capacity before asking the OS for a port so we don't
+        // bind-then-drop a socket we can't track.
+        if self.unicast_sockets.len() >= UNICAST_SOCKETS_CAP {
+            warn!(
+                "unicast_sockets at capacity ({}); refusing new bind of port {}",
+                UNICAST_SOCKETS_CAP, port
+            );
+            return Err(Error::Capacity("unicast_sockets"));
+        }
+        let unicast_socket = self
+            .dispatch
+            .bind_unicast(port, self.e2e_registry.clone())
+            .await?;
         let bound_port = unicast_socket.port();
-        self.unicast_sockets.insert(bound_port, unicast_socket);
+        // Capacity was checked above, so insert cannot report "full" here.
+        // A defensive check guards against a future refactor that changes
+        // the ordering.
+        if self
+            .unicast_sockets
+            .insert(bound_port, unicast_socket)
+            .is_err()
+        {
+            error!(
+                "unicast_sockets insert failed after capacity check passed — invariant violation"
+            );
+            return Err(Error::Capacity("unicast_sockets"));
+        }
         debug!("Bound unicast socket on port {}", bound_port);
         Ok(bound_port)
     }
 
+    /// Tracks the caller's response channel against `request_id` so a
+    /// future unicast reply can be routed back. If the
+    /// `pending_responses` map is already at `PENDING_RESPONSES_CAP`, the
+    /// `response` sender is recovered from the failed `insert` and used
+    /// to deliver `Err(Error::Capacity("pending_responses"))` — the
+    /// caller's `PendingResponse::response().await` resolves cleanly
+    /// instead of panicking on the `RecvError` that dropping the Sender
+    /// would have produced. If `request_id` is reused while an older
+    /// pending entry still exists (e.g. after a `session_counter`
+    /// wrap-around), the displaced sender is likewise completed with
+    /// `Err(Error::Capacity("pending_responses"))` rather than being
+    /// silently dropped — the caller awaiting the previous request
+    /// sees a clean error instead of a `RecvError` panic. Any reply
+    /// that later arrives for a dropped `request_id` is surfaced on
+    /// the update stream via `ClientUpdate::Unicast` instead of
+    /// matching a pending entry.
+    fn track_or_reject_pending_response(
+        &mut self,
+        request_id: u32,
+        response: C::OneshotSender<Result<PayloadDefinitions, Error>>,
+    ) {
+        match self.pending_responses.insert(request_id, response) {
+            Ok(None) => {}
+            Ok(Some(displaced_response)) => {
+                // `request_id` reuse is expected once `session_counter`
+                // wraps every ~65k requests on a long-lived client, and
+                // legitimate when the previous request is still pending.
+                // The displaced sender carries `Error::Capacity` to its
+                // awaiter; logging at `warn!` per wrap floods ops dashboards
+                // for a routine event, so demote to `debug!`.
+                debug!(
+                    "pending_responses already contained request_id \
+                     0x{:08X}; replacing existing pending response",
+                    request_id
+                );
+                let _ = displaced_response.send(Err(Error::Capacity("pending_responses")));
+            }
+            Err((_req_id, response)) => {
+                warn!(
+                    "pending_responses at capacity ({}); response tracking \
+                     dropped for request_id 0x{:08X}",
+                    PENDING_RESPONSES_CAP, request_id
+                );
+                let _ = response.send(Err(Error::Capacity("pending_responses")));
+            }
+        }
+    }
+
     async fn receive_discovery(
-        socket_manager: &mut Option<SocketManager<PayloadDefinitions>>,
+        socket_manager: &mut Option<SocketManager<PayloadDefinitions, C>>,
     ) -> Result<
         (
             SocketAddr,
@@ -376,47 +575,86 @@ where
         ),
         Error,
     > {
-        if let Some(receiver) = socket_manager {
-            match receiver.receive().await {
-                Some(result) => match result {
-                    Ok(received) => {
-                        let someip_header = received.message.header().clone();
-                        if let Some(sd_header) = received.message.sd_header() {
-                            Ok((received.source, someip_header, sd_header.to_owned()))
-                        } else {
-                            Err(Error::UnexpectedDiscoveryMessage(someip_header))
-                        }
-                    }
-                    Err(err) => Err(err),
-                },
-                None => Err(Error::SocketClosedUnexpectedly),
-            }
+        let Some(socket) = socket_manager else {
+            // If we don't have a receiver, return a future that never resolves
+            return future::pending().await;
+        };
+        let Some(result) = socket.receive().await else {
+            // Socket loop has exited. Evict the dead manager so
+            // subsequent polls don't busy-loop on a closed receiver —
+            // instead they fall through to the `future::pending()`
+            // arm and wait until the user re-binds discovery (e.g.
+            // via SetInterface).
+            *socket_manager = None;
+            return Err(Error::SocketClosedUnexpectedly);
+        };
+        let received = result?;
+        let someip_header = received.message.header().clone();
+        if let Some(sd_header) = received.message.sd_header() {
+            Ok((received.source, someip_header, sd_header.to_owned()))
         } else {
-            // If we don't have a receiver, we should return a future that never resolves
-            future::pending().await
+            Err(Error::UnexpectedDiscoveryMessage(someip_header))
         }
     }
 
     /// Receive from any bound unicast socket. Returns the first message ready
     /// from any socket. If no sockets are bound, returns a future that never resolves.
+    ///
+    /// A unicast socket whose loop has exited (`poll_receive` returns
+    /// `Poll::Ready(None)`) is evicted from the map immediately rather
+    /// than having `Err(SocketClosedUnexpectedly)` returned once per
+    /// poll forever, which would CPU-pin the run-loop and flood the
+    /// update stream.
     async fn receive_any_unicast(
-        unicast_sockets: &mut HashMap<u16, SocketManager<PayloadDefinitions>>,
+        unicast_sockets: &mut FnvIndexMap<
+            u16,
+            SocketManager<PayloadDefinitions, C>,
+            UNICAST_SOCKETS_CAP,
+        >,
     ) -> Result<ReceivedMessage<PayloadDefinitions>, Error> {
         if unicast_sockets.is_empty() {
             return future::pending().await;
         }
 
-        // Use poll_fn to manually poll each socket's receiver
         std::future::poll_fn(|cx| {
-            for socket in unicast_sockets.values_mut() {
+            // Collect ports of any sockets that report `Ready(None)`
+            // (loop has exited). Evict them after the iteration so we
+            // do not mutate the map while iterating it.
+            let mut dead_ports: heapless::Vec<u16, UNICAST_SOCKETS_CAP> = heapless::Vec::new();
+            let mut delivered: Option<Result<ReceivedMessage<PayloadDefinitions>, Error>> = None;
+            for (port, socket) in unicast_sockets.iter_mut() {
                 if let Poll::Ready(result) = socket.poll_receive(cx) {
-                    return Poll::Ready(match result {
-                        Some(msg) => msg,
-                        None => Err(Error::SocketClosedUnexpectedly),
-                    });
+                    match result {
+                        Some(msg) => {
+                            delivered = Some(msg);
+                            break;
+                        }
+                        None => {
+                            // Mark for eviction; keep scanning others.
+                            let _ = dead_ports.push(*port);
+                        }
+                    }
                 }
             }
-            Poll::Pending
+            for port in &dead_ports {
+                unicast_sockets.remove(port);
+                tracing::warn!("Unicast socket on port {port} closed; evicted from registry");
+            }
+            if let Some(msg) = delivered {
+                Poll::Ready(msg)
+            } else if unicast_sockets.is_empty() {
+                // The last socket just got evicted; fall through to a
+                // pending state so the next bind triggers a fresh poll.
+                Poll::Pending
+            } else if !dead_ports.is_empty() {
+                // At least one socket got evicted but others remain;
+                // re-poll so the caller observes the next ready event
+                // promptly instead of waiting on a stale waker.
+                cx.waker().wake_by_ref();
+                Poll::Pending
+            } else {
+                Poll::Pending
+            }
         })
         .await
     }
@@ -432,52 +670,72 @@ where
                             self.interface
                         );
                         self.unbind_discovery().await;
-                        self.request_queue
-                            .push_front(ControlMessage::SetInterface(interface, response));
+                        // Re-enqueue after pop. The slot we popped is free,
+                        // so `push_front` should never fail here — but if a
+                        // future refactor breaks that invariant, reject via
+                        // the capacity path instead of silently dropping the
+                        // response oneshot (matches the primary `push_back`
+                        // overflow arm in the control-channel receiver).
+                        if let Err(rejected) = self
+                            .request_queue
+                            .push_front(ControlMessage::SetInterface(interface, response))
+                        {
+                            error!("request_queue push_front failed after pop — invariant broken");
+                            rejected.reject_with_capacity("request_queue");
+                        }
                         return;
                     }
                     if self.interface != interface {
                         self.set_interface(interface);
-                        self.request_queue
-                            .push_front(ControlMessage::SetInterface(interface, response));
-                        return;
-                    }
-                    info!("Binding to interface: {}", interface);
-                    let bind_result = self.bind_discovery();
-                    match &bind_result {
-                        Ok(()) => {
-                            info!("Successfully Bound to interface: {}", interface);
-                        }
-                        Err(e) => {
-                            warn!("Failed to bind to interface: {}. Error: {:?}", interface, e);
+                        // See re-enqueue note above.
+                        if let Err(rejected) = self
+                            .request_queue
+                            .push_front(ControlMessage::SetInterface(interface, response))
+                        {
+                            error!("request_queue push_front failed after pop — invariant broken");
+                            rejected.reject_with_capacity("request_queue");
                         }
+                        return;
                     }
-                    if response.send(bind_result).is_err() {
-                        warn!("SetInterface response receiver dropped (caller canceled)");
+                    // Reaching here: discovery is not bound AND
+                    // `interface == self.interface`. Do nothing — the
+                    // user expressed no change of intent. Previously
+                    // this branch silently called `bind_discovery()`
+                    // as a side effect, which surprised callers
+                    // probing the current interface via
+                    // `client.set_interface(client.interface()).await`.
+                    debug!("SetInterface: no-op (interface unchanged, discovery not bound)");
+                    if response.send(Ok(())).is_err() {
+                        debug!("SetInterface: caller dropped the response receiver");
                     }
                 }
                 ControlMessage::BindDiscovery(response) => {
-                    let result = self.bind_discovery();
+                    let result = self.bind_discovery().await;
                     if response.send(result).is_err() {
-                        warn!("BindDiscovery response receiver dropped (caller canceled)");
+                        debug!("BindDiscovery: caller dropped the response receiver");
                     }
                 }
                 ControlMessage::UnbindDiscovery(response) => {
                     self.unbind_discovery().await;
                     if response.send(Ok(())).is_err() {
-                        warn!("UnbindDiscovery response receiver dropped (caller canceled)");
+                        debug!("UnbindDiscovery: caller dropped the response receiver");
                     }
                 }
                 ControlMessage::SendSD(target, header, response) => {
                     // SD Message, If the discovery socket is not bound, bind it
                     match &mut self.discovery_socket {
                         None => {
-                            match self.bind_discovery() {
+                            match self.bind_discovery().await {
                                 Ok(()) => {
-                                    // Discovery socket successfully bound, send the message on the next loop
-                                    self.request_queue.push_front(ControlMessage::SendSD(
-                                        target, header, response,
-                                    ));
+                                    // See re-enqueue note on SetInterface above.
+                                    if let Err(rejected) = self.request_queue.push_front(
+                                        ControlMessage::SendSD(target, header, response),
+                                    ) {
+                                        error!(
+                                            "request_queue push_front failed after pop — invariant broken"
+                                        );
+                                        rejected.reject_with_capacity("request_queue");
+                                    }
                                 }
                                 Err(e) => {
                                     error!(
@@ -485,8 +743,8 @@ where
                                         e
                                     );
                                     if response.send(Err(e)).is_err() {
-                                        warn!(
-                                            "SendSD error response receiver dropped (caller canceled)"
+                                        debug!(
+                                            "SendSD (bind-err path): caller dropped the response receiver"
                                         );
                                     }
                                 }
@@ -505,7 +763,7 @@ where
                                 .send(target, message)
                                 .await;
                             if response.send(send_result).is_err() {
-                                warn!("SendSD response receiver dropped (caller canceled)");
+                                debug!("SendSD: caller dropped the response receiver");
                             }
                         }
                     }
@@ -517,7 +775,7 @@ where
                     local_port,
                     response,
                 ) => {
-                    self.service_registry.insert(
+                    let insert_result = self.service_registry.insert(
                         ServiceInstanceId {
                             service_id,
                             instance_id,
@@ -529,12 +787,23 @@ where
                             minor_version: 0xFFFF_FFFF,
                         },
                     );
-                    debug!(
-                        "Added endpoint for service 0x{:04X}.0x{:04X} -> {}",
-                        service_id, instance_id, addr,
-                    );
-                    if response.send(Ok(())).is_err() {
-                        warn!("AddEndpoint response receiver dropped (caller canceled)");
+                    let outcome = if insert_result.is_ok() {
+                        debug!(
+                            "Added endpoint for service 0x{:04X}.0x{:04X} -> {}",
+                            service_id, instance_id, addr,
+                        );
+                        Ok(())
+                    } else {
+                        warn!(
+                            "service_registry at capacity ({}); cannot add 0x{:04X}.0x{:04X}",
+                            crate::client::service_registry::SERVICE_REGISTRY_CAP,
+                            service_id,
+                            instance_id,
+                        );
+                        Err(Error::Capacity("service_registry"))
+                    };
+                    if response.send(outcome).is_err() {
+                        debug!("AddEndpoint: caller dropped the response receiver");
                     }
                 }
                 ControlMessage::RemoveEndpoint(service_id, instance_id, response) => {
@@ -547,7 +816,7 @@ where
                         service_id, instance_id,
                     );
                     if response.send(Ok(())).is_err() {
-                        warn!("RemoveEndpoint response receiver dropped (caller canceled)");
+                        debug!("RemoveEndpoint: caller dropped the response receiver");
                     }
                 }
                 ControlMessage::SendToService {
@@ -571,7 +840,7 @@ where
                     let source_port = if desired_port == 0 {
                         // Ephemeral: auto-bind only if no sockets exist, then use first
                         if self.unicast_sockets.is_empty() {
-                            match self.bind_unicast(0) {
+                            match self.bind_unicast(0).await {
                                 Ok(port) => {
                                     debug!("Auto-bound unicast on port {} for SendToService", port);
                                     port
@@ -586,7 +855,7 @@ where
                         }
                     } else {
                         // Specific port: bind if not already bound
-                        match self.bind_unicast(desired_port) {
+                        match self.bind_unicast(desired_port).await {
                             Ok(port) => port,
                             Err(e) => {
                                 let _ = send_complete.send(Err(e));
@@ -596,30 +865,37 @@ where
                     };
                     let socket = self.unicast_sockets.get_mut(&source_port).unwrap();
 
-                    // Stamp request ID
+                    // Stamp request ID with the CURRENT session counter,
+                    // but only advance it on successful send. A failed
+                    // send should not chew through the 16-bit session
+                    // space — under transient transport failure that
+                    // could wrap toward in-flight pending_responses
+                    // far faster than expected.
                     let request_id =
                         (u32::from(self.client_id) << 16) | u32::from(self.session_counter);
                     message.set_request_id(request_id);
-                    self.session_counter = self.session_counter.wrapping_add(1);
-                    if self.session_counter == 0 {
-                        self.session_counter = 1;
-                    }
 
                     let send_result = socket.send(target, message).await;
                     match send_result {
                         Ok(()) => {
+                            // Advance the counter only after a real
+                            // wire transmission. Skip 0 on wrap.
+                            self.session_counter = self.session_counter.wrapping_add(1);
+                            if self.session_counter == 0 {
+                                self.session_counter = 1;
+                            }
                             let _ = send_complete.send(Ok(()));
-                            self.pending_responses.insert(request_id, response);
+                            self.track_or_reject_pending_response(request_id, response);
                         }
                         Err(e) => {
                             let _ = send_complete.send(Err(e));
                         }
                     }
                 }
-                #[cfg(test)]
+                #[cfg(all(test, feature = "client-tokio"))]
                 ControlMessage::ForceSdSessionWrappedForTest(wrapped, response) => {
                     self.sd_session_has_wrapped = wrapped;
-                    let _ = response.send(());
+                    let _ = response.send(Ok(()));
                 }
                 ControlMessage::QueryRebootFlag(response) => {
                     // Prefer the live socket's tracked flag when bound. When
@@ -632,11 +908,13 @@ where
                     // next `reboot_flag()` call.
                     let flag = if let Some(socket) = self.discovery_socket.as_ref() {
                         socket.reboot_flag()
+                    } else if self.sd_session_has_wrapped {
+                        crate::protocol::sd::RebootFlag::Continuous
                     } else {
-                        crate::protocol::sd::RebootFlag::from(!self.sd_session_has_wrapped)
+                        crate::protocol::sd::RebootFlag::RecentlyRebooted
                     };
-                    if response.send(flag).is_err() {
-                        warn!("QueryRebootFlag response receiver dropped (caller canceled)");
+                    if response.send(Ok(flag)).is_err() {
+                        debug!("QueryRebootFlag: caller dropped the response receiver");
                     }
                 }
                 ControlMessage::Subscribe {
@@ -654,38 +932,67 @@ where
                         instance_id,
                     };
                     if self.service_registry.get(id).is_none() {
-                        let _ = response.send(Err(Error::ServiceNotFound));
+                        if response.send(Err(Error::ServiceNotFound)).is_err() {
+                            debug!(
+                                "Subscribe (ServiceNotFound): caller dropped the response receiver (expected for subscribe_no_wait)"
+                            );
+                        }
                         return;
                     }
 
                     // Bind unicast on the requested port (0 = ephemeral)
-                    let unicast_port = match self.bind_unicast(client_port) {
+                    let unicast_port = match self.bind_unicast(client_port).await {
                         Ok(port) => {
                             debug!("Bound unicast on port {} for Subscribe", port);
                             port
                         }
                         Err(e) => {
-                            let _ = response.send(Err(e));
+                            if response.send(Err(e)).is_err() {
+                                debug!(
+                                    "Subscribe (bind-err): caller dropped the response receiver"
+                                );
+                            }
                             return;
                         }
                     };
 
                     // Auto-bind discovery if not bound (re-queue like SendSD does)
                     match &mut self.discovery_socket {
-                        None => match self.bind_discovery() {
+                        None => match self.bind_discovery().await {
                             Ok(()) => {
-                                self.request_queue.push_front(ControlMessage::Subscribe {
-                                    service_id,
-                                    instance_id,
-                                    major_version,
-                                    ttl,
-                                    event_group_id,
-                                    client_port,
-                                    response,
-                                });
+                                // Re-enqueue the Subscribe carrying the
+                                // ALREADY-bound `unicast_port` so pass-2
+                                // hits the `bind_unicast` dedupe path
+                                // instead of allocating a second
+                                // ephemeral socket. Carrying the
+                                // original `client_port=0` would
+                                // re-bind ephemerally and leak the
+                                // original socket into
+                                // `unicast_sockets` until the slot cap
+                                // hit.
+                                if let Err(rejected) =
+                                    self.request_queue.push_front(ControlMessage::Subscribe {
+                                        service_id,
+                                        instance_id,
+                                        major_version,
+                                        ttl,
+                                        event_group_id,
+                                        client_port: unicast_port,
+                                        response,
+                                    })
+                                {
+                                    error!(
+                                        "request_queue push_front failed after pop — invariant broken"
+                                    );
+                                    rejected.reject_with_capacity("request_queue");
+                                }
                             }
                             Err(e) => {
-                                let _ = response.send(Err(e));
+                                if response.send(Err(e)).is_err() {
+                                    debug!(
+                                        "Subscribe (discovery-bind-err): caller dropped the response receiver"
+                                    );
+                                }
                             }
                         },
                         Some(discovery_socket) => {
@@ -714,7 +1021,9 @@ where
                                 .send(target, message)
                                 .await;
                             if response.send(send_result).is_err() {
-                                warn!("Subscribe response receiver dropped (caller canceled)");
+                                debug!(
+                                    "Subscribe: caller dropped the response receiver (expected for subscribe_no_wait)"
+                                );
                             }
                         }
                     }
@@ -724,10 +1033,16 @@ where
     }
 
     #[allow(clippy::too_many_lines)]
-    fn run(mut self) {
-        tokio::spawn(async move {
-            info!("SOME/IP Client processing loop started");
-            loop {
+    async fn run_future(mut self) {
+        info!("SOME/IP Client processing loop started");
+        loop {
+            // Scope the `&mut self` destructure + pinned per-iteration
+            // futures so all borrows of `self` drop before we call
+            // `self.handle_control_message().await` below. `pin_mut!`
+            // creates stack-pinned locals that outlive the select
+            // macro, so the inner block is required to release those
+            // borrows.
+            let should_break = {
                 let Self {
                     control_receiver,
                     pending_responses,
@@ -738,65 +1053,100 @@ where
                     session_tracker,
                     service_registry,
                     run,
+                    timer,
                     ..
                 } = &mut self;
+                // Build fresh per-iteration futures and fuse them for
+                // `select!`'s `FusedFuture + Unpin` bound.
+                // `receive_discovery` / `receive_any_unicast` are
+                // async fns that are not `Unpin`; the `Timer::sleep`
+                // future likewise. Stack-pinning via `pin_mut!`
+                // satisfies both.
+                //
+                // The 125ms idle tick goes through the caller-supplied
+                // `Timer` impl. On `client-tokio` builds this is
+                // `TokioTimer` (wrapping `tokio::time::sleep`); bare-metal
+                // builds plug in their own (e.g. an `embassy_time` shim).
+                let control_fut = control_receiver.recv().fuse();
+                let sleep_fut = timer.sleep(core::time::Duration::from_millis(125)).fuse();
+                let discovery_fut = Self::receive_discovery(discovery_socket).fuse();
+                let unicast_fut = Self::receive_any_unicast(unicast_sockets).fuse();
+                pin_mut!(control_fut, sleep_fut, discovery_fut, unicast_fut);
+
+                // `select!` (not `select_biased!`) randomizes the
+                // arm check order each poll so no single arm can
+                // starve the others under sustained load. Matches
+                // the original `tokio::select!` fairness behavior.
                 select! {
-                    () = tokio::time::sleep(std::time::Duration::from_millis(125)) => {}
-                    // Receive a control message
-                    ctrl = control_receiver.recv() => {
-                        if let Some(ctrl) = ctrl {
-                            debug!("Received control message: {:?}", ctrl);
-                            request_queue.push_back(ctrl);
-                        } else {
-                            // The sender has been dropped, so we should exit
-                            *run = false;
+                // Receive a control message
+                ctrl = control_fut => {
+                    if let Some(ctrl) = ctrl {
+                        debug!("Received control message: {:?}", ctrl);
+                        if let Err(rejected) = request_queue.push_back(ctrl) {
+                            // Queue full: notify the rejected message's
+                            // oneshot senders with `Error::Capacity` so
+                            // callers see a typed overload error rather
+                            // than a `RecvError` (which `client::mod`
+                            // maps to `Error::Shutdown`, conflating
+                            // overload with lifecycle failure).
+                            warn!(
+                                "request_queue at capacity ({}); rejecting control message with Capacity error",
+                                REQUEST_QUEUE_CAP
+                            );
+                            rejected.reject_with_capacity("request_queue");
                         }
+                    } else {
+                        // The sender has been dropped, so we should exit
+                        *run = false;
                     }
-                    // Receive a discovery message
-                    discovery = Inner::receive_discovery(discovery_socket) => {
-                        trace!("Received discovery message: {:?}", discovery);
-                        match discovery {
-                            Ok((source, someip_header, sd_header)) => {
-                                // Extract session ID from SOME/IP request_id (lower 16 bits)
-                                let session_id = (someip_header.request_id() & 0xFFFF) as u16;
-                                let sd_payload = PayloadDefinitions::new_sd_payload(&sd_header);
-                                // Extract reboot flag from the SD payload flags
-                                let reboot_flag = sd_payload
-                                    .sd_flags()
-                                    .map_or(crate::protocol::sd::RebootFlag::Continuous, |f| {
-                                        f.reboot()
-                                    });
-
-                                // Track sender session/reboot state for every SD entry
-                                // that identifies a service instance, not only
-                                // offer/stop-offer entries. This ensures reboot
-                                // detection works for all SD traffic (FindService,
-                                // Subscribe, SubscribeAck, etc.).
-                                let mut rebooted = false;
-                                for (svc_id, inst_id) in sd_payload.service_instances() {
-                                    let verdict = session_tracker.check(
-                                        source,
-                                        TransportKind::Multicast,
-                                        svc_id,
-                                        inst_id,
-                                        session_id,
-                                        reboot_flag,
-                                    );
-                                    if verdict == SessionVerdict::Reboot {
-                                        rebooted = true;
-                                    }
+                }
+                () = sleep_fut => {}
+                // Receive a discovery message
+                discovery = discovery_fut => {
+                    trace!("Received discovery message: {:?}", discovery);
+                    match discovery {
+                        Ok((source, someip_header, sd_header)) => {
+                            // Extract session ID from SOME/IP request_id (lower 16 bits)
+                            let session_id = (someip_header.request_id() & 0xFFFF) as u16;
+                            let sd_payload = PayloadDefinitions::new_sd_payload(&sd_header);
+                            // Extract reboot flag from the SD payload flags
+                            let reboot_flag = sd_payload
+                                .sd_flags()
+                                .map_or(crate::protocol::sd::RebootFlag::Continuous, |f| {
+                                    f.reboot()
+                                });
+
+                            // Track sender session/reboot state for every SD entry
+                            // that identifies a service instance, not only
+                            // offer/stop-offer entries. This ensures reboot
+                            // detection works for all SD traffic (FindService,
+                            // Subscribe, SubscribeAck, etc.).
+                            let mut rebooted = false;
+                            for (svc_id, inst_id) in sd_payload.service_instances() {
+                                let verdict = session_tracker.check(
+                                    source,
+                                    TransportKind::Multicast,
+                                    svc_id,
+                                    inst_id,
+                                    session_id,
+                                    reboot_flag,
+                                );
+                                if verdict == SessionVerdict::Reboot {
+                                    rebooted = true;
                                 }
+                            }
 
-                                // Auto-populate service registry from offer/stop-offer
-                                // SD entries.
-                                for ep in sd_payload.offered_endpoints() {
-                                    let id = ServiceInstanceId {
-                                        service_id: ep.service_id,
-                                        instance_id: ep.instance_id,
-                                    };
-                                    if ep.is_offer {
-                                        if let Some(addr) = ep.addr {
-                                            service_registry.insert(
+                            // Auto-populate service registry from offer/stop-offer
+                            // SD entries.
+                            for ep in sd_payload.offered_endpoints() {
+                                let id = ServiceInstanceId {
+                                    service_id: ep.service_id,
+                                    instance_id: ep.instance_id,
+                                };
+                                if ep.is_offer {
+                                    if let Some(addr) = ep.addr {
+                                        if service_registry
+                                            .insert(
                                                 id,
                                                 ServiceEndpointInfo {
                                                     addr,
@@ -804,75 +1154,100 @@ where
                                                     major_version: ep.major_version,
                                                     minor_version: ep.minor_version,
                                                 },
-                                            );
+                                            )
+                                            .is_ok()
+                                        {
                                             trace!(
                                                 "Registry: added 0x{:04X}.0x{:04X} -> {}",
                                                 ep.service_id, ep.instance_id, addr,
                                             );
+                                        } else {
+                                            warn!(
+                                                "Registry full; dropped offer for 0x{:04X}.0x{:04X}",
+                                                ep.service_id, ep.instance_id,
+                                            );
                                         }
-                                    } else {
-                                        service_registry.remove(id);
-                                        trace!(
-                                            "Registry: removed 0x{:04X}.0x{:04X}",
-                                            ep.service_id, ep.instance_id,
-                                        );
                                     }
+                                } else {
+                                    service_registry.remove(id);
+                                    trace!(
+                                        "Registry: removed 0x{:04X}.0x{:04X}",
+                                        ep.service_id, ep.instance_id,
+                                    );
                                 }
-
-                                if rebooted {
-                                    let _ = update_sender.send(ClientUpdate::SenderRebooted(source));
-                                }
-
-                                let discovery_msg = DiscoveryMessage {
-                                    source,
-                                    someip_header,
-                                    sd_header,
-                                };
-                                let _ = update_sender.send(ClientUpdate::DiscoveryUpdated(discovery_msg));
                             }
-                            Err(err) => {
-                                error!("Error receiving discovery message: {:?}", err);
-                                let _ = update_sender.send(ClientUpdate::Error(err));
+
+                            if rebooted {
+                                let _ = update_sender.send_now(ClientUpdate::SenderRebooted(source));
                             }
+
+                            let discovery_msg = DiscoveryMessage {
+                                source,
+                                someip_header,
+                                sd_header,
+                            };
+                            let _ = update_sender.send_now(ClientUpdate::DiscoveryUpdated(discovery_msg));
                         }
-                     }
-                     unicast = Inner::receive_any_unicast(unicast_sockets) => {
-                         trace!("Received unicast message: {:?}", unicast);
-                         match unicast {
-                             Ok(received) => {
-                                 let ReceivedMessage { message: received_message, e2e_status, .. } = received;
-                                 // Check if this matches a pending request-response by request_id
-                                 let request_id = received_message.header().request_id();
-                                 if let Some(sender) = pending_responses.remove(&request_id) {
-                                     let _ = sender.send(Ok(received_message.payload().clone()));
-                                     continue;
-                                 }
-                                 // Not a response — forward as ClientUpdate::Unicast
-                                 let _ = update_sender.send(ClientUpdate::Unicast { message: received_message, e2e_status });
-                             }
-                             Err(err) => {
-                                 let _ = update_sender.send(ClientUpdate::Error(err));
+                        Err(err) => {
+                            error!("Error receiving discovery message: {:?}", err);
+                            let _ = update_sender.send_now(ClientUpdate::Error(err));
+                        }
+                    }
+                 }
+                 unicast = unicast_fut => {
+                     trace!("Received unicast message: {:?}", unicast);
+                     match unicast {
+                         Ok(received) => {
+                             let ReceivedMessage { message: received_message, e2e_status, .. } = received;
+                             // Check if this matches a pending request-response by request_id
+                             let request_id = received_message.header().request_id();
+                             if let Some(sender) = pending_responses.remove(&request_id) {
+                                 let _ = sender.send(Ok(received_message.payload().clone()));
+                                 continue;
                              }
+                             // Not a response — forward as ClientUpdate::Unicast
+                             let _ = update_sender.send_now(ClientUpdate::Unicast { message: received_message, e2e_status });
+                         }
+                         Err(err) => {
+                             let _ = update_sender.send_now(ClientUpdate::Error(err));
                          }
                      }
+                 }
                 }
-                if !*run {
-                    info!("SOME/IP Client processing loop exiting");
-                    break;
-                }
-                self.handle_control_message().await;
+                !*run
+            };
+            if should_break {
+                info!("SOME/IP Client processing loop exiting");
+                break;
             }
-        });
+            self.handle_control_message().await;
+        }
     }
 }
 
-#[cfg(test)]
+#[cfg(all(test, feature = "client-tokio"))]
 mod tests {
     use super::*;
     use crate::protocol::sd::test_support::{TestPayload, empty_sd_header};
+    use crate::transport::{OneshotRecv, UnboundedRecv};
     use std::format;
-
-    type TestControl = ControlMessage<TestPayload>;
+    use tokio::sync::mpsc::Sender;
+    use tokio::sync::{mpsc, oneshot};
+
+    type TestControl = ControlMessage<TestPayload, TokioChannels>;
+    /// Type alias for the fully-spelled `Inner` flavor used throughout
+    /// these tests: tokio everything, default `Arc<Mutex<E2ERegistry>>`
+    /// and `Arc<RwLock<Ipv4Addr>>` handles.
+    type TestInner = Inner<
+        TestPayload,
+        crate::tokio_transport::TokioTimer,
+        Arc<Mutex<E2ERegistry>>,
+        TokioChannels,
+        crate::client::bind_dispatch::SpawnerDispatch<
+            crate::tokio_transport::TokioTransport,
+            TokioSpawner,
+        >,
+    >;
 
     #[test]
     fn test_control_message_constructors() {
@@ -906,6 +1281,76 @@ mod tests {
         assert!(matches!(msg, ControlMessage::Subscribe { .. }));
     }
 
+    /// `reject_with_capacity` must notify every oneshot sender inside a
+    /// rejected `ControlMessage` with `Err(Error::Capacity(..))` — for
+    /// `SendToService`, _both_ the `send_complete` and `response`
+    /// channels. Dropping either channel would let a caller's `.unwrap()`
+    /// (or `.expect(...)` inside `PendingResponse::response()`) panic on
+    /// the resulting `RecvError`, which is exactly what Copilot flagged.
+    #[test]
+    fn reject_with_capacity_notifies_every_sender() {
+        use crate::transport::OneshotCancelled;
+        use futures::FutureExt;
+
+        fn expect_capacity<F>(rx: F, label: &str)
+        where
+            F: core::future::Future<Output = Result<Result<(), Error>, OneshotCancelled>>,
+        {
+            match rx.now_or_never() {
+                Some(Ok(Err(Error::Capacity(s)))) => assert_eq!(s, "request_queue", "{label}"),
+                other => panic!("{label}: expected Some(Ok(Err(Capacity))), got {other:?}"),
+            }
+        }
+
+        // Variants carrying a single Result<(), Error> response sender.
+        let (rx, msg) = TestControl::set_interface(Ipv4Addr::LOCALHOST);
+        msg.reject_with_capacity("request_queue");
+        expect_capacity(rx.recv(), "SetInterface");
+
+        let (rx, msg) = TestControl::bind_discovery();
+        msg.reject_with_capacity("request_queue");
+        expect_capacity(rx.recv(), "BindDiscovery");
+
+        let (rx, msg) = TestControl::unbind_discovery();
+        msg.reject_with_capacity("request_queue");
+        expect_capacity(rx.recv(), "UnbindDiscovery");
+
+        let target = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 1234);
+        let (rx, msg) = TestControl::send_sd(target, empty_sd_header());
+        msg.reject_with_capacity("request_queue");
+        expect_capacity(rx.recv(), "SendSD");
+
+        let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 5000);
+        let (rx, msg) = TestControl::add_endpoint(0x1234, 0x0001, addr, 0);
+        msg.reject_with_capacity("request_queue");
+        expect_capacity(rx.recv(), "AddEndpoint");
+
+        let (rx, msg) = TestControl::remove_endpoint(0x1234, 0x0001);
+        msg.reject_with_capacity("request_queue");
+        expect_capacity(rx.recv(), "RemoveEndpoint");
+
+        let (rx, msg) = TestControl::subscribe(0x1234, 0x0001, 1, 3, 0x01, 0);
+        msg.reject_with_capacity("request_queue");
+        expect_capacity(rx.recv(), "Subscribe");
+
+        // SendToService carries two senders — both must be notified so that
+        // neither `send_rx.recv().await.unwrap()?` nor `PendingResponse::response()`
+        // panics.
+        let message = Message::<TestPayload>::new_sd(1, &empty_sd_header());
+        let (send_rx, resp_rx, msg) = TestControl::send_to_service(0x1234, 0x0001, message);
+        msg.reject_with_capacity("request_queue");
+        expect_capacity(send_rx.recv(), "SendToService.send_complete");
+        // resp_rx has type Result<TestPayload, Error> — check it separately
+        match resp_rx.recv().now_or_never() {
+            Some(Ok(Err(Error::Capacity(s)))) => {
+                assert_eq!(s, "request_queue", "SendToService.response");
+            }
+            other => {
+                panic!("SendToService.response: expected Some(Ok(Err(Capacity))), got {other:?}")
+            }
+        }
+    }
+
     #[test]
     fn test_control_message_debug() {
         let (_rx, msg) = TestControl::set_interface(Ipv4Addr::LOCALHOST);
@@ -946,29 +1391,329 @@ mod tests {
         assert!(s.contains("event_group_id"));
     }
 
+    /// Build an [`Inner`] without spawning the run loop, for direct
+    /// unit-testing of state-mutating methods.
+    fn make_inner_for_test() -> TestInner {
+        let (_control_sender, control_receiver) =
+            TokioChannels::bounded::<ControlMessage<TestPayload, TokioChannels>, 4>();
+        let (update_sender, _update_receiver) =
+            TokioChannels::unbounded::<ClientUpdate<TestPayload>>();
+        Inner {
+            control_receiver,
+            request_queue: Deque::new(),
+            pending_responses: FnvIndexMap::new(),
+            update_sender,
+            interface: Ipv4Addr::LOCALHOST,
+            discovery_socket: None,
+            unicast_sockets: FnvIndexMap::new(),
+            session_tracker: SessionTracker::default(),
+            service_registry: ServiceRegistry::default(),
+            run: true,
+            client_id: 0x1234,
+            session_counter: 1,
+            sd_session_id: 1,
+            sd_session_has_wrapped: false,
+            e2e_registry: Arc::new(Mutex::new(E2ERegistry::new())),
+            multicast_loopback: false,
+            dispatch: crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            timer: TokioTimer,
+            phantom: core::marker::PhantomData,
+        }
+    }
+
+    #[tokio::test]
+    async fn bind_unicast_returns_capacity_error_when_map_full() {
+        let mut inner = make_inner_for_test();
+
+        // Fill unicast_sockets to capacity using ephemeral binds (port 0).
+        // Each call with port=0 creates a fresh socket on a distinct OS-chosen
+        // port, so the cap is what gates — not duplicate-key collapse.
+        for _ in 0..UNICAST_SOCKETS_CAP {
+            let bound = inner
+                .bind_unicast(0)
+                .await
+                .expect("ephemeral bind below cap should succeed");
+            assert_ne!(bound, 0, "OS should assign a non-zero ephemeral port");
+        }
+        assert_eq!(inner.unicast_sockets.len(), UNICAST_SOCKETS_CAP);
+
+        // The next bind must fail with Error::Capacity and must NOT bind a
+        // socket (pre-bind capacity check).
+        let err = inner
+            .bind_unicast(0)
+            .await
+            .expect_err("bind past cap should fail");
+        match err {
+            Error::Capacity(name) => assert_eq!(name, "unicast_sockets"),
+            other => panic!("expected Error::Capacity, got {other:?}"),
+        }
+        assert_eq!(
+            inner.unicast_sockets.len(),
+            UNICAST_SOCKETS_CAP,
+            "map should remain at capacity, not bind-then-drop a new socket"
+        );
+    }
+
+    /// Happy path: with room in `pending_responses`, the helper tracks
+    /// the entry and does NOT signal the caller — the sender stays
+    /// alive so a future unicast reply can resolve it.
+    #[tokio::test]
+    async fn track_or_reject_pending_response_inserts_when_room_available() {
+        use futures::FutureExt;
+        let mut inner = make_inner_for_test();
+        let (tx, rx) = oneshot::channel::<Result<TestPayload, Error>>();
+
+        inner.track_or_reject_pending_response(0xDEAD_BEEF, tx);
+
+        assert_eq!(inner.pending_responses.len(), 1);
+        assert!(
+            inner.pending_responses.contains_key(&0xDEAD_BEEF),
+            "entry should be keyed by the provided request_id",
+        );
+        // Receiver is still waiting — helper did NOT pre-emptively
+        // resolve it with a capacity error on the happy path.
+        assert!(
+            rx.now_or_never().is_none(),
+            "receiver must still be pending when the insert succeeds",
+        );
+    }
+
+    /// Regression guard against cb1d0d1: without explicit rejection,
+    /// the dropped Sender would cause `PendingResponse::response()` to
+    /// panic on `RecvError` rather than returning a clean
+    /// `Err(Error::Capacity("pending_responses"))`. Exercises the
+    /// overflow branch in `track_or_reject_pending_response`, which is
+    /// the same branch the `SendToService` run-loop arm now delegates
+    /// to.
+    #[tokio::test]
+    async fn track_or_reject_pending_response_rejects_on_saturation() {
+        let mut inner = make_inner_for_test();
+
+        // Fill the map to capacity with dummy oneshot senders. The
+        // receivers are stashed to keep each channel open for the
+        // remainder of the test — on `tokio::sync::oneshot`, dropping
+        // the receiver does not drop the sender; it flips the sender
+        // into a state where `send()` fails with the value returned.
+        // The stash is what lets us later observe `sender.send(...)`
+        // succeeding against a still-open channel when the overflow
+        // case completes the displaced sender with a capacity error.
+        let mut stashed: std::vec::Vec<oneshot::Receiver<Result<TestPayload, Error>>> =
+            std::vec::Vec::with_capacity(PENDING_RESPONSES_CAP);
+        for i in 0..PENDING_RESPONSES_CAP {
+            let (tx, rx) = oneshot::channel::<Result<TestPayload, Error>>();
+            inner
+                .pending_responses
+                .insert(
+                    u32::try_from(i).expect("PENDING_RESPONSES_CAP fits in u32"),
+                    tx,
+                )
+                .expect("filling under cap must succeed");
+            stashed.push(rx);
+        }
+        assert_eq!(inner.pending_responses.len(), PENDING_RESPONSES_CAP);
+
+        // One more entry — map is full, the helper must recover the
+        // sender from the failed insert and deliver an explicit
+        // capacity error on it.
+        let (overflow_tx, overflow_rx) = oneshot::channel::<Result<TestPayload, Error>>();
+        let overflow_key: u32 = 0xFFFF_FFFE;
+        inner.track_or_reject_pending_response(overflow_key, overflow_tx);
+
+        // Map size unchanged — the overflow attempt was rejected, not
+        // silently dropping an existing entry.
+        assert_eq!(
+            inner.pending_responses.len(),
+            PENDING_RESPONSES_CAP,
+            "overflow must not evict existing entries",
+        );
+        assert!(
+            !inner.pending_responses.contains_key(&overflow_key),
+            "overflowed key must not be in the map",
+        );
+
+        // The caller's receiver resolves to Err(Capacity), not a
+        // panicking RecvError — this is the invariant cb1d0d1 fixes.
+        let result = overflow_rx
+            .await
+            .expect("receiver should get the explicit Err, not RecvError from dropped Sender");
+        match result {
+            Err(Error::Capacity(tag)) => assert_eq!(tag, "pending_responses"),
+            other => panic!("expected Err(Error::Capacity(\"pending_responses\")), got {other:?}"),
+        }
+    }
+
+    /// If a `request_id` is reused while an older pending entry is still
+    /// live (e.g. `session_counter` wrap-around), `insert` returns
+    /// `Ok(Some(old_sender))`. Without handling that case, the displaced
+    /// sender is dropped and the caller awaiting the original request
+    /// hits `RecvError` (which `PendingResponse::response()` treats as a
+    /// fatal panic). This test guards against that: the displaced
+    /// sender must be completed with
+    /// `Err(Error::Capacity("pending_responses"))` so the original
+    /// caller gets a clean `Result` instead of a panicking `RecvError`.
+    #[tokio::test]
+    async fn track_or_reject_pending_response_completes_displaced_sender() {
+        use futures::FutureExt;
+
+        let mut inner = make_inner_for_test();
+        let key: u32 = 0xCAFE_F00D;
+
+        // First tracking: the sender lives in the map.
+        let (first_tx, first_rx) = oneshot::channel::<Result<TestPayload, Error>>();
+        inner.track_or_reject_pending_response(key, first_tx);
+        assert_eq!(inner.pending_responses.len(), 1);
+
+        // Second tracking with the same key: displaces the first sender.
+        let (second_tx, second_rx) = oneshot::channel::<Result<TestPayload, Error>>();
+        inner.track_or_reject_pending_response(key, second_tx);
+
+        // Map still has one entry — the second one replaced the first.
+        assert_eq!(inner.pending_responses.len(), 1);
+        assert!(inner.pending_responses.contains_key(&key));
+
+        // The original caller's receiver resolves to Err(Capacity) — not
+        // a dropped-sender RecvError.
+        let displaced_result = first_rx.await.expect(
+            "displaced sender must be completed with a real Err, \
+             not dropped (which would produce RecvError)",
+        );
+        match displaced_result {
+            Err(Error::Capacity(tag)) => assert_eq!(tag, "pending_responses"),
+            other => {
+                panic!("expected Err(Error::Capacity(\\\"pending_responses\\\")), got {other:?}")
+            }
+        }
+
+        // The new sender is still live and pending.
+        assert!(
+            second_rx.now_or_never().is_none(),
+            "replacement sender must still be pending in the map",
+        );
+    }
+
+    /// Sibling to `client_new_with_spawner_routes_socket_spawns_through_it`
+    /// in `mod.rs`, which covers the `bind_discovery` path. This one
+    /// covers `bind_unicast`: each successful ephemeral unicast bind
+    /// must submit exactly one future through the injected `Spawner`.
+    /// Without this test, a future refactor could silently revert the
+    /// unicast bind path to direct `tokio::spawn` and only the
+    /// discovery path's test would fail to catch it.
     #[tokio::test]
-    async fn test_inner_spawn_and_shutdown() {
-        let (control_sender, mut update_receiver) = Inner::<TestPayload>::spawn(
+    async fn bind_unicast_routes_through_injected_spawner() {
+        use core::sync::atomic::{AtomicUsize, Ordering};
+
+        #[derive(Clone)]
+        struct CountingSpawner {
+            count: Arc<AtomicUsize>,
+        }
+
+        impl crate::transport::Spawner for CountingSpawner {
+            fn spawn(&self, future: impl core::future::Future<Output = ()> + Send + 'static) {
+                self.count.fetch_add(1, Ordering::SeqCst);
+                // Delegate so the socket loop actually runs — matters
+                // if the caller later issues a send that awaits the
+                // loop's oneshot ack. For the pure-spawn-count
+                // assertion below it would also work to drop the
+                // future; we delegate to keep the Inner in a healthy
+                // state in case assertion ordering changes.
+                drop(tokio::spawn(future));
+            }
+        }
+
+        let count = Arc::new(AtomicUsize::new(0));
+        let spawner = CountingSpawner {
+            count: Arc::clone(&count),
+        };
+
+        // Build Inner directly with the counting spawner — same pattern
+        // as `make_inner_for_test`, but parameterized on S.
+        let (_control_sender, control_receiver) = mpsc::channel(4);
+        let (update_sender, _update_receiver) = mpsc::unbounded_channel();
+        let mut inner: Inner<
+            TestPayload,
+            TokioTimer,
+            Arc<Mutex<E2ERegistry>>,
+            TokioChannels,
+            crate::client::bind_dispatch::SpawnerDispatch<TokioTransport, CountingSpawner>,
+        > = Inner {
+            control_receiver,
+            request_queue: Deque::new(),
+            pending_responses: FnvIndexMap::new(),
+            update_sender,
+            interface: Ipv4Addr::LOCALHOST,
+            discovery_socket: None,
+            unicast_sockets: FnvIndexMap::new(),
+            session_tracker: SessionTracker::default(),
+            service_registry: ServiceRegistry::default(),
+            run: true,
+            client_id: 0x1234,
+            session_counter: 1,
+            sd_session_id: 1,
+            sd_session_has_wrapped: false,
+            e2e_registry: Arc::new(Mutex::new(E2ERegistry::new())),
+            multicast_loopback: false,
+            dispatch: crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner,
+            },
+            timer: TokioTimer,
+            phantom: core::marker::PhantomData,
+        };
+
+        // Three ephemeral binds → three distinct socket loops spawned.
+        for i in 0..3 {
+            let bound = inner
+                .bind_unicast(0)
+                .await
+                .expect("ephemeral bind should succeed");
+            assert_ne!(bound, 0, "iteration {i}: OS should assign a port");
+        }
+
+        assert_eq!(
+            count.load(Ordering::SeqCst),
+            3,
+            "expected exactly three spawns (one per bind_unicast call), got {}",
+            count.load(Ordering::SeqCst)
+        );
+    }
+
+    #[tokio::test]
+    async fn test_inner_build_and_shutdown() {
+        let (control_sender, mut update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
         // Drop control sender to trigger loop exit
         drop(control_sender);
         // The update receiver should eventually return None when the inner loop exits
-        let result =
-            tokio::time::timeout(std::time::Duration::from_secs(2), update_receiver.recv()).await;
+        let result = tokio::time::timeout(
+            std::time::Duration::from_secs(2),
+            UnboundedRecv::recv(&mut update_receiver),
+        )
+        .await;
         assert!(result.is_ok());
         assert!(result.unwrap().is_none());
     }
 
     /// Helper: verify inner loop is still alive by sending an `AddEndpoint` and
     /// checking that a response arrives within 2 seconds.
-    async fn assert_inner_alive(control_sender: &Sender<ControlMessage<TestPayload>>) {
+    async fn assert_inner_alive(
+        control_sender: &Sender<ControlMessage<TestPayload, TokioChannels>>,
+    ) {
         let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 9999);
         let (rx, msg) = TestControl::add_endpoint(0xFFFE, 0xFFFE, addr, 0);
         control_sender.send(msg).await.unwrap();
-        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx)
+        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx.recv())
             .await
             .expect("Timed out — inner loop appears dead")
             .expect("Oneshot closed — inner loop appears dead");
@@ -982,11 +1727,17 @@ mod tests {
 
     #[tokio::test]
     async fn test_dropped_receiver_bind_discovery_continues() {
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let (rx, msg) = TestControl::bind_discovery();
         drop(rx);
@@ -998,11 +1749,17 @@ mod tests {
 
     #[tokio::test]
     async fn test_dropped_receiver_unbind_discovery_continues() {
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let (rx, msg) = TestControl::unbind_discovery();
         drop(rx);
@@ -1014,11 +1771,17 @@ mod tests {
 
     #[tokio::test]
     async fn test_dropped_receiver_set_interface_continues() {
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         // SetInterface(LOCALHOST) on a fresh inner goes straight to
         // bind_discovery + send response (interface already matches).
@@ -1032,16 +1795,22 @@ mod tests {
 
     #[tokio::test]
     async fn test_dropped_receiver_send_sd_continues() {
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         // Bind discovery first so the SendSD path has a socket to use
         let (rx, msg) = TestControl::bind_discovery();
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         // Send SD with a dropped receiver
         let target = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 30490);
@@ -1061,18 +1830,24 @@ mod tests {
 
     #[tokio::test]
     async fn test_queued_messages_all_complete() {
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         // Bind discovery so SetInterface will take the multi-step path:
         // iteration 1: unbind discovery, re-queue SetInterface
         // iteration 2: interface matches, bind discovery, send response
         let (rx, msg) = TestControl::bind_discovery();
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         // Queue both messages into the channel buffer before the inner loop
         // processes either. mpsc sends on a non-full buffer complete without
@@ -1087,13 +1862,13 @@ mod tests {
         control_sender.send(msg_add).await.unwrap();
 
         // Both should complete successfully
-        let set_result = tokio::time::timeout(std::time::Duration::from_secs(3), rx_set)
+        let set_result = tokio::time::timeout(std::time::Duration::from_secs(3), rx_set.recv())
             .await
             .expect("Timed out waiting for SetInterface")
             .expect("SetInterface oneshot closed");
         assert!(set_result.is_ok());
 
-        let add_result = tokio::time::timeout(std::time::Duration::from_secs(3), rx_add)
+        let add_result = tokio::time::timeout(std::time::Duration::from_secs(3), rx_add.recv())
             .await
             .expect("Timed out waiting for AddEndpoint")
             .expect("AddEndpoint oneshot closed");
@@ -1103,27 +1878,27 @@ mod tests {
         assert_inner_alive(&control_sender).await;
     }
 
-    #[test]
-    fn test_send_to_service_constructor_returns_two_receivers() {
+    #[tokio::test]
+    async fn test_send_to_service_constructor_returns_two_receivers() {
         let message = Message::<TestPayload>::new_sd(1, &empty_sd_header());
-        let (send_rx, resp_rx, _msg) = TestControl::send_to_service(0x1234, 0x0001, message);
+        let (send_rx, resp_rx, msg) = TestControl::send_to_service(0x1234, 0x0001, message);
 
         // Extract the senders from the control message
         if let ControlMessage::SendToService {
             send_complete,
             response,
             ..
-        } = _msg
+        } = msg
         {
             // Both channels are independent — sending on one doesn't affect the other
             send_complete.send(Ok(())).unwrap();
-            assert!(send_rx.blocking_recv().unwrap().is_ok());
+            assert!(send_rx.recv().await.unwrap().is_ok());
 
             let payload = TestPayload {
                 header: empty_sd_header(),
             };
             response.send(Ok(payload.clone())).unwrap();
-            assert_eq!(resp_rx.blocking_recv().unwrap().unwrap(), payload);
+            assert_eq!(resp_rx.recv().await.unwrap().unwrap(), payload);
         } else {
             panic!("expected SendToService variant");
         }
@@ -1131,11 +1906,17 @@ mod tests {
 
     #[tokio::test]
     async fn test_dropped_receiver_add_endpoint_continues() {
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 5000);
         let (rx, msg) = TestControl::add_endpoint(0x1234, 0x0001, addr, 0);
@@ -1148,11 +1929,17 @@ mod tests {
 
     #[tokio::test]
     async fn test_dropped_receiver_remove_endpoint_continues() {
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let (rx, msg) = TestControl::remove_endpoint(0x1234, 0x0001);
         drop(rx);
@@ -1164,17 +1951,23 @@ mod tests {
 
     #[tokio::test]
     async fn test_dropped_receiver_send_to_service_send_complete_continues() {
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         // Add an endpoint first so SendToService doesn't fail with ServiceNotFound
         let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 5000);
         let (rx, msg) = TestControl::add_endpoint(0x1234, 0x0001, addr, 0);
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         // Send SendToService with the send_complete receiver dropped
         let message = Message::<TestPayload>::new_sd(1, &empty_sd_header());
@@ -1190,50 +1983,68 @@ mod tests {
     async fn test_bind_discovery_with_loopback() {
         // Spawn inner with multicast_loopback=true so bind_discovery exercises
         // the loopback-enabled branch of SocketManager::bind_discovery.
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             true,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let (rx, msg) = TestControl::bind_discovery();
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
     }
 
     #[tokio::test]
     async fn test_bind_discovery_idempotent() {
         // Binding discovery twice should succeed (early return on already-bound)
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let (rx, msg) = TestControl::bind_discovery();
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         // Second bind should also succeed (idempotent path)
         let (rx, msg) = TestControl::bind_discovery();
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
     }
 
     #[tokio::test]
     async fn test_send_sd_auto_binds_discovery() {
         // SendSD without a bound discovery socket should auto-bind and succeed
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let target = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 30490);
         let sd_header = empty_sd_header();
         let (rx, msg) = TestControl::send_sd(target, sd_header);
         control_sender.send(msg).await.unwrap();
-        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx)
+        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx.recv())
             .await
             .expect("Timed out waiting for SendSD")
             .expect("SendSD oneshot closed");
@@ -1243,21 +2054,27 @@ mod tests {
     #[tokio::test]
     async fn test_send_to_service_auto_binds_unicast() {
         // SendToService with no unicast sockets should auto-bind ephemeral
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 5000);
         let (rx, msg) = TestControl::add_endpoint(0x1234, 0x0001, addr, 0);
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         let message = Message::<TestPayload>::new_sd(1, &empty_sd_header());
         let (send_rx, _resp_rx, msg) = TestControl::send_to_service(0x1234, 0x0001, message);
         control_sender.send(msg).await.unwrap();
-        let result = tokio::time::timeout(std::time::Duration::from_secs(2), send_rx)
+        let result = tokio::time::timeout(std::time::Duration::from_secs(2), send_rx.recv())
             .await
             .expect("Timed out waiting for SendToService")
             .expect("SendToService oneshot closed");
@@ -1267,27 +2084,33 @@ mod tests {
     #[tokio::test]
     async fn test_subscribe_with_endpoint_sends_sd() {
         // Subscribe with a known endpoint and bound discovery should send the SD message
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         // Bind discovery first
         let (rx, msg) = TestControl::bind_discovery();
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         // Add endpoint
         let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 5000);
         let (rx, msg) = TestControl::add_endpoint(0x1234, 0x0001, addr, 0);
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         // Subscribe
         let (rx, msg) = TestControl::subscribe(0x1234, 0x0001, 1, 3, 0x01, 0);
         control_sender.send(msg).await.unwrap();
-        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx)
+        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx.recv())
             .await
             .expect("Timed out waiting for Subscribe")
             .expect("Subscribe oneshot closed");
@@ -1297,22 +2120,28 @@ mod tests {
     #[tokio::test]
     async fn test_subscribe_auto_binds_discovery() {
         // Subscribe without discovery bound should auto-bind and succeed
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         // Add endpoint but do NOT bind discovery
         let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 5000);
         let (rx, msg) = TestControl::add_endpoint(0x1234, 0x0001, addr, 0);
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         // Subscribe should auto-bind discovery
         let (rx, msg) = TestControl::subscribe(0x1234, 0x0001, 1, 3, 0x01, 0);
         control_sender.send(msg).await.unwrap();
-        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx)
+        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx.recv())
             .await
             .expect("Timed out waiting for Subscribe")
             .expect("Subscribe oneshot closed");
@@ -1321,15 +2150,21 @@ mod tests {
 
     #[tokio::test]
     async fn test_subscribe_unknown_service_returns_error() {
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let (rx, msg) = TestControl::subscribe(0xFFFF, 0xFFFF, 1, 3, 0x01, 0);
         control_sender.send(msg).await.unwrap();
-        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx)
+        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx.recv())
             .await
             .expect("Timed out")
             .expect("oneshot closed");
@@ -1339,28 +2174,34 @@ mod tests {
     #[tokio::test]
     async fn test_send_to_service_reuses_existing_unicast_socket() {
         // When a unicast socket already exists, SendToService should reuse it
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 5000);
         let (rx, msg) = TestControl::add_endpoint(0x1234, 0x0001, addr, 0);
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         // First send auto-binds unicast
         let message = Message::<TestPayload>::new_sd(1, &empty_sd_header());
         let (send_rx, _resp_rx, msg) = TestControl::send_to_service(0x1234, 0x0001, message);
         control_sender.send(msg).await.unwrap();
-        send_rx.await.unwrap().unwrap();
+        send_rx.recv().await.unwrap().unwrap();
 
         // Second send reuses the existing socket (no auto-bind needed)
         let message = Message::<TestPayload>::new_sd(1, &empty_sd_header());
         let (send_rx, _resp_rx, msg) = TestControl::send_to_service(0x1234, 0x0001, message);
         control_sender.send(msg).await.unwrap();
-        let result = tokio::time::timeout(std::time::Duration::from_secs(2), send_rx)
+        let result = tokio::time::timeout(std::time::Duration::from_secs(2), send_rx.recv())
             .await
             .expect("Timed out")
             .expect("oneshot closed");
@@ -1373,11 +2214,17 @@ mod tests {
     #[tokio::test]
     async fn test_dropped_receiver_subscribe_service_not_found_continues() {
         // Subscribe with no endpoint → ServiceNotFound response is dropped
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let (rx, msg) = TestControl::subscribe(0x1234, 0x0001, 1, 3, 0x01, 0);
         drop(rx);
@@ -1390,17 +2237,23 @@ mod tests {
     #[tokio::test]
     async fn test_set_interface_changes_interface() {
         // SetInterface to a different address exercises the interface!=current path
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         // Change to a different loopback-range address (127.0.0.2).
         // Binding discovery on 127.0.0.2 should succeed on most systems.
         let (rx, msg) = TestControl::set_interface(Ipv4Addr::new(127, 0, 0, 2));
         control_sender.send(msg).await.unwrap();
-        let result = tokio::time::timeout(std::time::Duration::from_secs(3), rx)
+        let result = tokio::time::timeout(std::time::Duration::from_secs(3), rx.recv())
             .await
             .expect("Timed out waiting for SetInterface")
             .expect("SetInterface oneshot closed");
@@ -1414,16 +2267,22 @@ mod tests {
     #[tokio::test]
     async fn test_set_interface_with_discovery_bound_changes_interface() {
         // SetInterface when discovery is already bound: unbind → change → rebind
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         // Bind discovery on LOCALHOST first
         let (rx, msg) = TestControl::bind_discovery();
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         // Change to 127.0.0.2 — this takes the multi-step path:
         // 1. unbind discovery, re-queue
@@ -1431,7 +2290,7 @@ mod tests {
         // 3. interface == 127.0.0.2, bind discovery
         let (rx, msg) = TestControl::set_interface(Ipv4Addr::new(127, 0, 0, 2));
         control_sender.send(msg).await.unwrap();
-        let result = tokio::time::timeout(std::time::Duration::from_secs(3), rx)
+        let result = tokio::time::timeout(std::time::Duration::from_secs(3), rx.recv())
             .await
             .expect("Timed out waiting for SetInterface")
             .expect("SetInterface oneshot closed");
@@ -1444,26 +2303,32 @@ mod tests {
     async fn test_subscribe_specific_port_reuse() {
         // Subscribe twice with the same specific client_port exercises the
         // bind_unicast port-reuse path (port != 0 && already bound).
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         // Add endpoint and bind discovery
         let (rx, msg) = TestControl::bind_discovery();
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 5000);
         let (rx, msg) = TestControl::add_endpoint(0x1234, 0x0001, addr, 0);
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         // First subscribe with specific port — binds the port
         let (rx, msg) = TestControl::subscribe(0x1234, 0x0001, 1, 3, 0x01, 44444);
         control_sender.send(msg).await.unwrap();
-        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx)
+        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx.recv())
             .await
             .expect("Timed out")
             .expect("oneshot closed");
@@ -1472,7 +2337,7 @@ mod tests {
         // Second subscribe with the same port — reuses the existing socket
         let (rx, msg) = TestControl::subscribe(0x1234, 0x0001, 1, 3, 0x02, 44444);
         control_sender.send(msg).await.unwrap();
-        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx)
+        let result = tokio::time::timeout(std::time::Duration::from_secs(2), rx.recv())
             .await
             .expect("Timed out")
             .expect("oneshot closed");
@@ -1490,11 +2355,17 @@ mod tests {
         use std::vec;
         use tokio::net::UdpSocket;
 
-        let (control_sender, _update_receiver) = Inner::<TestPayload>::spawn(
+        let (control_sender, _update_receiver, run_fut) = TestInner::build(
             Ipv4Addr::LOCALHOST,
             Arc::new(Mutex::new(E2ERegistry::new())),
             false,
+            crate::client::bind_dispatch::SpawnerDispatch {
+                factory: TokioTransport,
+                spawner: TokioSpawner,
+            },
+            TokioTimer,
         );
+        let _run_handle = tokio::spawn(run_fut);
 
         let raw = UdpSocket::bind("127.0.0.1:0").await.unwrap();
         let target = SocketAddrV4::new(Ipv4Addr::LOCALHOST, raw.local_addr().unwrap().port());
@@ -1502,11 +2373,11 @@ mod tests {
         // Bind and send one SD message to advance the session counter.
         let (rx, msg) = TestControl::bind_discovery();
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         let (rx, msg) = TestControl::send_sd(target, empty_sd_header());
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         let mut buf = vec![0u8; 1400];
         let (len, _) =
@@ -1522,16 +2393,16 @@ mod tests {
         // Unbind, then rebind.
         let (rx, msg) = TestControl::unbind_discovery();
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         let (rx, msg) = TestControl::bind_discovery();
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         // Send a second SD message and verify both session counter and reboot flag persisted.
         let (rx, msg) = TestControl::send_sd(target, empty_sd_header());
         control_sender.send(msg).await.unwrap();
-        rx.await.unwrap().unwrap();
+        rx.recv().await.unwrap().unwrap();
 
         let (len, _) =
             tokio::time::timeout(std::time::Duration::from_secs(2), raw.recv_from(&mut buf))
diff --git a/src/client/mod.rs b/src/client/mod.rs
index 026f2b7..a7881e8 100644
--- a/src/client/mod.rs
+++ b/src/client/mod.rs
@@ -1,3 +1,34 @@
+//! SOME/IP client.
+//!
+//! # Memory footprint
+//!
+//! The client's internal `Inner` state is allocated inline rather than on
+//! the heap. With the default capacity constants declared in `inner.rs` —
+//! `REQUEST_QUEUE_CAP=32`, `PENDING_RESPONSES_CAP=64`, `UNICAST_SOCKETS_CAP=8`,
+//! and `SESSION_CAP=64` — `Inner<P>` occupies on the order of **8–12 KiB**,
+//! depending on `sizeof::<P>()` and `sizeof::<SocketManager<P>>()`.
+//!
+//! In addition, each `SocketManager`'s spawn loop holds a persistent
+//! `[u8; UDP_BUFFER_SIZE]` receive/send buffer. When the send path needs
+//! E2E protection (i.e. the destination key is registered in the
+//! `E2ERegistry`), it transiently allocates a second
+//! `[u8; UDP_BUFFER_SIZE]` on the stack for the protected output; sends
+//! without E2E protection do not pay this cost. So an active
+//! socket-loop future carries one always-live `UDP_BUFFER_SIZE` buffer
+//! plus up to one additional `UDP_BUFFER_SIZE` buffer during E2E sends.
+//! With `UNICAST_SOCKETS_CAP=8` sockets bound, the total per-client
+//! buffer budget scales as `UNICAST_SOCKETS_CAP * UDP_BUFFER_SIZE`
+//! always-live, up to `2 * UNICAST_SOCKETS_CAP * UDP_BUFFER_SIZE` at
+//! peak during concurrent E2E-protected sends on every socket. At the
+//! current default of `UDP_BUFFER_SIZE = 1500`, that is ~12 KiB
+//! always-live / ~24 KiB peak per client.
+//!
+//! On `std + tokio`, all of this is allocated on the heap when each future
+//! is spawned, so the overhead is invisible to callers. On the bare-metal
+//! port (future), whoever drives the futures must arrange storage for them
+//! (either a `static` or a heap allocator); the capacity constants plus
+//! [`crate::UDP_BUFFER_SIZE`] are the knobs for trimming this footprint.
+mod bind_dispatch;
 mod error;
 mod inner;
 mod service_registry;
@@ -5,42 +36,85 @@ mod session;
 mod socket_manager;
 
 pub use error::Error;
-
-use crate::e2e::{E2ECheckStatus, E2EKey, E2EProfile, E2ERegistry};
+/// Internal control message exchanged between [`Client`] handles and
+/// the run-loop. Exposed (rather than `pub(super)`) so callers can
+/// declare static channel pools for it via
+/// `crate::transport::BoundedPooled<C, 4>`. End users typically do not
+/// reference this type directly — the `define_static_channels!` macro
+/// (under `feature = "bare_metal"`) names it for them.
+pub use inner::ControlMessage;
+/// Per-socket message types exposed for the same reason as
+/// [`ControlMessage`] — see its docstring.
+pub use socket_manager::{ReceivedMessage, SendMessage};
+
+use crate::Timer;
+#[cfg(feature = "client-tokio")]
+use crate::e2e::E2ERegistry;
+use crate::e2e::{E2ECheckStatus, E2EKey, E2EProfile};
+#[cfg(feature = "client-tokio")]
+use crate::tokio_transport::{TokioChannels, TokioSpawner, TokioTimer};
+use crate::transport::{
+    BoundedPooled, ChannelFactory, E2ERegistryHandle, InterfaceHandle, MpscSend, OneshotPooled,
+    OneshotRecv, Spawner, TransportFactory, TransportSocket, UnboundedPooled, UnboundedRecv,
+};
 use crate::{protocol, protocol::Message, traits::PayloadWireFormat};
-use inner::{ControlMessage, Inner};
-use std::net::{Ipv4Addr, SocketAddr, SocketAddrV4};
+use core::net::{Ipv4Addr, SocketAddr, SocketAddrV4};
+use inner::Inner;
+#[cfg(feature = "client-tokio")]
 use std::sync::{Arc, Mutex, RwLock};
-use tokio::sync::{mpsc, oneshot};
 use tracing::info;
 
+// Bound bundle the client's internals demand from any
+// `C: ChannelFactory` they channel through. Stable Rust does not
+// elaborate where-clause bounds on a trait alias, and macros do not
+// expand inside `where` clauses, so the bundle is repeated inline at
+// each impl block that constructs channels. The list is authored once
+// here as documentation and copy-pasted; mismatch surfaces as a
+// trait-bound compile error pointing at the missing `OneshotPooled` /
+// `BoundedPooled` / `UnboundedPooled` impl.
+//
+// ```ignore
+//     Result<(), Error>: OneshotPooled<C>,
+//     Result<P, Error>: OneshotPooled<C>,
+//     Result<protocol::sd::RebootFlag, Error>: OneshotPooled<C>,
+//     ControlMessage<P, C>: BoundedPooled<C, 4>,
+//     SendMessage<P, C>: BoundedPooled<C, 16>,
+//     Result<ReceivedMessage<P>, Error>: BoundedPooled<C, 16>,
+//     ClientUpdate<P>: UnboundedPooled<C>,
+// ```
+//
+// When stable Rust gains implied bounds for trait where-clauses, this
+// collapses back to a single `C: ClientChannels<P>` supertrait.
+
 /// Handle to a pending SOME/IP request-response transaction.
 /// Resolves when the inner loop receives a matching unicast reply.
 /// Does not borrow `Client`.
-pub struct PendingResponse<P> {
-    receiver: oneshot::Receiver<Result<P, Error>>,
+pub struct PendingResponse<P: Send + 'static, C: ChannelFactory> {
+    receiver: C::OneshotReceiver<Result<P, Error>>,
 }
 
-impl<P> std::fmt::Debug for PendingResponse<P> {
+impl<P: Send + 'static, C: ChannelFactory> std::fmt::Debug for PendingResponse<P, C> {
     fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
         f.debug_struct("PendingResponse").finish_non_exhaustive()
     }
 }
 
-impl<P> PendingResponse<P> {
+impl<P: Send + 'static, C: ChannelFactory> PendingResponse<P, C> {
     /// Await the response payload.
     ///
     /// # Errors
     ///
-    /// Returns the same errors as the request itself (e.g. deserialization failure).
-    ///
-    /// # Panics
-    ///
-    /// Panics if the inner loop dropped the response channel.
+    /// Returns the same errors as the request itself (e.g. deserialization
+    /// failure). Returns [`Error::Capacity`] with tag `"pending_responses"`
+    /// if the inner loop's response-tracking map was full when the request
+    /// was sent — the UDP send still went out, but the reply (if any)
+    /// arrives on [`ClientUpdates`] rather than this oneshot.
+    /// Returns [`Error::Shutdown`] only if the client's run-loop future
+    /// exits before the response is delivered — the caller's
+    /// `PendingResponse` handle outlived its driver. Reserving `Shutdown`
+    /// for actual lifecycle failure keeps `RecvError` unambiguous.
     pub async fn response(self) -> Result<P, Error> {
-        self.receiver
-            .await
-            .expect("inner loop dropped response channel")
+        self.receiver.recv().await.map_err(|_| Error::Shutdown)?
     }
 }
 
@@ -105,61 +179,145 @@ impl<P: PayloadWireFormat> std::fmt::Debug for ClientUpdate<P> {
 
 /// Stream of updates from the SOME/IP client event loop.
 ///
-/// Returned by [`Client::new`]. Call [`recv`](Self::recv) to receive
+/// Returned by `Client::new` (under `client-tokio`) or
+/// `Client::new_with_deps` / `Client::new_with_deps_local` (under
+/// `client`). Call [`recv`](Self::recv) to receive
 /// discovery, unicast, and error updates.
-pub struct ClientUpdates<MessageDefinitions: PayloadWireFormat> {
-    update_receiver: mpsc::UnboundedReceiver<ClientUpdate<MessageDefinitions>>,
+pub struct ClientUpdates<MessageDefinitions: PayloadWireFormat + 'static, C: ChannelFactory> {
+    update_receiver: C::UnboundedReceiver<ClientUpdate<MessageDefinitions>>,
 }
 
-impl<MessageDefinitions: PayloadWireFormat> std::fmt::Debug for ClientUpdates<MessageDefinitions> {
+impl<MessageDefinitions: PayloadWireFormat + 'static, C: ChannelFactory> std::fmt::Debug
+    for ClientUpdates<MessageDefinitions, C>
+{
     fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
         f.debug_struct("ClientUpdates").finish_non_exhaustive()
     }
 }
 
-impl<MessageDefinitions: PayloadWireFormat> ClientUpdates<MessageDefinitions> {
+impl<MessageDefinitions: PayloadWireFormat + 'static, C: ChannelFactory>
+    ClientUpdates<MessageDefinitions, C>
+{
     /// Waits for the next update from the client event loop.
     ///
     /// Returns `None` when the inner loop has exited (all `Client` handles
     /// dropped and the event loop finished draining).
     pub async fn recv(&mut self) -> Option<ClientUpdate<MessageDefinitions>> {
-        self.update_receiver.recv().await
+        UnboundedRecv::recv(&mut self.update_receiver).await
     }
 }
 
+/// Bundle of dependencies passed to [`Client::new_with_deps`]. Bundling
+/// the five pluggable infrastructure types (`TransportFactory`,
+/// `Spawner`, `Timer`, `E2ERegistryHandle`, `InterfaceHandle`) into a
+/// single struct keeps the constructor's argument list manageable
+/// (consumers see one named field per dependency rather than positional
+/// args six deep).
+///
+/// All five fields are public so callers can construct the struct
+/// inline; there's no builder ceremony beyond the field assignments.
+pub struct ClientDeps<F, S, Tm, R, I>
+where
+    F: TransportFactory,
+    Tm: Timer,
+    R: E2ERegistryHandle,
+    I: InterfaceHandle,
+{
+    /// Transport factory used by `bind_*` to construct sockets.
+    pub factory: F,
+    /// Task-spawner used by `bind_*` to drive per-socket I/O loops.
+    pub spawner: S,
+    /// Async sleep primitive used by the run-loop's idle tick.
+    pub timer: Tm,
+    /// Shared E2E registry handle for runtime E2E configuration.
+    pub e2e_registry: R,
+    /// Shared interface-address handle. The run-loop reads its current
+    /// value when `bind_*` is invoked.
+    pub interface: I,
+}
+
 /// A SOME/IP client that handles service discovery and message exchange.
 ///
 /// `Client` is cheaply [`Clone`]-able. All clones share the same underlying
 /// event loop and can be used concurrently from different tasks.
+///
+/// The optional type parameters `R` and `I` let callers substitute their own
+/// [`E2ERegistryHandle`] and [`InterfaceHandle`] implementations (for example,
+/// bare-metal handles backed by a critical-section mutex rather than
+/// `Arc<Mutex<_>>`). On `std + tokio`, the defaults
+/// (`Arc<Mutex<E2ERegistry>>` and `Arc<RwLock<Ipv4Addr>>`) are used by the
+/// standard constructors `Self::new` / `Self::new_with_loopback` /
+/// `Self::new_with_spawner_and_loopback` (all under `client-tokio`).
 #[derive(Clone)]
-pub struct Client<MessageDefinitions: PayloadWireFormat> {
-    interface: Arc<RwLock<Ipv4Addr>>,
-    control_sender: mpsc::Sender<inner::ControlMessage<MessageDefinitions>>,
-    e2e_registry: Arc<Mutex<E2ERegistry>>,
+pub struct Client<
+    MessageDefinitions: PayloadWireFormat + Send + 'static,
+    R: E2ERegistryHandle,
+    I: InterfaceHandle,
+    C: ChannelFactory,
+> {
+    interface: I,
+    control_sender: C::BoundedSender<inner::ControlMessage<MessageDefinitions, C>, 4>,
+    e2e_registry: R,
 }
 
-impl<MessageDefinitions: PayloadWireFormat> std::fmt::Debug for Client<MessageDefinitions> {
+impl<MessageDefinitions, R, I, C> std::fmt::Debug for Client<MessageDefinitions, R, I, C>
+where
+    MessageDefinitions: PayloadWireFormat + Send + 'static,
+    R: E2ERegistryHandle,
+    I: InterfaceHandle,
+    C: ChannelFactory,
+{
     fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
         f.debug_struct("Client")
-            .field(
-                "interface",
-                &*self.interface.read().expect("interface lock poisoned"),
-            )
+            .field("interface", &self.interface.get())
             .finish_non_exhaustive()
     }
 }
 
-impl<MessageDefinitions> Client<MessageDefinitions>
+/// Convenience constructors that default to `Arc<Mutex<_>>` / `Arc<RwLock<_>>`
+/// handles, the `TokioChannels` channel factory, and the `TokioSpawner` task
+/// submitter. Available under the `client-tokio` feature, which pulls in
+/// `tokio` + `socket2`. Bare-metal callers use
+/// [`Self::new_with_spawner_and_loopback`] (always available under `client`)
+/// and supply their own channel factory + spawner.
+#[cfg(feature = "client-tokio")]
+impl<MessageDefinitions>
+    Client<MessageDefinitions, Arc<Mutex<E2ERegistry>>, Arc<RwLock<Ipv4Addr>>, TokioChannels>
 where
     MessageDefinitions: PayloadWireFormat + Clone + std::fmt::Debug + 'static,
 {
-    /// Creates a new client bound to the given network interface and spawns its event loop.
-    ///
-    /// Returns a `(Client, ClientUpdates)` pair. The `Client` handle is
-    /// [`Clone`]-able and can be shared across tasks. `ClientUpdates` receives
-    /// discovery, unicast, and error updates from the event loop.
-    #[must_use]
-    pub fn new(interface: Ipv4Addr) -> (Self, ClientUpdates<MessageDefinitions>) {
+    /// Creates a new client bound to the given network interface and returns its run-loop future to be driven by the caller.
+    ///
+    /// Returns a `(Client, ClientUpdates, run_future)` triple. The `Client`
+    /// handle is [`Clone`]-able and can be shared across tasks.
+    /// `ClientUpdates` receives discovery, unicast, and error updates from
+    /// the event loop. `run_future` is the event loop itself — the caller
+    /// must drive it to completion (typically via `tokio::spawn`) for the
+    /// client to process any messages.
+    ///
+    /// The future is bounded `Send + 'static` because every in-repo
+    /// consumer spawns it on a multithreaded executor. Bare-metal
+    /// consumers whose transport produces `!Send` state will get a
+    /// cfg-gated alternative constructor alongside the bare-metal port.
+    ///
+    /// ```no_run
+    /// # use simple_someip::{Client, RawPayload};
+    /// # use std::net::Ipv4Addr;
+    /// # async fn demo() {
+    /// let (client, mut updates, run) = Client::<RawPayload, _, _, _>::new(Ipv4Addr::LOCALHOST);
+    /// let _run_task = tokio::spawn(run);
+    /// // ...interact with `client` and `updates`...
+    /// # let _ = (client, updates);
+    /// # }
+    /// ```
+    #[must_use = "the returned run-loop future must be spawned (e.g. tokio::spawn) for the client to make progress"]
+    pub fn new(
+        interface: Ipv4Addr,
+    ) -> (
+        Self,
+        ClientUpdates<MessageDefinitions, TokioChannels>,
+        impl core::future::Future<Output = ()> + Send + 'static,
+    ) {
         Self::new_with_loopback(interface, false)
     }
 
@@ -175,7 +333,7 @@ where
     /// With loopback enabled, the client's own discovery socket also receives
     /// the multicast SD traffic this client sends (e.g. `FindService` probes
     /// and periodic `OfferService` announcements driven by
-    /// [`Self::start_sd_announcements`]). Those self-sent messages are parsed
+    /// [`Self::sd_announcements_loop`]). Those self-sent messages are parsed
     /// the same as any other inbound SD traffic, so callers may observe:
     ///
     /// - [`ClientUpdate::DiscoveryUpdated`] events originating from this
@@ -186,32 +344,229 @@ where
     /// Consumers of [`ClientUpdates`] that need to ignore self-sent SD should
     /// filter on source address (the sender's IP/port is included on the
     /// update).
-    #[must_use]
+    #[must_use = "the returned run-loop future must be spawned (e.g. tokio::spawn) for the client to make progress"]
     pub fn new_with_loopback(
         interface: Ipv4Addr,
         multicast_loopback: bool,
-    ) -> (Self, ClientUpdates<MessageDefinitions>) {
-        let e2e_registry = Arc::new(Mutex::new(E2ERegistry::new()));
-        let (control_sender, update_receiver) =
-            Inner::spawn(interface, Arc::clone(&e2e_registry), multicast_loopback);
+    ) -> (
+        Self,
+        ClientUpdates<MessageDefinitions, TokioChannels>,
+        impl core::future::Future<Output = ()> + Send + 'static,
+    ) {
+        Self::new_with_spawner_and_loopback(interface, multicast_loopback, TokioSpawner)
+    }
+
+    /// Like [`Self::new_with_loopback`], but with a caller-provided
+    /// [`Spawner`]. Per-socket I/O loops are submitted through this
+    /// spawner instead of the default [`TokioSpawner`] / `tokio::spawn`.
+    ///
+    /// ```no_run
+    /// # use simple_someip::{Client, RawPayload, Spawner};
+    /// # use std::net::Ipv4Addr;
+    /// # async fn demo() {
+    /// struct MySpawner; // ...your executor's task-submission type.
+    /// # impl Spawner for MySpawner {
+    /// #   fn spawn(&self, _: impl core::future::Future<Output = ()> + Send + 'static) {}
+    /// # }
+    /// let (client, mut updates, run) =
+    ///     Client::<RawPayload, _, _, _>::new_with_spawner_and_loopback(
+    ///         Ipv4Addr::LOCALHOST,
+    ///         false,
+    ///         MySpawner,
+    ///     );
+    /// let _run_task = tokio::spawn(run);
+    /// # let _ = (client, updates);
+    /// # }
+    /// ```
+    ///
+    /// # Bounds
+    ///
+    /// `S: Spawner + Send + Sync + 'static` — the spawner is stored in
+    /// the run-loop future, which is `Send + 'static`, so the spawner
+    /// must match those bounds. `Sync` is required because `&self.spawner`
+    /// is held across `.await` points inside
+    /// `SocketManager::bind_with_transport` and
+    /// `bind_discovery_seeded_with_transport`, both of which execute on
+    /// the driven run-loop task (not on the user's call site).
+    #[must_use = "the returned run-loop future must be spawned (e.g. via the Spawner) for the client to make progress"]
+    pub fn new_with_spawner_and_loopback<S>(
+        interface: Ipv4Addr,
+        multicast_loopback: bool,
+        spawner: S,
+    ) -> (
+        Self,
+        ClientUpdates<MessageDefinitions, TokioChannels>,
+        impl core::future::Future<Output = ()> + Send + 'static,
+    )
+    where
+        S: Spawner + Send + Sync + 'static,
+    {
+        Self::new_with_deps(
+            ClientDeps {
+                factory: crate::tokio_transport::TokioTransport,
+                spawner,
+                timer: TokioTimer,
+                e2e_registry: Arc::new(Mutex::new(E2ERegistry::new())),
+                interface: Arc::new(RwLock::new(interface)),
+            },
+            multicast_loopback,
+        )
+    }
+}
+
+/// Methods available on all `Client<M, R, I, C>` regardless of handle types.
+impl<MessageDefinitions, R, I, C> Client<MessageDefinitions, R, I, C>
+where
+    MessageDefinitions: PayloadWireFormat + Clone + std::fmt::Debug + Send + 'static,
+    R: E2ERegistryHandle,
+    I: InterfaceHandle,
+    C: ChannelFactory,
+    Result<(), Error>: OneshotPooled<C>,
+    Result<MessageDefinitions, Error>: OneshotPooled<C>,
+    Result<protocol::sd::RebootFlag, Error>: OneshotPooled<C>,
+    ControlMessage<MessageDefinitions, C>: BoundedPooled<C, 4>,
+    SendMessage<MessageDefinitions, C>: BoundedPooled<C, 16>,
+    Result<ReceivedMessage<MessageDefinitions>, Error>: BoundedPooled<C, 16>,
+    ClientUpdate<MessageDefinitions>: UnboundedPooled<C>,
+{
+    /// Bare-metal-friendly constructor that takes every dependency
+    /// explicitly via a [`ClientDeps`] bundle: a [`TransportFactory`], a
+    /// [`Spawner`], a [`Timer`], an [`E2ERegistryHandle`], and an
+    /// [`InterfaceHandle`].
+    ///
+    /// This is the no-tokio entry point. The `client-tokio` convenience
+    /// constructors (`Self::new`, `Self::new_with_loopback`,
+    /// `Self::new_with_spawner_and_loopback`) ultimately delegate
+    /// here, supplying `TokioTransport` / `TokioTimer` / `TokioSpawner`
+    /// / `Arc<Mutex<E2ERegistry>>` / `Arc<RwLock<Ipv4Addr>>` for the
+    /// generic parameters. Bare-metal callers supply their own.
+    ///
+    /// `deps.interface` is consumed as an [`InterfaceHandle`]; the
+    /// run-loop reads its current value when `bind_*` is invoked, so
+    /// callers can share the handle with their own task and update it
+    /// through [`InterfaceHandle::set`] without going through the
+    /// control channel.
+    ///
+    /// # Bounds
+    ///
+    /// All five infrastructure parameters require `Send + Sync + 'static`
+    /// because the run-loop future is itself `Send + 'static` (so it can
+    /// be spawned on a multithreaded executor). Single-task / `LocalSet`
+    /// callers whose deps are `!Send` would need a `!Send` variant of
+    /// this constructor; that variant is planned alongside the
+    /// `LocalSet`-style spawner shim.
+    #[allow(clippy::type_complexity)]
+    #[must_use = "the returned run-loop future must be spawned (e.g. via the Spawner) for the client to make progress"]
+    pub fn new_with_deps<F, S, Tm>(
+        deps: ClientDeps<F, S, Tm, R, I>,
+        multicast_loopback: bool,
+    ) -> (
+        Self,
+        ClientUpdates<MessageDefinitions, C>,
+        impl core::future::Future<Output = ()> + Send + 'static,
+    )
+    where
+        F: TransportFactory + Send + Sync + 'static,
+        F::Socket: Send + Sync + 'static,
+        for<'a> F::BindFuture<'a>: Send,
+        for<'a> <F::Socket as TransportSocket>::SendFuture<'a>: Send,
+        for<'a> <F::Socket as TransportSocket>::RecvFuture<'a>: Send,
+        S: Spawner + Send + Sync + 'static,
+        Tm: Timer + Send + Sync + 'static,
+        for<'a> Tm::SleepFuture<'a>: Send,
+    {
+        let ClientDeps {
+            factory,
+            spawner,
+            timer,
+            e2e_registry,
+            interface,
+        } = deps;
+        let initial_addr = interface.get();
+        let dispatch = bind_dispatch::SpawnerDispatch { factory, spawner };
+        let (control_sender, update_receiver, run_future) =
+            Inner::<MessageDefinitions, Tm, R, C, bind_dispatch::SpawnerDispatch<F, S>>::build(
+                initial_addr,
+                e2e_registry.clone(),
+                multicast_loopback,
+                dispatch,
+                timer,
+            );
+        let client = Self {
+            interface,
+            control_sender,
+            e2e_registry,
+        };
+        let updates = ClientUpdates { update_receiver };
+        (client, updates, run_future)
+    }
 
+    /// `!Send` counterpart to [`Self::new_with_deps`].
+    ///
+    /// Constructs a `Client` whose run-loop and per-socket loops are
+    /// submitted through a [`LocalSpawner`]
+    /// (single-threaded executor) rather than a
+    /// [`Spawner`]. The factory's socket type
+    /// and its GAT futures are not required to be `Send`. The returned
+    /// run-loop future is `'static` but `!Send`.
+    ///
+    /// Use this constructor on embassy with `task-arena = 0`, on
+    /// tokio's `LocalSet`, on async-std's `LocalExecutor`, etc., where
+    /// the executor pins futures to a single thread.
+    ///
+    /// [`LocalSpawner`]: crate::transport::LocalSpawner
+    /// [`Spawner`]: crate::transport::Spawner
+    #[allow(clippy::type_complexity)]
+    #[must_use = "the returned run-loop future must be spawned (e.g. via the LocalSpawner) for the client to make progress"]
+    pub fn new_with_deps_local<F, S, Tm>(
+        deps: ClientDeps<F, S, Tm, R, I>,
+        multicast_loopback: bool,
+    ) -> (
+        Self,
+        ClientUpdates<MessageDefinitions, C>,
+        impl core::future::Future<Output = ()> + 'static,
+    )
+    where
+        F: TransportFactory + 'static,
+        F::Socket: 'static,
+        S: crate::transport::LocalSpawner + 'static,
+        Tm: Timer + 'static,
+    {
+        let ClientDeps {
+            factory,
+            spawner,
+            timer,
+            e2e_registry,
+            interface,
+        } = deps;
+        let initial_addr = interface.get();
+        let dispatch = bind_dispatch::LocalSpawnerDispatch { factory, spawner };
+        let (control_sender, update_receiver, run_future) = Inner::<
+            MessageDefinitions,
+            Tm,
+            R,
+            C,
+            bind_dispatch::LocalSpawnerDispatch<F, S>,
+        >::build(
+            initial_addr,
+            e2e_registry.clone(),
+            multicast_loopback,
+            dispatch,
+            timer,
+        );
         let client = Self {
-            interface: Arc::new(RwLock::new(interface)),
+            interface,
             control_sender,
             e2e_registry,
         };
         let updates = ClientUpdates { update_receiver };
-        (client, updates)
+        (client, updates, run_future)
     }
 
     /// Returns the current network interface address.
-    ///
-    /// # Panics
-    ///
-    /// Panics if the interface lock is poisoned.
     #[must_use]
     pub fn interface(&self) -> Ipv4Addr {
-        *self.interface.read().expect("interface lock poisoned")
+        self.interface.get()
     }
 
     /// Changes the network interface and rebinds sockets.
@@ -220,14 +575,17 @@ where
     ///
     /// Returns an error if rebinding sockets on the new interface fails.
     ///
-    /// # Panics
-    ///
-    /// Panics if the internal control channel or interface lock is poisoned/closed.
+    /// Returns [`Error::Shutdown`] if the client's run-loop future has
+    /// exited before this call — the control-channel send cannot
+    /// complete without its receiver.
     pub async fn set_interface(&self, interface: Ipv4Addr) -> Result<(), Error> {
         let (response, message) = ControlMessage::set_interface(interface);
-        self.control_sender.send(message).await.unwrap();
-        response.await.unwrap()?;
-        *self.interface.write().expect("interface lock poisoned") = interface;
+        self.control_sender
+            .send(message)
+            .await
+            .map_err(|()| Error::Shutdown)?;
+        response.recv().await.map_err(|_| Error::Shutdown)??;
+        self.interface.set(interface);
         Ok(())
     }
 
@@ -236,14 +594,17 @@ where
     /// # Errors
     ///
     /// Returns an error if binding the multicast socket fails.
-    ///
-    /// # Panics
-    ///
-    /// Panics if the internal control channel is closed.
+    /// Returns [`Error::Shutdown`] if the client's run-loop future has
+    /// exited before this call (dropped, cancelled, or otherwise gone)
+    /// — the `Client` handle has outlived its driver and further
+    /// control-channel sends cannot make progress.
     pub async fn bind_discovery(&self) -> Result<(), Error> {
         let (response, message) = ControlMessage::bind_discovery();
-        self.control_sender.send(message).await.unwrap();
-        response.await.unwrap()
+        self.control_sender
+            .send(message)
+            .await
+            .map_err(|()| Error::Shutdown)?;
+        response.recv().await.map_err(|_| Error::Shutdown)?
     }
 
     /// Unbinds the SD multicast discovery socket.
@@ -251,14 +612,17 @@ where
     /// # Errors
     ///
     /// Returns an error if unbinding the multicast socket fails.
-    ///
-    /// # Panics
-    ///
-    /// Panics if the internal control channel is closed.
+    /// Returns [`Error::Shutdown`] if the client's run-loop future has
+    /// exited before this call (dropped, cancelled, or otherwise gone)
+    /// — the `Client` handle has outlived its driver and further
+    /// control-channel sends cannot make progress.
     pub async fn unbind_discovery(&self) -> Result<(), Error> {
         let (response, message) = ControlMessage::unbind_discovery();
-        self.control_sender.send(message).await.unwrap();
-        response.await.unwrap()
+        self.control_sender
+            .send(message)
+            .await
+            .map_err(|()| Error::Shutdown)?;
+        response.recv().await.map_err(|_| Error::Shutdown)?
     }
 
     /// Subscribes to an event group on a known service.
@@ -266,10 +630,10 @@ where
     /// # Errors
     ///
     /// Returns an error if the service is not found or subscription fails.
-    ///
-    /// # Panics
-    ///
-    /// Panics if the internal control channel is closed.
+    /// Returns [`Error::Shutdown`] if the client's run-loop future has
+    /// exited before this call (dropped, cancelled, or otherwise gone)
+    /// — the `Client` handle has outlived its driver and further
+    /// control-channel sends cannot make progress.
     pub async fn subscribe(
         &self,
         service_id: u16,
@@ -287,17 +651,41 @@ where
             event_group_id,
             client_port,
         );
-        self.control_sender.send(message).await.unwrap();
-        response.await.unwrap()
+        self.control_sender
+            .send(message)
+            .await
+            .map_err(|()| Error::Shutdown)?;
+        response.recv().await.map_err(|_| Error::Shutdown)?
     }
 
     /// Like [`subscribe`](Self::subscribe) but does not wait for the
     /// subscription result.
     ///
+    /// Returns `()`: if the run-loop has exited the request is silently
+    /// lost — there is no error surface and no panic. Use
+    /// [`subscribe`](Self::subscribe) when you need to detect dispatch
+    /// failures.
+    ///
     /// This still awaits enqueueing the control message on the internal
-    /// channel, so it may block if that bounded channel is full. Useful for
-    /// periodic renewals where waiting for subscription processing is
+    /// channel, so it may block if that bounded channel is full. Useful
+    /// for periodic renewals where waiting for subscription processing is
     /// unnecessary.
+    ///
+    /// The response oneshot is simply dropped at the end of this call.
+    /// The inner loop's send-to-dropped-receiver path is not logged at
+    /// `warn!`; at most it is logged at `debug!`, so fire-and-forget
+    /// usage remains low-noise.
+    ///
+    /// # Silent drop on a closed channel
+    ///
+    /// Unlike the other `Client` methods (which return
+    /// `Err(Error::Shutdown)` if the run-loop has exited and closed the
+    /// receiver), `subscribe_no_wait` deliberately discards the `send`
+    /// result. If the run-loop has exited, the request is silently
+    /// dropped — no error surface, no panic. This matches the
+    /// fire-and-forget contract: callers that need to know whether the
+    /// subscription was actually dispatched should use
+    /// [`subscribe`](Self::subscribe) instead.
     pub async fn subscribe_no_wait(
         &self,
         service_id: u16,
@@ -307,7 +695,7 @@ where
         event_group_id: u16,
         client_port: u16,
     ) {
-        let (response, message) = ControlMessage::subscribe(
+        let (_response, message) = ControlMessage::subscribe(
             service_id,
             instance_id,
             major_version,
@@ -316,11 +704,6 @@ where
             client_port,
         );
         let _ = self.control_sender.send(message).await;
-        // Consume the response in the background so the inner loop doesn't
-        // warn about a dropped receiver.
-        tokio::spawn(async move {
-            let _ = response.await;
-        });
     }
 
     /// Returns the current SD reboot flag tracked by the client.
@@ -344,25 +727,42 @@ where
     /// Call this before manually building an SD header (e.g. one passed to
     /// [`send_sd_message`](Self::send_sd_message)) so the reboot flag reflects
     /// the current tracked state instead of a stale value baked at call time.
-    /// Headers passed to [`start_sd_announcements`](Self::start_sd_announcements)
+    /// Headers passed to `sd_announcements_loop` (under `client-tokio`)
     /// are refreshed automatically per-tick and do not need this call.
     ///
-    /// # Panics
+    /// # Errors
     ///
-    /// Panics if the internal control channel is closed.
-    pub async fn reboot_flag(&self) -> protocol::sd::RebootFlag {
+    /// Returns [`Error::Shutdown`] if the client's run-loop future has
+    /// exited before this call (dropped, cancelled, or otherwise gone)
+    /// — the `Client` handle has outlived its driver and further
+    /// control-channel sends cannot make progress.
+    ///
+    /// Returns [`Error::Capacity`] (with tag `"request_queue"`) if the
+    /// run loop's bounded control queue is saturated under load.
+    pub async fn reboot_flag(&self) -> Result<protocol::sd::RebootFlag, Error> {
         let (response, message) = ControlMessage::query_reboot_flag();
-        self.control_sender.send(message).await.unwrap();
-        response.await.unwrap()
+        self.control_sender
+            .send(message)
+            .await
+            .map_err(|()| Error::Shutdown)?;
+        response.recv().await.map_err(|_| Error::Shutdown)?
     }
 
     /// Test-only: force the inner loop's `sd_session_has_wrapped` so tests
     /// can observe post-wrap behavior without sending 65k SD messages.
-    #[cfg(test)]
-    pub(crate) async fn force_sd_session_wrapped_for_test(&self, wrapped: bool) {
+    /// Mirrors the public `Client` API: returns `Err(Error::Shutdown)` on
+    /// closed channels rather than panicking.
+    #[cfg(all(test, feature = "client-tokio"))]
+    pub(crate) async fn force_sd_session_wrapped_for_test(
+        &self,
+        wrapped: bool,
+    ) -> Result<(), Error> {
         let (response, message) = ControlMessage::force_sd_session_wrapped_for_test(wrapped);
-        self.control_sender.send(message).await.unwrap();
-        response.await.unwrap();
+        self.control_sender
+            .send(message)
+            .await
+            .map_err(|()| Error::Shutdown)?;
+        response.recv().await.map_err(|_| Error::Shutdown)?
     }
 
     /// Sends an SD message to a specific target address.
@@ -370,134 +770,21 @@ where
     /// # Errors
     ///
     /// Returns an error if sending the SD message fails.
-    ///
-    /// # Panics
-    ///
-    /// Panics if the internal control channel is closed.
+    /// Returns [`Error::Shutdown`] if the client's run-loop future has
+    /// exited before this call (dropped, cancelled, or otherwise gone)
+    /// — the `Client` handle has outlived its driver and further
+    /// control-channel sends cannot make progress.
     pub async fn send_sd_message(
         &self,
         target: SocketAddrV4,
         sd_header: <MessageDefinitions as PayloadWireFormat>::SdHeader,
     ) -> Result<(), Error> {
         let (response, message) = ControlMessage::send_sd(target, sd_header);
-        self.control_sender.send(message).await.unwrap();
-        response.await.unwrap()
-    }
-
-    /// Start periodic SD announcements on the client's discovery socket.
-    ///
-    /// Spawns a background task that sends the given SD header to the
-    /// multicast group at a regular interval. Use this to bundle
-    /// `FindService` + `OfferService` entries from a single SD identity
-    /// when the application acts as both client and server.
-    ///
-    /// The announcements are sent via the client's SD socket, ensuring
-    /// they share the same source address as the client's `Subscribe` and
-    /// `FindService` messages.
-    ///
-    /// **Reboot flag auto-refresh:** the SD header's reboot bit is overridden
-    /// at each tick with the client's currently tracked reboot flag (via
-    /// [`PayloadWireFormat::set_reboot_flag`]). The reboot bit the caller
-    /// supplies on `sd_header` is therefore ignored. This ensures the flag
-    /// transitions from `RecentlyRebooted` to `Continuous` once the session
-    /// counter wraps past `0xFFFF`, rather than staying stuck on whatever
-    /// value was baked at call time.
-    ///
-    /// Returns a [`tokio::task::JoinHandle`] that can be used to abort the
-    /// background task. The task uses a weak reference to the client's
-    /// control channel, so it exits automatically when all `Client` handles
-    /// are dropped (via `shut_down()` or going out of scope).
-    ///
-    /// # Arguments
-    ///
-    /// * `sd_header` — The SD header to send (entries + options).
-    /// * `interval` — How often to send (e.g. every 1 second). Values below
-    ///   100ms are clamped to 100ms to prevent tight loops.
-    pub fn start_sd_announcements(
-        &self,
-        sd_header: <MessageDefinitions as PayloadWireFormat>::SdHeader,
-        interval: std::time::Duration,
-    ) -> tokio::task::JoinHandle<()>
-    where
-        <MessageDefinitions as PayloadWireFormat>::SdHeader: Send + 'static,
-    {
-        use crate::protocol::sd;
-
-        // Use a WeakSender so this task does NOT keep the control channel
-        // alive. When all strong Client handles are dropped (shut_down),
-        // the weak sender will fail to upgrade and the task exits cleanly.
-        let weak_sender = self.control_sender.downgrade();
-        let target = SocketAddrV4::new(sd::MULTICAST_IP, sd::MULTICAST_PORT);
-        let interval = interval.max(std::time::Duration::from_millis(100));
-
-        tokio::spawn(async move {
-            let mut tick = tokio::time::interval(interval);
-            tick.set_missed_tick_behavior(tokio::time::MissedTickBehavior::Skip);
-            // Consume the immediate first tick so we don't send before
-            // the caller has finished setting up (e.g. subscribing).
-            tick.tick().await;
-            let mut count = 0u64;
-            loop {
-                tick.tick().await;
-
-                // Refresh the reboot flag from the client's tracked state
-                // so long-running announcers transition from RecentlyRebooted
-                // to Continuous once the session counter wraps. The weak
-                // sender is upgraded, used to enqueue a single control
-                // message, then dropped before we await — keeping the strong
-                // sender alive across awaits would defeat the weak-sender
-                // shutdown path.
-                let (flag_rx, flag_msg) = ControlMessage::query_reboot_flag();
-                let Some(sender) = weak_sender.upgrade() else {
-                    tracing::info!("Client shut down, stopping SD announcements");
-                    break;
-                };
-                let enqueue_ok = sender.send(flag_msg).await.is_ok();
-                drop(sender);
-                if !enqueue_ok {
-                    tracing::warn!("SD announcement channel closed, stopping");
-                    break;
-                }
-                let Ok(reboot) = flag_rx.await else {
-                    tracing::warn!("SD announcement reboot-flag query dropped, stopping");
-                    break;
-                };
-                let mut header = sd_header.clone();
-                MessageDefinitions::set_reboot_flag(&mut header, reboot);
-
-                let (response, message) = ControlMessage::send_sd(target, header);
-
-                let Some(sender) = weak_sender.upgrade() else {
-                    tracing::info!("Client shut down, stopping SD announcements");
-                    break;
-                };
-                let send_ok = sender.send(message).await.is_ok();
-                drop(sender);
-
-                if !send_ok {
-                    tracing::warn!("SD announcement channel closed, stopping");
-                    break;
-                }
-
-                match response.await {
-                    Ok(Ok(())) => {
-                        count += 1;
-                        if count == 1 {
-                            tracing::info!("Sent first client SD announcement");
-                        } else {
-                            tracing::trace!("Sent {count} client SD announcements");
-                        }
-                    }
-                    Ok(Err(e)) => {
-                        tracing::error!("Failed to send SD announcement: {e:?}");
-                    }
-                    Err(_) => {
-                        tracing::warn!("SD announcement response dropped, stopping");
-                        break;
-                    }
-                }
-            }
-        })
+        self.control_sender
+            .send(message)
+            .await
+            .map_err(|()| Error::Shutdown)?;
+        response.recv().await.map_err(|_| Error::Shutdown)?
     }
 
     /// Registers a service endpoint in the client's endpoint registry.
@@ -514,10 +801,10 @@ where
     /// # Errors
     ///
     /// Returns an error if registering the endpoint fails.
-    ///
-    /// # Panics
-    ///
-    /// Panics if the internal control channel is closed.
+    /// Returns [`Error::Shutdown`] if the client's run-loop future has
+    /// exited before this call (dropped, cancelled, or otherwise gone)
+    /// — the `Client` handle has outlived its driver and further
+    /// control-channel sends cannot make progress.
     pub async fn add_endpoint(
         &self,
         service_id: u16,
@@ -527,8 +814,11 @@ where
     ) -> Result<(), Error> {
         let (response, message) =
             ControlMessage::add_endpoint(service_id, instance_id, addr, local_port);
-        self.control_sender.send(message).await.unwrap();
-        response.await.unwrap()
+        self.control_sender
+            .send(message)
+            .await
+            .map_err(|()| Error::Shutdown)?;
+        response.recv().await.map_err(|_| Error::Shutdown)?
     }
 
     /// Removes a service endpoint from the client's endpoint registry.
@@ -536,38 +826,56 @@ where
     /// # Errors
     ///
     /// Returns an error if removing the endpoint fails.
-    ///
-    /// # Panics
-    ///
-    /// Panics if the internal control channel is closed.
+    /// Returns [`Error::Shutdown`] if the client's run-loop future has
+    /// exited before this call (dropped, cancelled, or otherwise gone)
+    /// — the `Client` handle has outlived its driver and further
+    /// control-channel sends cannot make progress.
     pub async fn remove_endpoint(&self, service_id: u16, instance_id: u16) -> Result<(), Error> {
         let (response, message) = ControlMessage::remove_endpoint(service_id, instance_id);
-        self.control_sender.send(message).await.unwrap();
-        response.await.unwrap()
+        self.control_sender
+            .send(message)
+            .await
+            .map_err(|()| Error::Shutdown)?;
+        response.recv().await.map_err(|_| Error::Shutdown)?
     }
 
     /// Sends a message to a service and returns a handle to await the response.
     ///
     /// Call `.response()` on the returned handle to await the reply payload.
     ///
+    /// # Saturation behavior
+    ///
+    /// Response tracking uses a fixed-capacity internal map. If it is
+    /// saturated at the moment the reply-tracking slot would be installed,
+    /// this method still returns `Ok(PendingResponse)` — the UDP send has
+    /// already happened — but the returned `PendingResponse` will resolve to
+    /// `Err(Error::Capacity("pending_responses"))`. Any reply that later
+    /// arrives for that `request_id` is delivered as
+    /// [`ClientUpdate::Unicast`] on the update stream instead of through the
+    /// `PendingResponse`. Treat this error as "reply lost to saturation",
+    /// not "send failed". A `warn!`-level log accompanies the drop.
+    ///
     /// # Errors
     ///
     /// Returns an error if the service is not found, unicast binding fails,
     /// or the UDP send fails.
-    ///
-    /// # Panics
-    ///
-    /// Panics if the internal control channel is closed.
+    /// Returns [`Error::Shutdown`] if the client's run-loop future has
+    /// exited before this call (dropped, cancelled, or otherwise gone)
+    /// — the `Client` handle has outlived its driver and further
+    /// control-channel sends cannot make progress.
     pub async fn send_to_service(
         &self,
         service_id: u16,
         instance_id: u16,
         message: crate::protocol::Message<MessageDefinitions>,
-    ) -> Result<PendingResponse<MessageDefinitions>, Error> {
+    ) -> Result<PendingResponse<MessageDefinitions, C>, Error> {
         let (send_rx, response_rx, ctrl_msg) =
             ControlMessage::send_to_service(service_id, instance_id, message);
-        self.control_sender.send(ctrl_msg).await.unwrap();
-        send_rx.await.unwrap()?;
+        self.control_sender
+            .send(ctrl_msg)
+            .await
+            .map_err(|()| Error::Shutdown)?;
+        send_rx.recv().await.map_err(|_| Error::Shutdown)??;
         Ok(PendingResponse {
             receiver: response_rx,
         })
@@ -583,10 +891,15 @@ where
     ///
     /// Returns an error if the service is not found, unicast binding fails,
     /// the UDP send fails, or the response payload fails to deserialize.
-    ///
-    /// # Panics
-    ///
-    /// Panics if the internal control channel is closed.
+    /// Returns [`Error::Capacity`] with tag `"pending_responses"` if the
+    /// inner loop's response-tracking map was full when this request was
+    /// sent — the UDP send still went out, but the reply cannot be
+    /// routed back to this caller's oneshot (it arrives on
+    /// [`ClientUpdates`] instead).
+    /// Returns [`Error::Shutdown`] only if the client's run-loop future
+    /// has exited before this call (dropped, cancelled, or otherwise
+    /// gone) — the `Client` handle has outlived its driver and further
+    /// control-channel sends cannot make progress.
     pub async fn request(
         &self,
         service_id: u16,
@@ -595,11 +908,12 @@ where
     ) -> Result<MessageDefinitions, Error> {
         let (send_rx, response_rx, ctrl_msg) =
             ControlMessage::send_to_service(service_id, instance_id, message);
-        self.control_sender.send(ctrl_msg).await.unwrap();
-        send_rx.await.unwrap()?;
-        response_rx
+        self.control_sender
+            .send(ctrl_msg)
             .await
-            .expect("inner loop dropped response channel")
+            .map_err(|()| Error::Shutdown)?;
+        send_rx.recv().await.map_err(|_| Error::Shutdown)??;
+        response_rx.recv().await.map_err(|_| Error::Shutdown)?
     }
 
     /// Register an E2E profile for the given key.
@@ -608,26 +922,31 @@ where
     /// header checked and stripped, and outgoing messages will have E2E
     /// protection applied automatically.
     ///
+    /// # Shutdown semantics
+    ///
+    /// Unlike most public `Client` methods, `register_e2e` does NOT go
+    /// through the run-loop control channel — it operates directly on
+    /// the shared [`E2ERegistryHandle`]. Consequently it does not return
+    /// `Err(Error::Shutdown)` after the run-loop has exited; the
+    /// registry is still accessible via any held `Client` clone.
+    ///
     /// # Panics
     ///
-    /// Panics if the E2E registry mutex is poisoned.
+    /// May panic if the underlying [`E2ERegistryHandle`]
+    /// implementation panics (e.g., `Arc<Mutex<E2ERegistry>>` on mutex poison).
+    ///
+    /// [`E2ERegistryHandle`]: crate::transport::E2ERegistryHandle
     pub fn register_e2e(&self, key: E2EKey, profile: E2EProfile) {
-        self.e2e_registry
-            .lock()
-            .expect("e2e registry lock poisoned")
-            .register(key, profile);
+        self.e2e_registry.register(key, profile);
     }
 
     /// Remove E2E configuration for the given key.
     ///
-    /// # Panics
-    ///
-    /// Panics if the E2E registry mutex is poisoned.
+    /// Like [`Self::register_e2e`], this method bypasses the run-loop
+    /// control channel and is therefore not subject to
+    /// `Error::Shutdown`.
     pub fn unregister_e2e(&self, key: &E2EKey) {
-        self.e2e_registry
-            .lock()
-            .expect("e2e registry lock poisoned")
-            .unregister(key);
+        self.e2e_registry.unregister(key);
     }
 
     /// Shuts down the client by dropping the control channel.
@@ -640,25 +959,184 @@ where
     }
 }
 
-#[cfg(test)]
+/// `sd_announcements_loop` is only available with the `TokioChannels` backend
+/// because it requires `tokio::sync::mpsc::Sender::downgrade()` for the
+/// weak-sender shutdown pattern. A bare-metal alternative would need a
+/// different lifecycle mechanism (phase-future).
+#[cfg(feature = "client-tokio")]
+impl<MessageDefinitions, R, I> Client<MessageDefinitions, R, I, TokioChannels>
+where
+    MessageDefinitions: PayloadWireFormat + Clone + std::fmt::Debug + 'static,
+    R: E2ERegistryHandle,
+    I: InterfaceHandle,
+{
+    /// Start periodic SD announcements on the client's discovery socket.
+    ///
+    /// Spawns a background task that sends the given SD header to the
+    /// multicast group at a regular interval. Use this to bundle
+    /// `FindService` + `OfferService` entries from a single SD identity
+    /// when the application acts as both client and server.
+    ///
+    /// The announcements are sent via the client's SD socket, ensuring
+    /// they share the same source address as the client's `Subscribe` and
+    /// `FindService` messages.
+    ///
+    /// **Reboot flag auto-refresh:** the SD header's reboot bit is overridden
+    /// at each tick with the client's currently tracked reboot flag (via
+    /// [`PayloadWireFormat::set_reboot_flag`]). The reboot bit the caller
+    /// supplies on `sd_header` is therefore ignored. This ensures the flag
+    /// transitions from `RecentlyRebooted` to `Continuous` once the session
+    /// counter wraps past `0xFFFF`, rather than staying stuck on whatever
+    /// value was baked at call time.
+    ///
+    /// Returns an `impl Future<Output = ()> + Send + 'static` that the
+    /// caller drives on their executor (typically via `tokio::spawn`).
+    /// The loop uses a weak reference to the client's control channel,
+    /// so it exits automatically when all `Client` handles are dropped
+    /// (via `shut_down()` or going out of scope).
+    ///
+    /// ```no_run
+    /// # use simple_someip::{Client, RawPayload, TokioChannels, VecSdHeader};
+    /// # use simple_someip::protocol::sd::{self, RebootFlag, Flags};
+    /// # use std::sync::{Arc, Mutex, RwLock};
+    /// # use std::net::Ipv4Addr;
+    /// # async fn demo(
+    /// #     client: Client<
+    /// #         RawPayload,
+    /// #         Arc<Mutex<simple_someip::e2e::E2ERegistry>>,
+    /// #         Arc<RwLock<Ipv4Addr>>,
+    /// #         TokioChannels,
+    /// #     >,
+    /// # ) {
+    /// let header = VecSdHeader {
+    ///     flags: Flags::new_sd(RebootFlag::RecentlyRebooted),
+    ///     entries: vec![],
+    ///     options: vec![],
+    /// };
+    /// let handle = tokio::spawn(
+    ///     client.sd_announcements_loop(header, std::time::Duration::from_secs(1))
+    /// );
+    /// // ...later: handle.abort() to stop, or let the Client drop naturally.
+    /// # }
+    /// ```
+    ///
+    /// # Arguments
+    ///
+    /// * `sd_header` — The SD header to send (entries + options).
+    /// * `interval` — How often to send (e.g. every 1 second). Values below
+    ///   100ms are clamped to 100ms to prevent tight loops.
+    pub fn sd_announcements_loop(
+        &self,
+        sd_header: <MessageDefinitions as PayloadWireFormat>::SdHeader,
+        interval: std::time::Duration,
+    ) -> impl core::future::Future<Output = ()> + Send + 'static
+    where
+        <MessageDefinitions as PayloadWireFormat>::SdHeader: Send + 'static,
+    {
+        use crate::protocol::sd;
+        use crate::transport::OneshotRecv;
+
+        // Use a WeakSender so this future does NOT keep the control channel
+        // alive. When all strong Client handles are dropped (shut_down),
+        // the weak sender will fail to upgrade and the loop exits cleanly.
+        let weak_sender = self.control_sender.downgrade();
+        let target = SocketAddrV4::new(sd::MULTICAST_IP, sd::MULTICAST_PORT);
+        let interval = interval.max(std::time::Duration::from_millis(100));
+
+        async move {
+            let timer = TokioTimer;
+            let mut count = 0u64;
+            loop {
+                timer.sleep(interval).await;
+
+                let (flag_rx, flag_msg) =
+                    ControlMessage::<MessageDefinitions, TokioChannels>::query_reboot_flag();
+                let Some(sender) = weak_sender.upgrade() else {
+                    tracing::info!("Client shut down, stopping SD announcements");
+                    break;
+                };
+                let enqueue_ok = sender.send(flag_msg).await.is_ok();
+                drop(sender);
+                if !enqueue_ok {
+                    tracing::warn!("SD announcement channel closed, stopping");
+                    break;
+                }
+                let reboot = match flag_rx.recv().await {
+                    Ok(Ok(flag)) => flag,
+                    Ok(Err(e)) => {
+                        tracing::warn!(
+                            "SD announcement reboot-flag query returned error ({:?}), skipping tick",
+                            e
+                        );
+                        continue;
+                    }
+                    Err(_) => {
+                        tracing::warn!("SD announcement reboot-flag query dropped, stopping");
+                        break;
+                    }
+                };
+                let mut header = sd_header.clone();
+                MessageDefinitions::set_reboot_flag(&mut header, reboot);
+
+                let (response, message) =
+                    ControlMessage::<MessageDefinitions, TokioChannels>::send_sd(target, header);
+
+                let Some(sender) = weak_sender.upgrade() else {
+                    tracing::info!("Client shut down, stopping SD announcements");
+                    break;
+                };
+                let send_ok = sender.send(message).await.is_ok();
+                drop(sender);
+
+                if !send_ok {
+                    tracing::warn!("SD announcement channel closed, stopping");
+                    break;
+                }
+
+                match response.recv().await {
+                    Ok(Ok(())) => {
+                        count += 1;
+                        if count == 1 {
+                            tracing::info!("Sent first client SD announcement");
+                        } else {
+                            tracing::trace!("Sent {count} client SD announcements");
+                        }
+                    }
+                    Ok(Err(e)) => {
+                        tracing::error!("Failed to send SD announcement: {e:?}");
+                    }
+                    Err(_) => {
+                        tracing::warn!("SD announcement response dropped, stopping");
+                        break;
+                    }
+                }
+            }
+        }
+    }
+}
+
+#[cfg(all(test, feature = "client-tokio"))]
 mod tests {
     use super::*;
     use crate::protocol::sd::test_support::{TestPayload, empty_sd_header};
     use crate::traits::WireFormat;
     use std::format;
 
-    type TestClient = Client<TestPayload>;
+    type TestClient =
+        Client<TestPayload, Arc<Mutex<E2ERegistry>>, Arc<RwLock<Ipv4Addr>>, TokioChannels>;
 
     #[tokio::test]
     async fn test_client_new_and_interface() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         assert_eq!(client.interface(), Ipv4Addr::LOCALHOST);
         client.shut_down();
     }
 
     #[tokio::test]
     async fn test_client_debug() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         let debug_str = format!("{client:?}");
         assert!(debug_str.contains("Client"));
         assert!(debug_str.contains("127.0.0.1"));
@@ -704,7 +1182,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_subscribe_unknown_service_returns_error() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         let result = client.subscribe(0xFFFF, 0xFFFF, 1, 3, 0x01, 0).await;
         assert!(
             matches!(result, Err(Error::ServiceNotFound)),
@@ -715,7 +1194,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_subscribe_no_wait_unknown_service_does_not_panic() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         // subscribe_no_wait is fire-and-forget — it should not panic even
         // when the service is unknown (the inner loop sends ServiceNotFound
         // on the dropped response channel, which is harmless).
@@ -725,9 +1205,50 @@ mod tests {
         client.shut_down();
     }
 
+    /// Stress test: 200 back-to-back `subscribe_no_wait` calls, each of
+    /// which drops its response oneshot. The code removed the
+    /// `tokio::spawn(drain-the-oneshot)` wrapper this function used to
+    /// have, and dropped the `warn!("...response receiver dropped")`
+    /// sites in the inner loop. Regressions that re-introduce either
+    /// would show up as either (a) hundreds of orphan spawned tasks
+    /// (not directly testable without instrumentation) or (b) log-noise
+    /// pollution / a hung inner loop (directly testable — asserted by
+    /// `assert_inner_alive` at the end).
+    #[tokio::test]
+    async fn test_subscribe_no_wait_fire_and_forget_stress() {
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
+
+        // Unknown service so the inner loop's ServiceNotFound branch
+        // fires on every iteration — that's the path where the
+        // response oneshot is dropped and the (removed) warn used to
+        // fire. 200 iterations is well above the control-channel
+        // buffer size (4) to also exercise backpressure.
+        for _ in 0..200 {
+            client
+                .subscribe_no_wait(0xFFFF, 0xFFFF, 1, 3, 0x01, 0)
+                .await;
+        }
+
+        // Inner loop must still be responsive after the stress.
+        let msg = crate::protocol::Message::new_sd(1, &empty_sd_header());
+        let result = tokio::time::timeout(
+            std::time::Duration::from_secs(2),
+            client.request(0xFFFF, 0xFFFF, msg),
+        )
+        .await
+        .expect("inner loop unresponsive after 200 subscribe_no_wait calls");
+        assert!(
+            matches!(result, Err(Error::ServiceNotFound)),
+            "expected ServiceNotFound, got {result:?}"
+        );
+        client.shut_down();
+    }
+
     #[tokio::test]
     async fn test_bind_discovery_and_unbind() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         client.bind_discovery().await.unwrap();
         client.unbind_discovery().await.unwrap();
         client.shut_down();
@@ -735,7 +1256,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_set_interface() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         let new_addr = Ipv4Addr::LOCALHOST;
         client.set_interface(new_addr).await.unwrap();
         assert_eq!(client.interface(), new_addr);
@@ -744,7 +1266,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_add_endpoint_succeeds() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         let addr = SocketAddrV4::new(Ipv4Addr::new(192, 168, 1, 1), 30000);
         client.add_endpoint(0x1234, 0x0001, addr, 0).await.unwrap();
         client.shut_down();
@@ -752,7 +1275,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_send_to_service_unknown_returns_error() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         let msg = crate::protocol::Message::new_sd(1, &empty_sd_header());
         let result = client.send_to_service(0xFFFF, 0xFFFF, msg).await;
         assert!(
@@ -764,7 +1288,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_remove_endpoint_succeeds() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         let addr = SocketAddrV4::new(Ipv4Addr::new(192, 168, 1, 1), 30000);
         client.add_endpoint(0x1234, 0x0001, addr, 0).await.unwrap();
         client.remove_endpoint(0x1234, 0x0001).await.unwrap();
@@ -773,16 +1298,16 @@ mod tests {
 
     #[test]
     fn test_pending_response_debug() {
-        let (_tx, rx) = oneshot::channel::<Result<TestPayload, Error>>();
-        let pending = PendingResponse { receiver: rx };
+        let (_tx, rx) = TokioChannels::oneshot::<Result<TestPayload, Error>>();
+        let pending: PendingResponse<TestPayload, TokioChannels> = PendingResponse { receiver: rx };
         let s = format!("{pending:?}");
         assert!(s.contains("PendingResponse"));
     }
 
     #[tokio::test]
     async fn test_pending_response_resolves_ok() {
-        let (tx, rx) = oneshot::channel::<Result<TestPayload, Error>>();
-        let pending = PendingResponse { receiver: rx };
+        let (tx, rx) = TokioChannels::oneshot::<Result<TestPayload, Error>>();
+        let pending: PendingResponse<TestPayload, TokioChannels> = PendingResponse { receiver: rx };
         let payload = TestPayload {
             header: empty_sd_header(),
         };
@@ -793,8 +1318,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_pending_response_resolves_err() {
-        let (tx, rx) = oneshot::channel::<Result<TestPayload, Error>>();
-        let pending = PendingResponse { receiver: rx };
+        let (tx, rx) = TokioChannels::oneshot::<Result<TestPayload, Error>>();
+        let pending: PendingResponse<TestPayload, TokioChannels> = PendingResponse { receiver: rx };
         tx.send(Err(Error::ServiceNotFound)).unwrap();
         let result = pending.response().await;
         assert!(
@@ -805,7 +1330,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_send_sd_message() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         // Bind discovery first so the send path uses the existing socket
         client.bind_discovery().await.unwrap();
         let target = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 30490);
@@ -816,7 +1342,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_send_to_service_success_returns_pending_response() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 30000);
         client.add_endpoint(0x1234, 0x0001, addr, 0).await.unwrap();
         let msg = crate::protocol::Message::new_sd(1, &empty_sd_header());
@@ -828,7 +1355,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_recv_returns_none_after_shutdown() {
-        let (client, mut updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, mut updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         client.shut_down();
         // Now the inner loop should exit; recv() should return None
         let result = tokio::time::timeout(std::time::Duration::from_secs(2), updates.recv()).await;
@@ -838,7 +1366,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_register_and_unregister_e2e() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         let key = E2EKey {
             service_id: 0x1234,
             method_or_event_id: 0x0001,
@@ -851,7 +1380,8 @@ mod tests {
 
     #[tokio::test]
     async fn test_client_is_clone() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         let client2 = client.clone();
         assert_eq!(client.interface(), client2.interface());
         client.shut_down();
@@ -859,14 +1389,16 @@ mod tests {
 
     #[tokio::test]
     async fn test_client_updates_debug() {
-        let (_client, updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (_client, updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         let debug_str = format!("{updates:?}");
         assert!(debug_str.contains("ClientUpdates"));
     }
 
     #[tokio::test]
     async fn test_request_unknown_service_returns_error() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         let msg = crate::protocol::Message::new_sd(1, &empty_sd_header());
         let result = client.request(0xFFFF, 0xFFFF, msg).await;
         assert!(
@@ -877,13 +1409,15 @@ mod tests {
     }
 
     #[tokio::test]
-    async fn test_start_sd_announcements_does_not_panic() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    async fn test_sd_announcements_loop_does_not_panic() {
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         client.bind_discovery().await.unwrap();
 
         let sd_header = empty_sd_header();
-        let handle =
-            client.start_sd_announcements(sd_header, std::time::Duration::from_millis(100));
+        let handle = tokio::spawn(
+            client.sd_announcements_loop(sd_header, std::time::Duration::from_millis(100)),
+        );
 
         // Let the task fire at least once (may fail to send on loopback, that's OK).
         tokio::time::sleep(std::time::Duration::from_millis(250)).await;
@@ -900,12 +1434,14 @@ mod tests {
     }
 
     #[tokio::test]
-    async fn test_start_sd_announcements_without_discovery_bound() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    async fn test_sd_announcements_loop_without_discovery_bound() {
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         // Don't bind discovery — the task should handle the error gracefully.
         let sd_header = empty_sd_header();
-        let handle =
-            client.start_sd_announcements(sd_header, std::time::Duration::from_millis(100));
+        let handle = tokio::spawn(
+            client.sd_announcements_loop(sd_header, std::time::Duration::from_millis(100)),
+        );
 
         tokio::time::sleep(std::time::Duration::from_millis(250)).await;
 
@@ -921,13 +1457,15 @@ mod tests {
     }
 
     #[tokio::test]
-    async fn test_start_sd_announcements_abort_stops_task() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    async fn test_sd_announcements_loop_abort_stops_task() {
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         client.bind_discovery().await.unwrap();
 
         let sd_header = empty_sd_header();
-        let handle =
-            client.start_sd_announcements(sd_header, std::time::Duration::from_millis(100));
+        let handle = tokio::spawn(
+            client.sd_announcements_loop(sd_header, std::time::Duration::from_millis(100)),
+        );
 
         handle.abort();
         let result = handle.await;
@@ -941,14 +1479,16 @@ mod tests {
     }
 
     #[tokio::test]
-    async fn test_start_sd_announcements_overrides_caller_reboot_flag() {
+    async fn test_sd_announcements_loop_overrides_caller_reboot_flag() {
         // Regression test for the auto-refresh behavior: a caller who bakes
         // `Continuous` into `sd_header.flags` must still observe the client's
         // tracked flag on the wire (here, `RecentlyRebooted`, because the
         // session counter has not wrapped on a freshly-bound socket). This
         // verifies the announcer calls `set_reboot_flag` on each tick rather
         // than using the stale caller-supplied value.
-        let (client, mut updates) = TestClient::new_with_loopback(Ipv4Addr::LOCALHOST, true);
+        let (client, mut updates, run_fut) =
+            TestClient::new_with_loopback(Ipv4Addr::LOCALHOST, true);
+        let _run_handle = tokio::spawn(run_fut);
         client.bind_discovery().await.unwrap();
 
         // Caller bakes in Continuous — the announcer must override this.
@@ -956,12 +1496,15 @@ mod tests {
         sd_header.flags =
             crate::protocol::sd::Flags::new_sd(crate::protocol::sd::RebootFlag::Continuous);
 
-        let handle =
-            client.start_sd_announcements(sd_header, std::time::Duration::from_millis(100));
+        let handle = tokio::spawn(
+            client.sd_announcements_loop(sd_header, std::time::Duration::from_millis(100)),
+        );
 
         // Loopback delivers our own SD announcements back as DiscoveryUpdated.
-        // Drain updates until we see one (tokio::time::interval skips the
-        // first immediate tick, so the first real send lands at ~100-200ms).
+        // Drain updates until we see one. `sd_announcements_loop` uses
+        // `Timer::sleep` repeatedly (not `tokio::time::interval`), so the
+        // first send lands ~one interval after the loop is polled, i.e.
+        // ~100ms here.
         let received = tokio::time::timeout(std::time::Duration::from_secs(2), async {
             loop {
                 match updates.recv().await {
@@ -997,20 +1540,24 @@ mod tests {
         // past 0xFFFF would regress to `RecentlyRebooted` on the next
         // `reboot_flag()` call after unbind — falsely advertising a reboot
         // to peers on the next manually-built SD header.
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
 
         // No discovery bound. Fallback should reflect persisted state.
         // Default (unwrapped) → RecentlyRebooted.
         assert_eq!(
-            client.reboot_flag().await,
+            client.reboot_flag().await.expect("reboot_flag"),
             crate::protocol::sd::RebootFlag::RecentlyRebooted
         );
 
         // Simulate post-wrap state (normally set by `unbind_discovery`
         // reading the departing socket's `reboot_flag`).
-        client.force_sd_session_wrapped_for_test(true).await;
+        client
+            .force_sd_session_wrapped_for_test(true)
+            .await
+            .expect("force_sd_session_wrapped_for_test");
         assert_eq!(
-            client.reboot_flag().await,
+            client.reboot_flag().await.expect("reboot_flag"),
             crate::protocol::sd::RebootFlag::Continuous,
             "reboot_flag must report Continuous from persisted state while \
              discovery is unbound"
@@ -1020,7 +1567,7 @@ mod tests {
         // `bind_discovery_seeded`, so the live flag agrees.
         client.bind_discovery().await.unwrap();
         assert_eq!(
-            client.reboot_flag().await,
+            client.reboot_flag().await.expect("reboot_flag"),
             crate::protocol::sd::RebootFlag::Continuous,
             "seeded socket must report Continuous after wrapped rebind"
         );
@@ -1030,29 +1577,51 @@ mod tests {
 
     #[tokio::test]
     async fn test_reboot_flag_defaults_to_recently_rebooted() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         // Discovery not bound — should fall back to RecentlyRebooted.
         assert_eq!(
-            client.reboot_flag().await,
+            client.reboot_flag().await.expect("reboot_flag"),
             crate::protocol::sd::RebootFlag::RecentlyRebooted
         );
         client.bind_discovery().await.unwrap();
         // Freshly bound socket also reports RecentlyRebooted (session has not wrapped).
         assert_eq!(
-            client.reboot_flag().await,
+            client.reboot_flag().await.expect("reboot_flag"),
             crate::protocol::sd::RebootFlag::RecentlyRebooted
         );
         client.shut_down();
     }
 
     #[tokio::test]
-    async fn test_start_sd_announcements_stops_on_shutdown() {
-        let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    async fn reboot_flag_returns_shutdown_error_when_run_loop_dropped() {
+        // Regression for the migration of `reboot_flag` from `.unwrap()`
+        // panics to `Result<RebootFlag, Error>` (matches every other
+        // public Client method's Shutdown semantics). Dropping the run
+        // future closes the control channel; calling `reboot_flag` must
+        // surface `Err(Error::Shutdown)` rather than panicking.
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        drop(run_fut);
+        let err = client
+            .reboot_flag()
+            .await
+            .expect_err("reboot_flag must return an error after run loop is dropped");
+        assert!(
+            matches!(err, Error::Shutdown),
+            "expected Shutdown, got {err:?}"
+        );
+    }
+
+    #[tokio::test]
+    async fn test_sd_announcements_loop_stops_on_shutdown() {
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let _run_handle = tokio::spawn(run_fut);
         client.bind_discovery().await.unwrap();
 
         let sd_header = empty_sd_header();
-        let handle =
-            client.start_sd_announcements(sd_header, std::time::Duration::from_millis(100));
+        let handle = tokio::spawn(
+            client.sd_announcements_loop(sd_header, std::time::Duration::from_millis(100)),
+        );
 
         // Shut down the client — the weak sender should fail to upgrade
         // and the task should exit cleanly without needing abort().
@@ -1067,4 +1636,273 @@ mod tests {
             "task should have exited cleanly, not panicked"
         );
     }
+
+    /// Documents the footgun: if the caller drops `run_fut` without ever
+    /// polling it, the control channel's receiver goes with it and
+    /// subsequent `Client` method calls return [`Error::Shutdown`]
+    /// rather than panicking.
+    ///
+    /// This is intrinsic to the caller-driven lifecycle — the run loop
+    /// is no longer owned by `Client::new`, so failing to spawn it is
+    /// the caller's responsibility. The test pins the behavior
+    /// deterministically so that any attempt to silently "fix" this
+    /// (e.g. internal spawn fallback) would break it and force a review.
+    ///
+    /// Prior to the API change these call sites panicked on `.unwrap()`
+    /// of the send `Result`; the typed error surfaced here lets library
+    /// consumers observe lifecycle mismatches cleanly instead of bringing
+    /// down the caller's task.
+    #[tokio::test]
+    async fn dropping_run_future_without_spawn_returns_shutdown_error() {
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        // Caller explicitly discards the run loop.
+        drop(run_fut);
+        let err = client
+            .bind_discovery()
+            .await
+            .expect_err("must surface a typed error, not Ok or panic");
+        assert!(
+            matches!(err, Error::Shutdown),
+            "expected Error::Shutdown after run-loop drop, got {err:?}",
+        );
+    }
+
+    /// If the run loop is cancelled mid-poll (caller-initiated timeout,
+    /// graceful shutdown), subsequent `Client` calls see the control
+    /// channel closed and surface [`Error::Shutdown`]. Same structural
+    /// contract as dropping the run future.
+    #[tokio::test]
+    async fn cancelling_run_future_closes_control_channel_returns_shutdown_error() {
+        let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let handle = tokio::spawn(run_fut);
+        // Let the loop start.
+        tokio::time::sleep(std::time::Duration::from_millis(50)).await;
+        handle.abort();
+        // Give the abort time to land.
+        tokio::time::sleep(std::time::Duration::from_millis(50)).await;
+
+        let err = client
+            .bind_discovery()
+            .await
+            .expect_err("must surface a typed error, not Ok or panic");
+        assert!(
+            matches!(err, Error::Shutdown),
+            "expected Error::Shutdown after run-loop cancel, got {err:?}",
+        );
+    }
+
+    /// Pins the cadence of `sd_announcements_loop` under a healthy
+    /// (non-backpressured) control channel by counting how many
+    /// announcements land on the `Inner` loop's discovery socket
+    /// within a bounded window.
+    ///
+    /// The implementation uses repeated `Timer::sleep` calls (interval +
+    /// body time, no catch-up) rather than wall-clock aligned intervals.
+    /// For a healthy event loop the body is microseconds, so the observed
+    /// cadence is very close to the requested interval. If a future
+    /// change regresses this to "2 * interval" or worse, this test fires.
+    ///
+    /// The test creates a multicast receiver on the SD port/address
+    /// with loopback enabled, then runs a client with
+    /// `new_with_loopback(true)` and counts received announcements
+    /// over a 550ms window with an interval of 100ms. Expected: the
+    /// first announcement lands at t≈100ms, then ~every 100ms after,
+    /// so we expect 4-5 announcements in the window. Asserting `>= 3`
+    /// gives tolerance for scheduler jitter but still catches a 2x+
+    /// cadence regression.
+    #[ignore = "requires MULTICAST on the loopback interface; dev \
+                machines where `lo` lacks the MULTICAST flag will not \
+                deliver loopback multicast and this test will fail. \
+                Runs in any environment where loopback multicast is \
+                available (e.g. CI)."]
+    #[tokio::test]
+    async fn sd_announcements_loop_cadence_stays_close_to_requested() {
+        use crate::protocol::sd;
+        use socket2::{Domain, Protocol, Socket, Type};
+
+        let iface = Ipv4Addr::LOCALHOST;
+
+        // Build a loopback multicast receiver on the SD port.
+        let recv = {
+            let s = Socket::new(Domain::IPV4, Type::DGRAM, Some(Protocol::UDP)).unwrap();
+            s.set_reuse_address(true).unwrap();
+            #[cfg(unix)]
+            s.set_reuse_port(true).unwrap();
+            s.bind(&std::net::SocketAddr::from((iface, sd::MULTICAST_PORT)).into())
+                .unwrap();
+            s.set_nonblocking(true).unwrap();
+            let std_s: std::net::UdpSocket = s.into();
+            let rs = tokio::net::UdpSocket::from_std(std_s).unwrap();
+            rs.join_multicast_v4(sd::MULTICAST_IP, iface).unwrap();
+            rs
+        };
+
+        let (client, _updates, run_fut) = TestClient::new_with_loopback(iface, true);
+        let _run_handle = tokio::spawn(run_fut);
+        client.bind_discovery().await.unwrap();
+
+        let interval = std::time::Duration::from_millis(100);
+        let loop_handle = tokio::spawn(client.sd_announcements_loop(empty_sd_header(), interval));
+
+        // Collect announcements over a 550ms window. First send fires
+        // at ~100ms, subsequent at ~100ms intervals; expect 4-5 packets.
+        let start = std::time::Instant::now();
+        let mut count = 0u32;
+        let mut buf = [0u8; 1500];
+        while start.elapsed() < std::time::Duration::from_millis(550) {
+            if tokio::time::timeout(
+                std::time::Duration::from_millis(200),
+                recv.recv_from(&mut buf),
+            )
+            .await
+            .map(|r| r.is_ok())
+            .unwrap_or(false)
+            {
+                count += 1;
+            }
+        }
+
+        loop_handle.abort();
+        client.shut_down();
+
+        assert!(
+            count >= 3,
+            "expected >= 3 announcements in 550ms at 100ms interval, got {count} — \
+             cadence may have regressed"
+        );
+    }
+
+    /// Pins the first-announcement latency of `sd_announcements_loop`
+    /// to a single interval. A prior revision slept once before the
+    /// loop AND at the top of each iteration, so the first packet
+    /// landed at ~2× interval. This test catches that regression by
+    /// measuring the time from loop start to the first received
+    /// announcement and requiring it to be well under 2× interval.
+    ///
+    /// Uses the same loopback-multicast catch pattern as
+    /// `sd_announcements_loop_cadence_stays_close_to_requested`.
+    #[ignore = "requires MULTICAST on the loopback interface; same \
+                constraint as `sd_announcements_loop_cadence_stays_close_to_requested`. \
+                Runs in any environment where loopback multicast is \
+                available (e.g. CI)."]
+    #[tokio::test]
+    async fn sd_announcements_loop_first_emit_within_one_interval() {
+        use crate::protocol::sd;
+        use socket2::{Domain, Protocol, Socket, Type};
+
+        let iface = Ipv4Addr::LOCALHOST;
+
+        let recv = {
+            let s = Socket::new(Domain::IPV4, Type::DGRAM, Some(Protocol::UDP)).unwrap();
+            s.set_reuse_address(true).unwrap();
+            #[cfg(unix)]
+            s.set_reuse_port(true).unwrap();
+            s.bind(&std::net::SocketAddr::from((iface, sd::MULTICAST_PORT)).into())
+                .unwrap();
+            s.set_nonblocking(true).unwrap();
+            let std_s: std::net::UdpSocket = s.into();
+            let rs = tokio::net::UdpSocket::from_std(std_s).unwrap();
+            rs.join_multicast_v4(sd::MULTICAST_IP, iface).unwrap();
+            rs
+        };
+
+        let (client, _updates, run_fut) = TestClient::new_with_loopback(iface, true);
+        let _run_handle = tokio::spawn(run_fut);
+        client.bind_discovery().await.unwrap();
+
+        let interval = std::time::Duration::from_millis(100);
+        let start = std::time::Instant::now();
+        let loop_handle = tokio::spawn(client.sd_announcements_loop(empty_sd_header(), interval));
+
+        let mut buf = [0u8; 1500];
+        let first = tokio::time::timeout(
+            std::time::Duration::from_millis(500),
+            recv.recv_from(&mut buf),
+        )
+        .await
+        .expect("first SD announcement did not arrive within 500ms")
+        .expect("recv_from errored");
+        let first_emit_elapsed = start.elapsed();
+        let _ = first;
+
+        loop_handle.abort();
+        client.shut_down();
+
+        assert!(
+            first_emit_elapsed < std::time::Duration::from_millis(250),
+            "first announcement took {first_emit_elapsed:?}, expected < 250ms at 100ms interval — \
+             likely double-sleep regression"
+        );
+    }
+
+    /// Compile-time-ish assertion that `Client::new`'s returned run
+    /// future is `Send + 'static`. If a future refactor captures a
+    /// `!Send` or borrowed type in `Inner::run_future`, `thread::spawn`
+    /// rejects the move and this test fails to compile — surfacing the
+    /// regression at the site that introduced it rather than at a
+    /// distant `tokio::spawn` call site.
+    ///
+    /// The test doesn't actually need to drive the future; it's a
+    /// type-level check that happens to execute a no-op thread.
+    #[test]
+    fn client_new_run_future_is_send_static() {
+        let (_client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+        let handle = std::thread::spawn(move || drop(run_fut));
+        handle.join().unwrap();
+    }
+
+    /// Proves `Client::new_with_spawner_and_loopback` actually routes
+    /// per-socket spawns through the user-provided `Spawner`. The
+    /// `CountingSpawner` below increments a shared counter on every
+    /// `spawn` call AND delegates to `tokio::spawn` so the spawned
+    /// futures still run. Calling `bind_discovery` should cause
+    /// exactly one spawn (the SD socket's I/O loop); calling
+    /// `bind_discovery` again is a no-op (socket already bound) so
+    /// the count stays at 1.
+    #[tokio::test]
+    async fn client_new_with_spawner_routes_socket_spawns_through_it() {
+        use core::sync::atomic::{AtomicUsize, Ordering};
+        use std::sync::Arc;
+
+        #[derive(Clone)]
+        struct CountingSpawner {
+            count: Arc<AtomicUsize>,
+        }
+
+        impl Spawner for CountingSpawner {
+            fn spawn(&self, future: impl core::future::Future<Output = ()> + Send + 'static) {
+                self.count.fetch_add(1, Ordering::SeqCst);
+                let _run_handle = tokio::spawn(future);
+            }
+        }
+
+        let count = Arc::new(AtomicUsize::new(0));
+        let spawner = CountingSpawner {
+            count: Arc::clone(&count),
+        };
+
+        let (client, _updates, run_fut) =
+            TestClient::new_with_spawner_and_loopback(Ipv4Addr::LOCALHOST, false, spawner);
+        let _run_handle = tokio::spawn(run_fut);
+
+        client
+            .bind_discovery()
+            .await
+            .expect("bind_discovery must succeed");
+        // Idempotent second call; must NOT spawn again.
+        client
+            .bind_discovery()
+            .await
+            .expect("second bind_discovery is idempotent");
+
+        assert_eq!(
+            count.load(Ordering::SeqCst),
+            1,
+            "expected exactly one spawn for the SD socket loop, \
+             got {}",
+            count.load(Ordering::SeqCst)
+        );
+
+        client.shut_down();
+    }
 }
diff --git a/src/client/service_registry.rs b/src/client/service_registry.rs
index bbb24bf..1184ee5 100644
--- a/src/client/service_registry.rs
+++ b/src/client/service_registry.rs
@@ -1,4 +1,13 @@
-use std::{collections::HashMap, net::SocketAddrV4};
+use core::net::SocketAddrV4;
+use heapless::index_map::FnvIndexMap;
+
+/// Maximum number of service-endpoint entries the registry can track.
+/// Must be a power of two ([`FnvIndexMap`] requirement). A real
+/// vehicle-side SOME/IP deployment typically tracks at most a few dozen
+/// services per ECU, so 32 is generous; bare-metal callers wanting a
+/// tighter cap can fork. The cap exists so the registry is heap-free
+/// (`heapless::FnvIndexMap` stores entries inline).
+pub const SERVICE_REGISTRY_CAP: usize = 32;
 
 #[derive(Clone, Copy, Debug, Eq, Hash, PartialEq)]
 pub struct ServiceInstanceId {
@@ -18,16 +27,31 @@ pub struct ServiceEndpointInfo {
 
 #[derive(Debug, Default)]
 pub struct ServiceRegistry {
-    endpoints: HashMap<ServiceInstanceId, ServiceEndpointInfo>,
+    endpoints: FnvIndexMap<ServiceInstanceId, ServiceEndpointInfo, SERVICE_REGISTRY_CAP>,
 }
 
+/// Returned by [`ServiceRegistry::insert`] when the registry is full.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub struct ServiceRegistryFull;
+
 impl ServiceRegistry {
-    pub fn insert(&mut self, id: ServiceInstanceId, info: ServiceEndpointInfo) {
-        self.endpoints.insert(id, info);
+    /// Insert or replace the endpoint for `id`. Returns `Ok(())` whether
+    /// a previous value was replaced or this is a fresh entry. Returns
+    /// `Err(ServiceRegistryFull)` if the registry is at
+    /// [`SERVICE_REGISTRY_CAP`] and `id` is not already present.
+    pub fn insert(
+        &mut self,
+        id: ServiceInstanceId,
+        info: ServiceEndpointInfo,
+    ) -> Result<(), ServiceRegistryFull> {
+        self.endpoints
+            .insert(id, info)
+            .map(|_| ())
+            .map_err(|_| ServiceRegistryFull)
     }
 
     pub fn remove(&mut self, id: ServiceInstanceId) -> Option<ServiceEndpointInfo> {
-        self.endpoints.remove(&id)
+        self.endpoints.swap_remove(&id)
     }
 
     pub fn get(&self, id: ServiceInstanceId) -> Option<&ServiceEndpointInfo> {
@@ -38,7 +62,7 @@ impl ServiceRegistry {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use std::net::Ipv4Addr;
+    use core::net::Ipv4Addr;
 
     fn test_id(service: u16, instance: u16) -> ServiceInstanceId {
         ServiceInstanceId {
@@ -60,7 +84,7 @@ mod tests {
     fn insert_and_get() {
         let mut reg = ServiceRegistry::default();
         let id = test_id(0x1234, 0x0001);
-        reg.insert(id, test_info(30000));
+        reg.insert(id, test_info(30000)).unwrap();
         let info = reg.get(id).unwrap();
         assert_eq!(info.addr.port(), 30000);
         assert_eq!(info.major_version, 1);
@@ -70,7 +94,7 @@ mod tests {
     fn remove_returns_info() {
         let mut reg = ServiceRegistry::default();
         let id = test_id(0x1234, 0x0001);
-        reg.insert(id, test_info(30000));
+        reg.insert(id, test_info(30000)).unwrap();
         let removed = reg.remove(id).unwrap();
         assert_eq!(removed.addr.port(), 30000);
         assert!(reg.get(id).is_none());
@@ -80,8 +104,8 @@ mod tests {
     fn overwrite_replaces_info() {
         let mut reg = ServiceRegistry::default();
         let id = test_id(0x1234, 0x0001);
-        reg.insert(id, test_info(30000));
-        reg.insert(id, test_info(40000));
+        reg.insert(id, test_info(30000)).unwrap();
+        reg.insert(id, test_info(40000)).unwrap();
         assert_eq!(reg.get(id).unwrap().addr.port(), 40000);
     }
 
@@ -96,4 +120,34 @@ mod tests {
         let mut reg = ServiceRegistry::default();
         assert!(reg.remove(test_id(0xFFFF, 0xFFFF)).is_none());
     }
+
+    #[test]
+    fn insert_returns_full_at_cap() {
+        let mut reg = ServiceRegistry::default();
+        for i in 0..SERVICE_REGISTRY_CAP {
+            #[allow(clippy::cast_possible_truncation)]
+            let id = test_id(i as u16, 0);
+            assert!(reg.insert(id, test_info(0)).is_ok());
+        }
+        let overflow_id = test_id(0xFFFF, 0xFFFF);
+        assert_eq!(
+            reg.insert(overflow_id, test_info(0)),
+            Err(ServiceRegistryFull),
+        );
+    }
+
+    #[test]
+    fn insert_at_cap_for_existing_key_succeeds() {
+        let mut reg = ServiceRegistry::default();
+        for i in 0..SERVICE_REGISTRY_CAP {
+            #[allow(clippy::cast_possible_truncation)]
+            let id = test_id(i as u16, 0);
+            assert!(reg.insert(id, test_info(0)).is_ok());
+        }
+        // Re-inserting an existing key replaces and does not require new
+        // capacity.
+        let existing = test_id(0, 0);
+        assert!(reg.insert(existing, test_info(9999)).is_ok());
+        assert_eq!(reg.get(existing).unwrap().addr.port(), 9999);
+    }
 }
diff --git a/src/client/session.rs b/src/client/session.rs
index 9aa6366..268b0b2 100644
--- a/src/client/session.rs
+++ b/src/client/session.rs
@@ -1,5 +1,12 @@
 use crate::protocol::sd::RebootFlag;
-use std::{collections::HashMap, net::SocketAddr};
+use heapless::index_map::FnvIndexMap;
+use std::net::SocketAddr;
+
+/// Max number of distinct `(sender, transport, service, instance)` tuples tracked
+/// for reboot detection. Must be a power of two (heapless `FnvIndexMap`
+/// requirement). Sized for a small fleet of peers each offering several
+/// services; bare-metal builds with more peers may need to edit this constant.
+const SESSION_CAP: usize = 64;
 
 /// Distinguishes multicast vs unicast transport for per-sender session tracking.
 /// The AUTOSAR spec requires separate session ID tracking per transport.
@@ -28,8 +35,9 @@ struct SessionState {
 pub enum SessionVerdict {
     /// Session is valid (normal increment or first message with matching state).
     Ok,
-    /// Sender has rebooted (reboot flag 0→1 transition, or session ID decreased
-    /// while reboot flag remains 1 within the same service instance stream).
+    /// Sender has rebooted (reboot flag transitioned `Continuous → RecentlyRebooted`,
+    /// or session ID decreased while the reboot flag remains `RecentlyRebooted`
+    /// within the same service instance stream).
     Reboot,
     /// First message ever seen from this service instance on this transport.
     Initial,
@@ -39,20 +47,63 @@ pub enum SessionVerdict {
 ///
 /// A reboot is detected when, for a given `(sender, transport, service_id,
 /// instance_id)` tuple:
-/// - The reboot flag transitions from 0 to 1, **or**
-/// - The session ID decreases while the reboot flag remains 1
+/// - The reboot flag transitions from `Continuous` to `RecentlyRebooted`, **or**
+/// - The session ID decreases while the reboot flag remains `RecentlyRebooted`
 ///
 /// Tracking per service instance (rather than per sender) avoids false
 /// positives when a sensor interleaves SD offers for multiple services
 /// with independent session counters on the same source address.
-#[derive(Debug, Default)]
+///
+/// Capacity is bounded at compile time by [`SESSION_CAP`].
+/// When the map is full, new sender entries are dropped with a `warn!` log
+/// and reboot detection for those senders is disabled.
+///
+/// # Security posture
+///
+/// The backing map uses FNV hashing rather than the DoS-resistant hasher used
+/// by `std::collections::HashMap`. For SOME/IP on isolated automotive or
+/// sensor networks this is not a concern. Deployments where `SessionKey`
+/// inputs (notably `SocketAddr`) are adversary-controlled should be aware
+/// that an attacker can craft keys to force collisions and degrade lookup
+/// cost; the blast radius is bounded by [`SESSION_CAP`].
+#[derive(Debug)]
 pub struct SessionTracker {
-    state: HashMap<SessionKey, SessionState>,
+    state: FnvIndexMap<SessionKey, SessionState, SESSION_CAP>,
+    /// Set after the first saturation warning. Prevents the saturated-map
+    /// log from firing on every `check()` for every new key once capacity
+    /// is reached — which would spam the log at the packet rate.
+    saturation_warned: bool,
+}
+
+impl Default for SessionTracker {
+    fn default() -> Self {
+        Self {
+            state: FnvIndexMap::new(),
+            saturation_warned: false,
+        }
+    }
 }
 
 impl SessionTracker {
     /// Check the session ID and reboot flag for a specific service instance
-    /// and return a verdict. Always updates the stored state after the check.
+    /// and return a verdict.
+    ///
+    /// On the normal (non-saturated) path, the stored state is updated
+    /// after the check so subsequent calls see the latest session id and
+    /// reboot flag for the key.
+    ///
+    /// # Capacity behavior
+    ///
+    /// The tracker is backed by a `heapless::FnvIndexMap` bounded by
+    /// [`SESSION_CAP`]. If the map is already full and the incoming key
+    /// is new, the insert fails and stored state is **not** updated for
+    /// that key — subsequent `check()` calls with the same new key will
+    /// continue to return [`SessionVerdict::Initial`] until an existing
+    /// key is evicted or capacity is raised. A single `warn!` fires the
+    /// first time saturation is hit (further saturation drops are
+    /// suppressed to avoid log spam at the packet rate). For existing
+    /// keys under saturation the update still succeeds, because
+    /// `FnvIndexMap::insert` replaces in place.
     ///
     /// Call this once per service entry in an SD message (not once per message),
     /// so each service instance gets its own session counter.
@@ -89,13 +140,31 @@ impl SessionTracker {
                 }
             }
         };
-        self.state.insert(
-            key,
-            SessionState {
-                last_session_id: session_id,
-                last_reboot_flag: reboot_flag,
-            },
-        );
+        let new_state = SessionState {
+            last_session_id: session_id,
+            last_reboot_flag: reboot_flag,
+        };
+        if self.state.insert(key, new_state).is_err() {
+            // Map at capacity and key is new — silently dropping the update
+            // would lose reboot-detection state. Log the first time we hit
+            // the wall so bare-metal users can size `SESSION_CAP` up, then
+            // suppress further warnings so a saturated tracker does not
+            // spam the log at the incoming-packet rate.
+            if !self.saturation_warned {
+                tracing::warn!(
+                    "SessionTracker at capacity ({}); dropping new sender state for \
+                     sender={} transport={:?} svc=0x{:04X} inst=0x{:04X}. Reboot \
+                     detection disabled for this entry and any further new entries \
+                     (subsequent drops not logged).",
+                    SESSION_CAP,
+                    sender,
+                    transport,
+                    service_id,
+                    instance_id
+                );
+                self.saturation_warned = true;
+            }
+        }
         verdict
     }
 }
@@ -310,4 +379,57 @@ mod tests {
         let verdict = tracker.check(addr(1000), TransportKind::Multicast, SVC, INST, 2, CONT);
         assert_eq!(verdict, SessionVerdict::Ok);
     }
+
+    #[test]
+    fn capacity_overflow_drops_new_entries_but_keeps_existing_tracking() {
+        // Fill the tracker to capacity with unique (sender, service) tuples.
+        let mut tracker = SessionTracker::default();
+        for i in 0..super::SESSION_CAP {
+            let port = 1000 + u16::try_from(i).unwrap();
+            let v = tracker.check(addr(port), TransportKind::Multicast, SVC, INST, 1, RB);
+            assert_eq!(v, SessionVerdict::Initial);
+        }
+
+        // One more insert — map is full, new entry dropped. The verdict is
+        // still Initial (no prior state for this key), but the state is
+        // never stored so a follow-up is also Initial.
+        let overflow_addr = addr(9999);
+        let v = tracker.check(overflow_addr, TransportKind::Multicast, SVC, INST, 1, RB);
+        assert_eq!(v, SessionVerdict::Initial);
+        // Because the insert failed, a second call with the same key still
+        // sees no stored state.
+        let v = tracker.check(overflow_addr, TransportKind::Multicast, SVC, INST, 2, RB);
+        assert_eq!(v, SessionVerdict::Initial);
+
+        // Previously-tracked senders continue to work normally.
+        let v = tracker.check(addr(1000), TransportKind::Multicast, SVC, INST, 2, RB);
+        assert_eq!(v, SessionVerdict::Ok);
+    }
+
+    #[test]
+    fn capacity_overflow_warns_only_on_first_hit() {
+        // `saturation_warned` is the latch that guards the tracing::warn!
+        // call in `check()`. It must flip false → true on the first
+        // rejected insert and stay true for subsequent hits — otherwise
+        // a saturated tracker spams the log at the packet rate.
+        let mut tracker = SessionTracker::default();
+        for i in 0..super::SESSION_CAP {
+            let port = 1000 + u16::try_from(i).unwrap();
+            tracker.check(addr(port), TransportKind::Multicast, SVC, INST, 1, RB);
+        }
+        assert!(
+            !tracker.saturation_warned,
+            "filling to exactly capacity must not trip the warn flag",
+        );
+
+        // First overflowing key: flag flips to true.
+        tracker.check(addr(9001), TransportKind::Multicast, SVC, INST, 1, RB);
+        assert!(tracker.saturation_warned);
+
+        // Subsequent overflows leave the flag true; the flag is what the
+        // implementation checks before emitting a fresh warn!.
+        tracker.check(addr(9002), TransportKind::Multicast, SVC, INST, 1, RB);
+        tracker.check(addr(9003), TransportKind::Multicast, SVC, INST, 1, RB);
+        assert!(tracker.saturation_warned);
+    }
 }
diff --git a/src/client/socket_manager.rs b/src/client/socket_manager.rs
index 13a8f6c..6fdad5d 100644
--- a/src/client/socket_manager.rs
+++ b/src/client/socket_manager.rs
@@ -1,20 +1,71 @@
+//! Client-side UDP socket management.
+//!
+//! Each bound socket is backed by a transport socket (concrete
+//! `TokioSocket` on `std + tokio`, pluggable via [`TransportFactory`] on
+//! bare-metal — see the `bind_discovery_seeded_with_transport` docstring
+//! for the RTN-gap analysis) with its I/O loop running on a
+//! caller-supplied [`crate::transport::Spawner`]. The `Spawner` trait
+//! makes the task-submission point pluggable; on `std + tokio` consumers
+//! pass [`crate::tokio_transport::TokioSpawner`] and the behavior matches
+//! a direct `tokio::spawn` call.
+//!
+//! # Why `Inner` can't drive per-socket futures itself
+//!
+//! Briefly experimented with having `Inner` drive per-socket futures
+//! via `FuturesUnordered`. That deadlocks: `Inner::handle_control_message`
+//! awaits `SocketManager::send`, which internally awaits an mpsc→oneshot
+//! round-trip that requires the socket loop to make progress. But
+//! `Inner::run_future` is parked inside the handler, so nothing polls
+//! the socket loop. Concurrency between the two is mandatory and cannot
+//! come from the same task — hence the `Spawner` hook.
+//!
+//! # Bare-metal readiness
+//!
+//! The `client` feature exposes the full trait-surface client without
+//! pulling tokio or socket2. The tokio convenience constructors
+//! (`Client::new`, `Client::new_with_loopback`, etc.) that default to
+//! `TokioTransport` + `TokioSpawner` are gated behind `client-tokio`.
+//!
+//! **Completed abstractions:**
+//! - `Spawner` / `LocalSpawner` traits: task submission is pluggable.
+//! - `E2ERegistryHandle` / `InterfaceHandle`: lock handles abstracted
+//!   away from `Arc<Mutex<_>>` / `Arc<RwLock<_>>`.
+//! - `ChannelFactory`: channel primitives abstracted via `TokioChannels`
+//!   (std) and `EmbassySyncChannels` / `define_static_channels!` (`bare_metal`).
+//! - `TransportSocket` GATs: `Socket = TokioSocket` pin removed;
+//!   `SendFuture` / `RecvFuture` associated types express `Send` bounds
+//!   for spawnable socket loops.
+//!
+//! For `no_alloc` SOME/IP usage, consume `protocol`, `e2e`, and the
+//! `transport` trait layer directly — the `bare_metal_client` /
+//! `bare_metal_server` example workspace members demonstrate that surface.
+
 use crate::{
-    e2e::{E2ECheckStatus, E2EKey, E2ERegistry, PROFILE4_HEADER_SIZE},
+    UDP_BUFFER_SIZE,
+    e2e::{E2ECheckStatus, E2EKey},
     protocol::{Message, MessageView, sd},
     traits::{PayloadWireFormat, WireFormat},
+    transport::{
+        ChannelFactory, E2ERegistryHandle, LocalSpawner, MpscRecv, MpscSend, OneshotRecv,
+        OneshotSend, ReceivedDatagram, SocketOptions, Spawner, TransportFactory, TransportSocket,
+    },
 };
 
 use super::error::Error;
+use futures::{FutureExt, pin_mut, select};
 use std::{
-    net::{IpAddr, Ipv4Addr, SocketAddr, SocketAddrV4},
-    sync::{Arc, Mutex},
+    net::{Ipv4Addr, SocketAddr, SocketAddrV4},
     task::{Context, Poll},
-    vec,
 };
-use tokio::{net::UdpSocket, select, sync::mpsc};
-use tracing::{error, info, trace};
+use tracing::{debug, error, info, trace, warn};
 
 /// A received message together with the source address it came from.
+///
+/// TODO: narrow `source` to `SocketAddrV4` to match the `TransportSocket`
+/// trait's IPv4-only contract — today the field is always a
+/// `SocketAddr::V4(_)` wrapping, and the V6 variant is unreachable.
+/// Deferred because the rename ripples through `DiscoveryMessage` and
+/// `ClientUpdate::Unicast`.
 #[derive(Clone, Debug)]
 pub struct ReceivedMessage<P> {
     pub message: Message<P>,
@@ -23,19 +74,43 @@ pub struct ReceivedMessage<P> {
 }
 
 /// Structure representing a request to send a message
-#[derive(Debug)]
-pub struct SendMessage<PayloadDefinitions> {
+pub struct SendMessage<PayloadDefinitions: Send + 'static, C: ChannelFactory> {
     pub target_addr: SocketAddrV4,
     pub message: Message<PayloadDefinitions>,
-    response: tokio::sync::oneshot::Sender<Result<(), Error>>,
+    response: C::OneshotSender<Result<(), Error>>,
+}
+
+impl<P: PayloadWireFormat + Send + 'static, C: ChannelFactory> std::fmt::Debug
+    for SendMessage<P, C>
+{
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.debug_struct("SendMessage")
+            .field("target_addr", &self.target_addr)
+            .field("message", &self.message)
+            .finish_non_exhaustive()
+    }
+}
+
+/// One iteration's select-outcome in `socket_loop_future`. The inner
+/// block returns this scalar so the pinned per-iteration `send_fut` /
+/// `recv_fut` futures drop before the processing body — releasing their
+/// `&mut buf` / `&mut socket` borrows.
+enum Outcome<P: PayloadWireFormat + Send + 'static, C: ChannelFactory> {
+    Send(Option<SendMessage<P, C>>),
+    Recv(Result<ReceivedDatagram, crate::transport::TransportError>),
 }
 
-impl<PayloadDefinitions: PayloadWireFormat + 'static> SendMessage<PayloadDefinitions> {
+impl<PayloadDefinitions, C> SendMessage<PayloadDefinitions, C>
+where
+    PayloadDefinitions: PayloadWireFormat + Send + 'static,
+    C: ChannelFactory,
+    Result<(), Error>: crate::transport::OneshotPooled<C>,
+{
     pub fn new(
         target_addr: SocketAddrV4,
         message: Message<PayloadDefinitions>,
-    ) -> (tokio::sync::oneshot::Receiver<Result<(), Error>>, Self) {
-        let (response_tx, response_rx) = tokio::sync::oneshot::channel();
+    ) -> (C::OneshotReceiver<Result<(), Error>>, Self) {
+        let (response_tx, response_rx) = C::oneshot();
         (
             response_rx,
             Self {
@@ -47,10 +122,9 @@ impl<PayloadDefinitions: PayloadWireFormat + 'static> SendMessage<PayloadDefinit
     }
 }
 
-#[derive(Debug)]
-pub struct SocketManager<PayloadDefinitions> {
-    receiver: mpsc::Receiver<Result<ReceivedMessage<PayloadDefinitions>, Error>>,
-    sender: mpsc::Sender<SendMessage<PayloadDefinitions>>,
+pub struct SocketManager<PayloadDefinitions: Send + 'static, C: ChannelFactory> {
+    receiver: C::BoundedReceiver<Result<ReceivedMessage<PayloadDefinitions>, Error>, 16>,
+    sender: C::BoundedSender<SendMessage<PayloadDefinitions, C>, 16>,
     local_port: u16,
     session_id: u16,
     /// Set to true once `session_id` has wrapped from 0xFFFF → 1.
@@ -59,36 +133,121 @@ pub struct SocketManager<PayloadDefinitions> {
     session_has_wrapped: bool,
 }
 
-impl<MessageDefinitions> SocketManager<MessageDefinitions>
+impl<P: PayloadWireFormat + Send + 'static, C: ChannelFactory> std::fmt::Debug
+    for SocketManager<P, C>
+{
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.debug_struct("SocketManager")
+            .field("local_port", &self.local_port)
+            .field("session_id", &self.session_id)
+            .finish_non_exhaustive()
+    }
+}
+
+impl<MessageDefinitions, C> SocketManager<MessageDefinitions, C>
 where
-    MessageDefinitions: PayloadWireFormat + 'static,
+    MessageDefinitions: PayloadWireFormat + Send + 'static,
+    C: ChannelFactory,
+    Result<(), Error>: crate::transport::OneshotPooled<C>,
+    SendMessage<MessageDefinitions, C>: crate::transport::BoundedPooled<C, 16>,
+    Result<ReceivedMessage<MessageDefinitions>, Error>: crate::transport::BoundedPooled<C, 16>,
 {
-    /// Bind the SD multicast socket, seeding the session counter and wrap state from
-    /// a previous socket when rebinding. Pass `(1, false)` for a fresh bind.
-    /// Preserving state across rebinds avoids emitting a false reboot signal
-    /// (`reboot_flag=1`) to peers after `unbind_discovery` + `bind_discovery`.
-    pub fn bind_discovery_seeded(
+    /// Bind the SD multicast socket, seeding the session counter and wrap
+    /// state from a previous socket when rebinding. Pass `(1, false)` for a
+    /// fresh bind. Preserving state across rebinds avoids emitting a false
+    /// reboot signal (`reboot_flag=1`) to peers after
+    /// `unbind_discovery` + `bind_discovery`.
+    ///
+    /// Uses the default `crate::tokio_transport::TokioTransport` and
+    /// `crate::tokio_transport::TokioSpawner` backends (rendered as
+    /// code literals because `tokio_transport` is only compiled with
+    /// the `client`/`server` features and an intra-doc link would
+    /// break default-feature rustdoc builds).
+    /// For tests or alternate bind logic (e.g. an interceptor factory
+    /// around `TokioTransport`), use
+    /// [`Self::bind_discovery_seeded_with_transport`].
+    ///
+    /// Currently `#[cfg(test)]`-gated: production callers reach the
+    /// socket through the `_with_transport` variant so the `Spawner`
+    /// trait can be exercised end-to-end. Additionally requires the
+    /// `client-tokio` feature because the convenience defaults
+    /// (`TokioTransport`, `TokioSpawner`) live behind it; under
+    /// `--features client` the `socket_manager` module is compiled
+    /// but this convenience method is not.
+    #[cfg(all(test, feature = "client-tokio"))]
+    pub async fn bind_discovery_seeded<R: E2ERegistryHandle>(
         interface: Ipv4Addr,
-        e2e_registry: Arc<Mutex<E2ERegistry>>,
+        e2e_registry: R,
         session_id: u16,
         session_has_wrapped: bool,
         multicast_loopback: bool,
     ) -> Result<Self, Error> {
-        let (rx_tx, rx_rx) = mpsc::channel(16);
-        let (tx_tx, tx_rx) = mpsc::channel(16);
-        let bind_addr =
-            std::net::SocketAddr::new(IpAddr::V4(Ipv4Addr::UNSPECIFIED), sd::MULTICAST_PORT);
-
-        // Create socket with SO_REUSEADDR to allow quick restart
-        let socket = socket2::Socket::new(
-            socket2::Domain::IPV4,
-            socket2::Type::DGRAM,
-            Some(socket2::Protocol::UDP),
-        )?;
-        socket.set_reuse_address(true)?;
-        #[cfg(unix)]
-        socket.set_reuse_port(true)?;
-        socket.set_multicast_if_v4(&interface)?;
+        use crate::tokio_transport::{TokioSpawner, TokioTransport};
+        Self::bind_discovery_seeded_with_transport(
+            &TokioTransport,
+            &TokioSpawner,
+            interface,
+            e2e_registry,
+            session_id,
+            session_has_wrapped,
+            multicast_loopback,
+        )
+        .await
+    }
+
+    /// Variant of [`Self::bind_discovery_seeded`] that constructs the
+    /// underlying socket through a caller-supplied [`TransportFactory`]
+    /// and submits the socket's I/O loop through a caller-supplied
+    /// [`Spawner`].
+    ///
+    /// # Socket bounds
+    ///
+    /// [`TransportSocket`] uses GATs so the factory's socket type must
+    /// satisfy:
+    ///
+    /// - `Send + Sync + 'static` — so the socket loop future can be
+    ///   spawned on a multithreaded executor and outlive its owner.
+    /// - `for<'a> SendFuture<'a>: Send` and `for<'a> RecvFuture<'a>: Send`
+    ///   — the named GAT futures must themselves be `Send` so the
+    ///   spawned loop crosses thread boundaries cleanly. The `for<'a>`
+    ///   higher-ranked bound expresses "for any borrow lifetime" without
+    ///   needing nightly-only Return-Type Notation (RFC 3654).
+    ///
+    /// Stable Rust cannot express `Send` bounds on the anonymous future
+    /// types of `async fn` trait methods at use sites, which is why
+    /// the trait uses named associated types over RPITIT. See
+    /// [`TransportSocket::SendFuture`](crate::transport::TransportSocket::SendFuture).
+    ///
+    /// # Bare-metal path
+    ///
+    /// The channel primitives are abstracted behind
+    /// [`ChannelFactory`](crate::transport::ChannelFactory). The
+    /// `bare_metal` feature activates `EmbassySyncChannels` and
+    /// `define_static_channels!` as alternatives to `TokioChannels`.
+    /// Bare-metal consumers can supply their own `TransportSocket` impl
+    /// (e.g. wrapping `embassy_net::udp::UdpSocket`) as long as it is
+    /// `Send + Sync + 'static` and its `SendFuture` / `RecvFuture` GAT
+    /// projections are `Send` for every borrow lifetime.
+    pub async fn bind_discovery_seeded_with_transport<F, S, R>(
+        factory: &F,
+        spawner: &S,
+        interface: Ipv4Addr,
+        e2e_registry: R,
+        session_id: u16,
+        session_has_wrapped: bool,
+        multicast_loopback: bool,
+    ) -> Result<Self, Error>
+    where
+        F: TransportFactory,
+        F::Socket: Send + Sync + 'static,
+        for<'a> <F::Socket as TransportSocket>::SendFuture<'a>: Send,
+        for<'a> <F::Socket as TransportSocket>::RecvFuture<'a>: Send,
+        S: Spawner,
+        R: E2ERegistryHandle,
+    {
+        let (rx_tx, rx_rx) = C::bounded::<Result<ReceivedMessage<MessageDefinitions>, Error>, 16>();
+        let (tx_tx, tx_rx) = C::bounded::<SendMessage<MessageDefinitions, C>, 16>();
+
         // Control whether multicast packets sent by this socket are looped
         // back to sockets on the same host — INCLUDING this socket itself.
         // Disabled by default to avoid parsing self-sent OfferService /
@@ -97,15 +256,64 @@ where
         // deliver this socket's own SD multicasts back to it, so higher-level
         // consumers must be prepared to see their own announcements surface
         // as inbound discovery traffic.
-        socket.set_multicast_loop_v4(multicast_loopback)?;
-        socket.bind(&bind_addr.into())?;
-        socket.set_nonblocking(true)?;
-        let socket: std::net::UdpSocket = socket.into();
-        let socket = UdpSocket::from_std(socket)?;
+        let options = {
+            let mut o = SocketOptions::new();
+            o.reuse_address = true;
+            o.reuse_port = true;
+            o.multicast_if_v4 = Some(interface);
+            o.multicast_loop_v4 = Some(multicast_loopback);
+            o
+        };
+        let bind_addr = SocketAddrV4::new(Ipv4Addr::UNSPECIFIED, sd::MULTICAST_PORT);
 
+        let socket = factory.bind(bind_addr, &options).await?;
         socket.join_multicast_v4(sd::MULTICAST_IP, interface)?;
 
-        Self::spawn_socket_loop(socket, rx_tx, tx_rx, e2e_registry);
+        let fut = Self::socket_loop_future(socket, rx_tx, tx_rx, e2e_registry);
+        spawner.spawn(fut);
+        Ok(Self {
+            receiver: rx_rx,
+            sender: tx_tx,
+            local_port: sd::MULTICAST_PORT,
+            session_id: session_id.max(1),
+            session_has_wrapped,
+        })
+    }
+
+    /// `!Send` counterpart to [`Self::bind_discovery_seeded_with_transport`].
+    ///
+    /// Called by [`super::bind_dispatch::LocalSpawnerDispatch`] which is
+    /// wired through [`super::Client::new_with_deps_local`].
+    pub async fn bind_discovery_seeded_with_transport_local<F, S, R>(
+        factory: &F,
+        spawner: &S,
+        interface: Ipv4Addr,
+        e2e_registry: R,
+        session_id: u16,
+        session_has_wrapped: bool,
+        multicast_loopback: bool,
+    ) -> Result<Self, Error>
+    where
+        F: TransportFactory,
+        F::Socket: 'static,
+        S: LocalSpawner,
+        R: E2ERegistryHandle,
+    {
+        let (rx_tx, rx_rx) = C::bounded::<Result<ReceivedMessage<MessageDefinitions>, Error>, 16>();
+        let (tx_tx, tx_rx) = C::bounded::<SendMessage<MessageDefinitions, C>, 16>();
+        let options = {
+            let mut o = SocketOptions::new();
+            o.reuse_address = true;
+            o.reuse_port = true;
+            o.multicast_if_v4 = Some(interface);
+            o.multicast_loop_v4 = Some(multicast_loopback);
+            o
+        };
+        let bind_addr = SocketAddrV4::new(Ipv4Addr::UNSPECIFIED, sd::MULTICAST_PORT);
+        let socket = factory.bind(bind_addr, &options).await?;
+        socket.join_multicast_v4(sd::MULTICAST_IP, interface)?;
+        let fut = Self::socket_loop_future(socket, rx_tx, tx_rx, e2e_registry);
+        spawner.spawn_local(fut);
         Ok(Self {
             receiver: rx_rx,
             sender: tx_tx,
@@ -115,24 +323,112 @@ where
         })
     }
 
-    pub fn bind(port: u16, e2e_registry: Arc<Mutex<E2ERegistry>>) -> Result<Self, Error> {
-        let (rx_tx, rx_rx) = mpsc::channel(4);
-        let (tx_tx, tx_rx) = mpsc::channel(4);
-        let bind_addr = std::net::SocketAddr::new(IpAddr::V4(Ipv4Addr::UNSPECIFIED), port);
-
-        // Create socket with SO_REUSEADDR and SO_REUSEPORT to allow quick restart
-        let socket = socket2::Socket::new(
-            socket2::Domain::IPV4,
-            socket2::Type::DGRAM,
-            Some(socket2::Protocol::UDP),
-        )?;
-        socket.set_reuse_address(true)?;
-        socket.bind(&bind_addr.into())?;
-        socket.set_nonblocking(true)?;
-        let socket: std::net::UdpSocket = socket.into();
-        let socket = UdpSocket::from_std(socket)?;
+    /// Bind a unicast SOME/IP socket on `port` using the default
+    /// `crate::tokio_transport::TokioTransport` and
+    /// `crate::tokio_transport::TokioSpawner` backends (rendered as
+    /// code literals for the same rustdoc-feature-gating reason
+    /// described on [`Self::bind_discovery_seeded`]). See
+    /// [`Self::bind_with_transport`] for the generic variant.
+    ///
+    /// Currently `#[cfg(test)]`-gated: production callers reach the
+    /// socket through the `_with_transport` variant so the `Spawner`
+    /// trait can be exercised end-to-end. Additionally requires the
+    /// `client-tokio` feature because the convenience defaults live
+    /// behind it.
+    #[cfg(all(test, feature = "client-tokio"))]
+    pub async fn bind<R: E2ERegistryHandle>(port: u16, e2e_registry: R) -> Result<Self, Error> {
+        use crate::tokio_transport::{TokioSpawner, TokioTransport};
+        Self::bind_with_transport(&TokioTransport, &TokioSpawner, port, e2e_registry).await
+    }
+
+    /// Variant of [`Self::bind`] that constructs the underlying socket
+    /// through a caller-supplied [`TransportFactory`] and submits the
+    /// socket's I/O loop through a caller-supplied [`Spawner`].
+    ///
+    /// # Generic bounds
+    ///
+    /// The factory's socket must be `Send + Sync + 'static` and its async
+    /// methods must return `Send` futures so the socket loop can be
+    /// spawned onto a multithreaded executor. See
+    /// [`TransportSocket::SendFuture`](crate::transport::TransportSocket::SendFuture)
+    /// for background on the GAT approach.
+    pub async fn bind_with_transport<F, S, R>(
+        factory: &F,
+        spawner: &S,
+        port: u16,
+        e2e_registry: R,
+    ) -> Result<Self, Error>
+    where
+        F: TransportFactory,
+        F::Socket: Send + Sync + 'static,
+        for<'a> <F::Socket as TransportSocket>::SendFuture<'a>: Send,
+        for<'a> <F::Socket as TransportSocket>::RecvFuture<'a>: Send,
+        S: Spawner,
+        R: E2ERegistryHandle,
+    {
+        // Standardized to N=16 across both discovery and unicast bind
+        // paths (was N=4 here historically — a tokio-conservative
+        // choice). The trait's const-N now propagates to the GAT, so
+        // the stored receiver/sender types must commit to a single N;
+        // 16 matches what embassy-sync hardcodes and what discovery
+        // already used. Bumping the unicast capacity from 4 to 16 has
+        // no semantic effect — it just lets the channels absorb a
+        // brief burst before backpressure kicks in.
+        let (rx_tx, rx_rx) = C::bounded::<Result<ReceivedMessage<MessageDefinitions>, Error>, 16>();
+        let (tx_tx, tx_rx) = C::bounded::<SendMessage<MessageDefinitions, C>, 16>();
+
+        let options = {
+            let mut o = SocketOptions::new();
+            o.reuse_address = true;
+            o
+        };
+        let bind_addr = SocketAddrV4::new(Ipv4Addr::UNSPECIFIED, port);
+
+        let socket = factory.bind(bind_addr, &options).await?;
+        let port = socket.local_addr()?.port();
+        let fut = Self::socket_loop_future(socket, rx_tx, tx_rx, e2e_registry);
+        spawner.spawn(fut);
+        Ok(Self {
+            receiver: rx_rx,
+            sender: tx_tx,
+            local_port: port,
+            session_id: 1,
+            session_has_wrapped: false,
+        })
+    }
+
+    /// `!Send` counterpart to [`Self::bind_with_transport`].
+    ///
+    /// Identical to the Send variant except: the factory's socket and
+    /// its GAT futures are not required to be `Send`, and the per-socket
+    /// I/O loop is submitted through a [`LocalSpawner`] (single-threaded
+    /// executor) rather than a [`Spawner`] (multi-threaded). Use this
+    /// path when the underlying transport (e.g. embassy-net) produces
+    /// non-`Send` socket state.
+    pub async fn bind_with_transport_local<F, S, R>(
+        factory: &F,
+        spawner: &S,
+        port: u16,
+        e2e_registry: R,
+    ) -> Result<Self, Error>
+    where
+        F: TransportFactory,
+        F::Socket: 'static,
+        S: LocalSpawner,
+        R: E2ERegistryHandle,
+    {
+        let (rx_tx, rx_rx) = C::bounded::<Result<ReceivedMessage<MessageDefinitions>, Error>, 16>();
+        let (tx_tx, tx_rx) = C::bounded::<SendMessage<MessageDefinitions, C>, 16>();
+        let options = {
+            let mut o = SocketOptions::new();
+            o.reuse_address = true;
+            o
+        };
+        let bind_addr = SocketAddrV4::new(Ipv4Addr::UNSPECIFIED, port);
+        let socket = factory.bind(bind_addr, &options).await?;
         let port = socket.local_addr()?.port();
-        Self::spawn_socket_loop(socket, rx_tx, tx_rx, e2e_registry);
+        let fut = Self::socket_loop_future(socket, rx_tx, tx_rx, e2e_registry);
+        spawner.spawn_local(fut);
         Ok(Self {
             receiver: rx_rx,
             sender: tx_tx,
@@ -147,14 +443,33 @@ where
         target_addr: SocketAddrV4,
         message: Message<MessageDefinitions>,
     ) -> Result<(), Error> {
-        let (result_channel, message) = SendMessage::new(target_addr, message);
-        self.sender.send(message).await.map_err(|e| {
-            error!("Socket error: {e} when attempting to send message");
+        // Pre-encode size check: fail fast with `Error::Capacity("udp_buffer")`
+        // for messages that exceed `UDP_BUFFER_SIZE`. Mirrors the analogous
+        // check in `server::EventPublisher` so callers see a uniform
+        // overload signal regardless of which path produced the oversize
+        // message. Without this, an oversize encode would surface as a
+        // protocol-level I/O error from inside the socket loop.
+        let required = message.required_size();
+        if required > UDP_BUFFER_SIZE {
+            warn!(
+                "outgoing message size {required} exceeds UDP_BUFFER_SIZE ({UDP_BUFFER_SIZE}); rejecting with Capacity(\"udp_buffer\")"
+            );
+            return Err(Error::Capacity("udp_buffer"));
+        }
+        let (result_channel, message) =
+            SendMessage::<MessageDefinitions, C>::new(target_addr, message);
+        self.sender.send(message).await.map_err(|()| {
+            error!("Socket error when attempting to send message");
             Error::SocketClosedUnexpectedly
         })?;
-        result_channel
-            .await
-            .expect("Socket manager must always return result of send before dropping channel")?;
+        // The socket loop's response sender can be dropped without sending
+        // (executor cancellation, bare-metal `Spawner` that drops futures,
+        // or a panic in the loop). Surface that as a typed error rather
+        // than `.expect`-panicking the caller.
+        result_channel.recv().await.map_err(|_| {
+            debug!("send result channel dropped (socket loop gone)");
+            Error::SocketClosedUnexpectedly
+        })??;
         if self.session_id == u16::MAX {
             self.session_id = 1;
             self.session_has_wrapped = true;
@@ -174,7 +489,7 @@ where
     }
 
     pub async fn receive(&mut self) -> Option<Result<ReceivedMessage<MessageDefinitions>, Error>> {
-        self.receiver.recv().await
+        MpscRecv::recv(&mut self.receiver).await
     }
 
     /// Poll the receiver for a message without blocking.
@@ -201,171 +516,320 @@ where
             ..
         } = self;
         drop(sender);
-        _ = receiver.recv().await;
+        // Drain until the receiver returns `None` — i.e. the socket
+        // loop has dropped its sender. A single `recv()` could
+        // resolve via a buffered `ReceivedMessage` while the loop is
+        // still running and still holding the underlying transport
+        // socket; that would leave the OS-level fd / multicast group
+        // potentially still bound when the next `bind_*` ran. Loop
+        // until close is observed.
+        while MpscRecv::recv(&mut receiver).await.is_some() {}
     }
 
+    /// Build the I/O loop over any [`TransportSocket`] as a future.
+    /// Callers are expected to spawn this future alongside [`Self`];
+    /// the socket loop runs concurrently with its owner so
+    /// `SocketManager::send`'s internal oneshot wait can complete.
+    /// The reasoning for why the spawn hasn't been hoisted is in the
+    /// module-level docs.
+    ///
+    /// # `Send` bounds
+    ///
+    /// The returned future must be `Send + 'static` for `Spawner::spawn`.
+    /// This works on stable Rust (no RTN required) because:
+    /// - `T: Send + Sync + 'static` makes the captured socket `Send`.
+    /// - The HRTBs `for<'a> T::SendFuture<'a>: Send` and
+    ///   `for<'a> T::RecvFuture<'a>: Send` make the GAT-projected futures
+    ///   `Send` for every borrow lifetime, which is what propagates
+    ///   `Send` to the enclosing `async` block.
+    /// - All other captured state (`buf`, channels, registry) is `Send`.
+    ///
+    /// Bare-metal `TransportSocket` impls must ensure their `SendFuture`
+    /// and `RecvFuture` associated types are `Send` (e.g. by avoiding
+    /// `Rc` / `RefCell` in the future state) for this to compile.
     #[allow(clippy::too_many_lines)]
-    fn spawn_socket_loop(
-        socket: UdpSocket,
-        rx_tx: mpsc::Sender<Result<ReceivedMessage<MessageDefinitions>, Error>>,
-        mut tx_rx: mpsc::Receiver<SendMessage<MessageDefinitions>>,
-        e2e_registry: Arc<Mutex<E2ERegistry>>,
-    ) {
-        tokio::spawn(async move {
-            let mut buf = vec![0; 1400];
-            loop {
+    async fn socket_loop_future<T, R>(
+        socket: T,
+        rx_tx: C::BoundedSender<Result<ReceivedMessage<MessageDefinitions>, Error>, 16>,
+        mut tx_rx: C::BoundedReceiver<SendMessage<MessageDefinitions, C>, 16>,
+        e2e_registry: R,
+    ) where
+        T: TransportSocket + 'static,
+        R: E2ERegistryHandle,
+    {
+        // Maximum number of consecutive `recv_from` errors tolerated before
+        // the socket loop gives up. A single failure (transient I/O, peer
+        // RST, ICMP port-unreachable amplified into `ConnectionRefused`)
+        // is normal and should not tear down the socket. A persistent
+        // failure (e.g. `EBADF` after the kernel closed the fd, or a
+        // platform-level network-stack collapse) used to pin a CPU on a
+        // tight `error!` log loop with no exit; this counter caps that.
+        const MAX_CONSECUTIVE_RECV_ERRORS: u32 = 16;
+        let mut consecutive_recv_errors: u32 = 0;
+        let mut buf = [0u8; UDP_BUFFER_SIZE];
+
+        loop {
+            // `select!` (not `select_biased!`) gives pseudo-random
+            // fairness across ready arms — matches prior
+            // `tokio::select!` behavior and avoids starving either
+            // the send or recv arm under sustained one-sided load.
+            //
+            // The fresh `.fuse()`'d per-iteration futures are pinned
+            // on the stack (required: `Fuse<_>` is not `Unpin`).
+            // Returning an `Outcome<P>` scalar from the inner block
+            // drops both pinned futures — and their `&mut buf` /
+            // `&mut socket` borrows — before the processing body
+            // below runs, so the body can re-borrow `buf` freely.
+            let outcome: Outcome<MessageDefinitions, C> = {
+                let send_fut = MpscRecv::recv(&mut tx_rx).fuse();
+                let recv_fut = socket.recv_from(&mut buf).fuse();
+                pin_mut!(send_fut, recv_fut);
                 select! {
-                    result = socket.recv_from(&mut buf) => {
-                        match result {
-                            Ok((bytes_received, source_address)) => {
-                                let parse_result = MessageView::parse(&buf[..bytes_received])
-                                    .and_then(|view| {
-                                        let header = view.header().to_owned();
-                                        let upper_header = header.upper_header_bytes();
-                                        let key = E2EKey::from_message_id(header.message_id());
-                                        let payload_bytes = view.payload_bytes();
-
-                                        // Apply E2E check if configured
-                                        let (e2e_status, effective_payload) = {
-                                            let mut registry = e2e_registry.lock().expect("e2e registry lock poisoned");
-                                            match registry.check(key, payload_bytes, upper_header) {
-                                                Some((status, stripped)) => (Some(status), stripped),
-                                                None => (None, payload_bytes),
-                                            }
-                                        };
-
-                                        let payload = MessageDefinitions::from_payload_bytes(header.message_id(), effective_payload)?;
-                                        Ok(ReceivedMessage {
-                                            message: Message::new(header, payload),
-                                            source: source_address,
-                                            e2e_status,
-                                        })
-                                    })
-                                    .map_err(Error::from);
-                                if let Ok(()) = rx_tx.send( parse_result ).await {} else {
-                                    info!("Socket Dropping");
-                                    // The receiver has been dropped, so we should exit
-                                    break;
+                    message = send_fut => Outcome::Send(message),
+                    result = recv_fut => Outcome::Recv(result),
+                }
+            };
+
+            match outcome {
+                Outcome::Send(Some(send_message)) => {
+                    trace!("Sending: {:?}", &send_message);
+                    let mut message_length =
+                        match send_message.message.encode(&mut buf.as_mut_slice()) {
+                            Ok(length) => length,
+                            Err(e) => {
+                                error!("Failed to encode message: {:?}", e);
+                                // If the sender is already closed we can't send the error back, so we shut everything down
+                                if let Ok(()) = send_message.response.send(Err(e.into())) {
+                                    // Successfully sent error back to sender, carry on
+                                    continue;
                                 }
+                                error!("Socket owner closed channel unexpectedly, closing socket.");
+                                break;
                             }
-                            Err(e) => {
+                        };
 
-                                error!("Error decoding message: {:?}", e);
-                            }
-                        }
-                    },
-                    message = tx_rx.recv() => {
-                        if let Some(send_message) = message {
-                            trace!("Sending: {:?}", &send_message);
-                            let mut message_length = match send_message.message.encode(&mut buf.as_mut_slice()) {
-                                Ok(length) => length,
-                                Err(e) => {
-                                    error!("Failed to encode message: {:?}", e);
-                                    // If the sender is already closed we can't send the error back, so we shut everything down
-                                    if let Ok(()) = send_message.response.send(Err(e.into())) {
-                                        // Successfully sent error back to sender, carry on
+                    // Apply E2E protect if configured. `protected`
+                    // is a disjoint stack buffer, so the input can
+                    // be borrowed directly out of `buf[16..]` with
+                    // no intermediate copy.
+                    {
+                        let key =
+                            E2EKey::from_message_id(send_message.message.header().message_id());
+                        if e2e_registry.contains_key(&key) {
+                            let upper_header: [u8; 8] =
+                                buf[8..16].try_into().expect("upper header slice");
+                            let mut protected = [0u8; UDP_BUFFER_SIZE];
+                            let result = e2e_registry.protect(
+                                key,
+                                &buf[16..message_length],
+                                upper_header,
+                                &mut protected,
+                            );
+                            match result {
+                                Some(Ok(protected_len)) => {
+                                    if 16 + protected_len > UDP_BUFFER_SIZE {
+                                        error!(
+                                            "E2E-protected payload ({} bytes) exceeds UDP_BUFFER_SIZE ({}); dropping send",
+                                            16 + protected_len,
+                                            UDP_BUFFER_SIZE
+                                        );
+                                        let _ = send_message
+                                            .response
+                                            .send(Err(Error::Capacity("udp_buffer")));
                                         continue;
                                     }
-                                    error!("Socket owner closed channel unexpectedly, closing socket.");
-                                    break;
+                                    #[allow(clippy::cast_possible_truncation)]
+                                    let new_length: u32 = 8 + protected_len as u32;
+                                    buf[4..8].copy_from_slice(&new_length.to_be_bytes());
+                                    buf[16..16 + protected_len]
+                                        .copy_from_slice(&protected[..protected_len]);
+                                    message_length = 16 + protected_len;
                                 }
-                            };
-
-                            // Apply E2E protect if configured
-                            {
-                                let key = E2EKey::from_message_id(send_message.message.header().message_id());
-                                let mut registry = e2e_registry.lock().expect("e2e registry lock poisoned");
-                                if registry.contains_key(&key) {
-                                    let original_payload = buf[16..message_length].to_vec();
-                                    let upper_header: [u8; 8] = buf[8..16].try_into().expect("upper header slice");
-                                    let mut protected = vec![0u8; original_payload.len() + PROFILE4_HEADER_SIZE];
-                                    match registry.protect(key, &original_payload, upper_header, &mut protected) {
-                                        Some(Ok(protected_len)) => {
-                                            #[allow(clippy::cast_possible_truncation)]
-                                            let new_length: u32 = 8 + protected_len as u32;
-                                            buf[4..8].copy_from_slice(&new_length.to_be_bytes());
-                                            if 16 + protected_len > buf.len() {
-                                                buf.resize(16 + protected_len, 0);
-                                            }
-                                            buf[16..16 + protected_len].copy_from_slice(&protected[..protected_len]);
-                                            message_length = 16 + protected_len;
-                                        }
-                                        Some(Err(e)) => {
-                                            error!("E2E protect error: {:?}", e);
-                                        }
-                                        None => unreachable!("contains_key was true"),
-                                    }
+                                Some(Err(e)) => {
+                                    error!(
+                                        "E2E protect failed for configured key {:?}: {:?}; \
+                                         refusing to send unprotected datagram",
+                                        key, e
+                                    );
+                                    let _ = send_message.response.send(Err(Error::E2e(e)));
+                                    continue;
                                 }
+                                None => unreachable!("contains_key was true"),
                             }
+                        }
+                    }
 
-                            match socket.send_to(&buf[..message_length], send_message.target_addr).await {
-                                Ok(_bytes_sent) => {
-                                    trace!("Sent {} bytes to {}", message_length, send_message.target_addr);
-                                    if let Ok(()) = send_message.response.send(Ok(())) {} else {
-                                        info!("Socket owner closed channel, closing socket.");
-                                        // The sender has been dropped, so we should exit
-                                        break;
-                                    }
-                                }
-                                Err(e) => {
-                                    error!("Failed to send message with error: {:?}", e);
-                                    if let Ok(()) = send_message.response.send(Err(Error::Io(e))) {  } else {
-                                        error!("Socket owner closed channel unexpectedly, closing socket.");
-                                        break;
-                                    }
-                                }
+                    match socket
+                        .send_to(&buf[..message_length], send_message.target_addr)
+                        .await
+                    {
+                        Ok(()) => {
+                            trace!(
+                                "Sent {} bytes to {}",
+                                message_length, send_message.target_addr
+                            );
+                            if let Ok(()) = send_message.response.send(Ok(())) {
+                            } else {
+                                info!("Socket owner closed channel, closing socket.");
+                                // The sender has been dropped, so we should exit
+                                break;
+                            }
+                        }
+                        Err(e) => {
+                            error!("Failed to send message with error: {:?}", e);
+                            if let Ok(()) = send_message.response.send(Err(Error::Transport(e))) {
+                            } else {
+                                error!("Socket owner closed channel unexpectedly, closing socket.");
+                                break;
                             }
-                        } else {
-                            info!("Send channel closed, closing socket.");
-                            // The sender has been dropped, so we should exit
+                        }
+                    }
+                }
+                Outcome::Send(None) => {
+                    info!("Send channel closed, closing socket.");
+                    // The sender has been dropped, so we should exit
+                    break;
+                }
+                Outcome::Recv(Ok(ReceivedDatagram {
+                    bytes_received,
+                    source,
+                    truncated,
+                })) => {
+                    consecutive_recv_errors = 0;
+                    if truncated {
+                        // A truncated datagram cannot be parsed reliably;
+                        // the length field in the SOME/IP header will not
+                        // match the bytes we received. Log and drop.
+                        error!(
+                            "Discarding truncated datagram from {}: {} bytes received",
+                            source, bytes_received
+                        );
+                        continue;
+                    }
+                    let source_address = SocketAddr::V4(source);
+                    let parse_result = MessageView::parse(&buf[..bytes_received])
+                        .and_then(|view| {
+                            let header = view.header().to_owned();
+                            let upper_header = header.upper_header_bytes();
+                            let key = E2EKey::from_message_id(header.message_id());
+                            let payload_bytes = view.payload_bytes();
+
+                            // Apply E2E check if configured
+                            let (e2e_status, effective_payload) =
+                                match e2e_registry.check(key, payload_bytes, upper_header) {
+                                    Some((status, stripped)) => (Some(status), stripped),
+                                    None => (None, payload_bytes),
+                                };
+
+                            let payload = MessageDefinitions::from_payload_bytes(
+                                header.message_id(),
+                                effective_payload,
+                            )?;
+                            Ok(ReceivedMessage {
+                                message: Message::new(header, payload),
+                                source: source_address,
+                                e2e_status,
+                            })
+                        })
+                        .map_err(Error::from);
+                    if rx_tx.send(parse_result).await.is_ok() {
+                    } else {
+                        info!("Socket Dropping");
+                        // The receiver has been dropped, so we should exit
+                        break;
+                    }
+                }
+                Outcome::Recv(Err(recv_err)) => {
+                    // Classify by transport kind: transient kinds
+                    // (ConnectionRefused from inbound ICMP
+                    // port-unreachable, WouldBlock, Interrupted,
+                    // TimedOut, NetworkUnreachable) do NOT count
+                    // toward the consecutive-error cap — a peer
+                    // dying after a flurry of our requests easily
+                    // produces 16 ICMP storms in microseconds, and
+                    // tearing down a healthy socket on that signal
+                    // is wrong. Only fatal kinds (e.g. EBADF mapped
+                    // to `Other`) count toward the kill cap.
+                    let transient = matches!(
+                        recv_err,
+                        crate::transport::TransportError::Io(kind) if kind.is_transient_recv()
+                    );
+                    if transient {
+                        debug!("socket recv_from transient error: {:?}", recv_err);
+                    } else {
+                        consecutive_recv_errors = consecutive_recv_errors.saturating_add(1);
+                        debug!(
+                            "socket recv_from fatal-class error ({}/{}): {:?}",
+                            consecutive_recv_errors, MAX_CONSECUTIVE_RECV_ERRORS, recv_err,
+                        );
+                        if consecutive_recv_errors >= MAX_CONSECUTIVE_RECV_ERRORS {
+                            error!(
+                                "socket recv_from failed {} times consecutively with fatal-class \
+                                 errors; closing socket loop",
+                                consecutive_recv_errors,
+                            );
                             break;
                         }
                     }
                 }
             }
-        });
+        }
     }
 }
 
-#[cfg(test)]
+#[cfg(all(test, feature = "client-tokio"))]
 mod tests {
     use super::*;
+    use crate::e2e::E2ERegistry;
     use crate::protocol::sd::test_support::{TestPayload, empty_sd_header};
+    use crate::tokio_transport::{TokioChannels, TokioSpawner};
+    use std::boxed::Box;
     use std::format;
+    use std::sync::{Arc, Mutex};
+    use std::vec;
+    // Tests build ad-hoc UDP peers via tokio directly; this is not part of
+    // the production code path, which goes through the `TransportSocket`
+    // abstraction via `TokioTransport`.
+    use tokio::net::UdpSocket;
 
-    type TestSocketManager = SocketManager<TestPayload>;
+    type TestSocketManager = SocketManager<TestPayload, TokioChannels>;
 
     fn test_registry() -> Arc<Mutex<E2ERegistry>> {
         Arc::new(Mutex::new(E2ERegistry::new()))
     }
 
+    async fn bind_ephemeral_spawned() -> TestSocketManager {
+        TestSocketManager::bind(0, test_registry()).await.unwrap()
+    }
+
     #[tokio::test]
     async fn test_bind_ephemeral_port() {
-        let sm = TestSocketManager::bind(0, test_registry()).unwrap();
+        let sm = bind_ephemeral_spawned().await;
         assert!(sm.port() > 0);
         assert_eq!(sm.session_id(), 1);
     }
 
     #[tokio::test]
     async fn test_send_message_new() {
+        use crate::transport::OneshotRecv;
         let target = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 1234);
         let msg = Message::new_sd(1, &empty_sd_header());
-        let (rx, send_msg) = SendMessage::<TestPayload>::new(target, msg);
+        let (rx, send_msg) = SendMessage::<TestPayload, TokioChannels>::new(target, msg);
         assert_eq!(send_msg.target_addr, target);
         // Verify the oneshot channel works
         send_msg.response.send(Ok(())).unwrap();
-        assert!(rx.await.unwrap().is_ok());
+        assert!(rx.recv().await.unwrap().is_ok());
     }
 
     #[tokio::test]
     async fn test_socket_manager_shut_down() {
-        let sm = TestSocketManager::bind(0, test_registry()).unwrap();
+        let sm = bind_ephemeral_spawned().await;
         sm.shut_down().await;
     }
 
     #[tokio::test]
     async fn test_socket_manager_send_and_receive() {
-        let mut sm = TestSocketManager::bind(0, test_registry()).unwrap();
+        let mut sm = bind_ephemeral_spawned().await;
         let sm_port = sm.port();
 
         // Create a raw UDP socket to send data to the SocketManager
@@ -397,7 +861,7 @@ mod tests {
 
     #[tokio::test]
     async fn test_poll_receive() {
-        let mut sm = TestSocketManager::bind(0, test_registry()).unwrap();
+        let mut sm = bind_ephemeral_spawned().await;
         let sm_port = sm.port();
 
         // Send a message to the socket manager from a raw socket
@@ -423,7 +887,7 @@ mod tests {
 
     #[tokio::test]
     async fn test_send_drops_when_socket_loop_exits() {
-        let mut sm = TestSocketManager::bind(0, test_registry()).unwrap();
+        let mut sm = bind_ephemeral_spawned().await;
         // Shut down the socket loop by dropping the internal channels
         // We can't directly kill the loop, but we can test the error path
         // by sending to a socket manager that has been shut down.
@@ -460,14 +924,14 @@ mod tests {
     async fn test_send_message_debug() {
         let target = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 1234);
         let msg = Message::<TestPayload>::new_sd(1, &empty_sd_header());
-        let (_rx, send_msg) = SendMessage::<TestPayload>::new(target, msg);
+        let (_rx, send_msg) = SendMessage::<TestPayload, TokioChannels>::new(target, msg);
         let s = format!("{send_msg:?}");
         assert!(s.contains("SendMessage"));
     }
 
     #[tokio::test]
     async fn test_socket_manager_debug() {
-        let sm = TestSocketManager::bind(0, test_registry()).unwrap();
+        let sm = bind_ephemeral_spawned().await;
         let s = format!("{sm:?}");
         assert!(s.contains("SocketManager"));
         sm.shut_down().await;
@@ -475,7 +939,7 @@ mod tests {
 
     #[tokio::test]
     async fn test_socket_manager_send_to_target() {
-        let mut sm = TestSocketManager::bind(0, test_registry()).unwrap();
+        let mut sm = bind_ephemeral_spawned().await;
 
         // Create a raw socket to receive
         let raw_socket = UdpSocket::bind("127.0.0.1:0").await.unwrap();
@@ -514,19 +978,20 @@ mod tests {
             false,
             false,
         )
+        .await
         .unwrap();
         assert_eq!(sm.session_id(), 1, "session_id 0 must be normalized to 1");
     }
 
     #[tokio::test]
     async fn test_session_id_wraps_to_one_and_clears_reboot_flag() {
-        let mut sm = TestSocketManager::bind(0, test_registry()).unwrap();
+        use crate::protocol::sd::RebootFlag;
+        let mut sm = bind_ephemeral_spawned().await;
         let raw_socket = UdpSocket::bind("127.0.0.1:0").await.unwrap();
         let target =
             SocketAddrV4::new(Ipv4Addr::LOCALHOST, raw_socket.local_addr().unwrap().port());
         let msg = || Message::<TestPayload>::new_sd(1, &empty_sd_header());
 
-        use crate::protocol::sd::RebootFlag;
         // Set session_id to one before the wrap point
         sm.session_id = u16::MAX - 1;
         assert_eq!(
@@ -562,4 +1027,330 @@ mod tests {
             "reboot flag stays Continuous after wrap"
         );
     }
+
+    #[tokio::test]
+    async fn send_e2e_protected_payload_exceeding_udp_buffer_returns_capacity_error() {
+        use crate::RawPayload;
+        use crate::e2e::{E2EProfile, Profile4Config};
+        use crate::protocol::{Header, MessageId, MessageType, MessageTypeField, ReturnCode};
+
+        // Craft a message whose raw-encoded size fits UDP_BUFFER_SIZE (16-byte
+        // SOME/IP header + payload <= cap) but whose E2E-protected size
+        // does not — Profile 4 adds `PROFILE4_HEADER_SIZE = 12` bytes,
+        // so a payload of `UDP_BUFFER_SIZE - 16 - 4` exactly fits raw and
+        // overflows by 8 once protected. Derive both fixture sizes from
+        // `UDP_BUFFER_SIZE` so this stays correct if the constant moves.
+        const SOMEIP_HEADER_SIZE: usize = 16;
+        const PAYLOAD_LEN: usize = UDP_BUFFER_SIZE - SOMEIP_HEADER_SIZE - 4;
+
+        // Register an E2E profile so the protect branch runs.
+        let message_id = MessageId::new_from_service_and_method(0x1234, 0x5678);
+        let key = E2EKey::from_message_id(message_id);
+        let mut reg = E2ERegistry::new();
+        reg.register(key, E2EProfile::Profile4(Profile4Config::new(0, 15)));
+        let e2e_registry = Arc::new(Mutex::new(reg));
+
+        let mut sm = SocketManager::<RawPayload, TokioChannels>::bind(0, e2e_registry)
+            .await
+            .unwrap();
+
+        let payload_bytes = [0u8; PAYLOAD_LEN];
+        let payload = RawPayload::from_payload_bytes(message_id, &payload_bytes).unwrap();
+        let header = Header::new(
+            message_id,
+            0x0001_0001,
+            0x01,
+            0x01,
+            MessageTypeField::new(MessageType::Request, false),
+            ReturnCode::Ok,
+            payload_bytes.len(),
+        );
+        let message = Message::new(header, payload);
+
+        let target = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 9999);
+        let err = sm
+            .send(target, message)
+            .await
+            .expect_err("E2E-protected oversize message must error");
+        match err {
+            Error::Capacity(tag) => assert_eq!(tag, "udp_buffer"),
+            other => panic!("expected Error::Capacity(\"udp_buffer\"), got {other:?}"),
+        }
+    }
+
+    /// Proves the public `bind_with_transport` entry point accepts an
+    /// alternative `TransportFactory` implementation. The factory here is
+    /// a thin interceptor that counts how many times `bind` is called; it
+    /// delegates to the built-in `TokioTransport`, which is what the
+    /// current `Socket = TokioSocket` bound requires.
+    #[tokio::test]
+    async fn bind_with_transport_accepts_custom_factory() {
+        use crate::tokio_transport::{TokioSocket, TokioTransport};
+        use core::future::Future;
+        use core::sync::atomic::{AtomicUsize, Ordering};
+
+        struct CountingFactory {
+            inner: TokioTransport,
+            calls: AtomicUsize,
+        }
+
+        impl TransportFactory for CountingFactory {
+            type Socket = TokioSocket;
+            type BindFuture<'a> = core::pin::Pin<
+                Box<
+                    dyn Future<Output = Result<Self::Socket, crate::transport::TransportError>>
+                        + Send
+                        + 'a,
+                >,
+            >;
+            fn bind<'a>(
+                &'a self,
+                addr: SocketAddrV4,
+                options: &'a SocketOptions,
+            ) -> Self::BindFuture<'a> {
+                self.calls.fetch_add(1, Ordering::SeqCst);
+                let options = *options;
+                let inner = self.inner;
+                Box::pin(async move { inner.bind(addr, &options).await })
+            }
+        }
+
+        let factory = CountingFactory {
+            inner: TokioTransport,
+            calls: AtomicUsize::new(0),
+        };
+
+        let sm =
+            TestSocketManager::bind_with_transport(&factory, &TokioSpawner, 0, test_registry())
+                .await
+                .expect("bind via custom factory");
+        assert_eq!(
+            factory.calls.load(Ordering::SeqCst),
+            1,
+            "custom factory should have been invoked exactly once"
+        );
+        drop(sm);
+    }
+
+    /// End-to-end proof that a custom `TransportFactory` actually
+    /// carries traffic through the full `SocketManager` path. Sends a
+    /// SOME/IP-SD message from one bound `SocketManager` to a raw tokio
+    /// socket, verifies the bytes arrive intact. Complements the lighter
+    /// `bind_with_transport_accepts_custom_factory` by exercising
+    /// `send_to` + the spawned I/O loop, not just the bind call.
+    #[tokio::test]
+    async fn bind_with_transport_carries_traffic_end_to_end() {
+        use crate::tokio_transport::{TokioSocket, TokioTransport};
+        use core::future::Future;
+
+        // Factory that overrides `SocketOptions` to force
+        // `reuse_address = true` regardless of caller-provided flags —
+        // proves the factory sits in the hot path.
+        struct ForceReuseFactory;
+        impl TransportFactory for ForceReuseFactory {
+            type Socket = TokioSocket;
+            type BindFuture<'a> = core::pin::Pin<
+                Box<
+                    dyn Future<Output = Result<Self::Socket, crate::transport::TransportError>>
+                        + Send
+                        + 'a,
+                >,
+            >;
+            fn bind<'a>(
+                &'a self,
+                addr: SocketAddrV4,
+                options: &'a SocketOptions,
+            ) -> Self::BindFuture<'a> {
+                let mut opts = *options;
+                opts.reuse_address = true;
+                Box::pin(async move { TokioTransport.bind(addr, &opts).await })
+            }
+        }
+
+        let mut sm = SocketManager::<TestPayload, TokioChannels>::bind_with_transport(
+            &ForceReuseFactory,
+            &TokioSpawner,
+            0,
+            test_registry(),
+        )
+        .await
+        .expect("bind via custom factory");
+        let sm_port = sm.port();
+
+        let recv = UdpSocket::bind("127.0.0.1:0").await.unwrap();
+        let recv_port = recv.local_addr().unwrap().port();
+
+        let msg = Message::<TestPayload>::new_sd(1, &empty_sd_header());
+        sm.send(SocketAddrV4::new(Ipv4Addr::LOCALHOST, recv_port), msg)
+            .await
+            .expect("send_to via custom-factory-built socket");
+
+        let mut buf = [0u8; UDP_BUFFER_SIZE];
+        let (len, from) =
+            tokio::time::timeout(std::time::Duration::from_secs(2), recv.recv_from(&mut buf))
+                .await
+                .expect("timed out waiting for datagram")
+                .expect("recv failed");
+
+        assert!(len > 0, "empty datagram");
+        match from {
+            std::net::SocketAddr::V4(v4) => assert_eq!(v4.port(), sm_port),
+            other @ std::net::SocketAddr::V6(_) => {
+                panic!("unexpected source address family: {other:?}")
+            }
+        }
+
+        // Parse and confirm it's a SOME/IP-SD message, not garbage.
+        let view = MessageView::parse(&buf[..len]).unwrap();
+        assert_eq!(view.header().message_id(), crate::protocol::MessageId::SD);
+    }
+
+    /// Type-witness: proves `bind_with_transport` accepts a factory
+    /// whose `Socket` type is **not** `TokioSocket`. This is a
+    /// type-system claim, and without this test the trait surface could
+    /// regress to a Tokio pin in a future refactor without any test
+    /// catching it. The existing `bind_with_transport_*` tests both
+    /// hardcode `type Socket = TokioSocket`, which only covers the
+    /// tokio-default shape.
+    ///
+    /// `WrappedSocket` is a transparent newtype around `TokioSocket`
+    /// with its own `TransportSocket` impl — the *type identity* is
+    /// what matters for this test, not the behavior. The end-to-end
+    /// send-and-verify confirms the spawned I/O loop also carries
+    /// through the wrapper, not just the bind call.
+    #[tokio::test]
+    async fn bind_with_transport_accepts_non_tokio_socket_type() {
+        use crate::tokio_transport::{TokioSocket, TokioTransport};
+        use crate::transport::TransportError;
+        use core::future::Future;
+
+        struct WrappedSocket(TokioSocket);
+
+        impl TransportSocket for WrappedSocket {
+            // Borrow the inner socket's named GAT futures; this keeps
+            // the wrapper zero-overhead while still exercising a
+            // distinct `Self::Socket` type at the bind call site.
+            type SendFuture<'a> = <TokioSocket as TransportSocket>::SendFuture<'a>;
+            type RecvFuture<'a> = <TokioSocket as TransportSocket>::RecvFuture<'a>;
+
+            fn send_to<'a>(&'a self, buf: &'a [u8], target: SocketAddrV4) -> Self::SendFuture<'a> {
+                self.0.send_to(buf, target)
+            }
+            fn recv_from<'a>(&'a self, buf: &'a mut [u8]) -> Self::RecvFuture<'a> {
+                self.0.recv_from(buf)
+            }
+            fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+                self.0.local_addr()
+            }
+            fn join_multicast_v4(
+                &self,
+                group: Ipv4Addr,
+                iface: Ipv4Addr,
+            ) -> Result<(), TransportError> {
+                self.0.join_multicast_v4(group, iface)
+            }
+            fn leave_multicast_v4(
+                &self,
+                group: Ipv4Addr,
+                iface: Ipv4Addr,
+            ) -> Result<(), TransportError> {
+                self.0.leave_multicast_v4(group, iface)
+            }
+        }
+
+        struct WrappingFactory;
+        impl TransportFactory for WrappingFactory {
+            type Socket = WrappedSocket;
+            type BindFuture<'a> = core::pin::Pin<
+                Box<dyn Future<Output = Result<Self::Socket, TransportError>> + Send + 'a>,
+            >;
+            fn bind<'a>(
+                &'a self,
+                addr: SocketAddrV4,
+                options: &'a SocketOptions,
+            ) -> Self::BindFuture<'a> {
+                let opts = *options;
+                Box::pin(async move {
+                    let inner = TokioTransport.bind(addr, &opts).await?;
+                    Ok(WrappedSocket(inner))
+                })
+            }
+        }
+
+        // Compile-time witness: this `let` binding only typechecks if
+        // `bind_with_transport` accepts `F::Socket = WrappedSocket` —
+        // i.e. the previous `F::Socket = TokioSocket` pin is gone.
+        let mut sm = SocketManager::<TestPayload, TokioChannels>::bind_with_transport(
+            &WrappingFactory,
+            &TokioSpawner,
+            0,
+            test_registry(),
+        )
+        .await
+        .expect("bind via wrapping factory");
+        let sm_port = sm.port();
+
+        // Runtime witness: traffic flows through the wrapper's
+        // `send_to` and the spawned I/O loop's `recv_from`.
+        let recv = UdpSocket::bind("127.0.0.1:0").await.unwrap();
+        let recv_port = recv.local_addr().unwrap().port();
+
+        let msg = Message::<TestPayload>::new_sd(1, &empty_sd_header());
+        sm.send(SocketAddrV4::new(Ipv4Addr::LOCALHOST, recv_port), msg)
+            .await
+            .expect("send via wrapping factory");
+
+        let mut buf = [0u8; UDP_BUFFER_SIZE];
+        let (len, _from) =
+            tokio::time::timeout(std::time::Duration::from_secs(2), recv.recv_from(&mut buf))
+                .await
+                .expect("timed out waiting for datagram")
+                .expect("recv failed");
+        assert!(len > 0, "empty datagram");
+        let view = MessageView::parse(&buf[..len]).unwrap();
+        assert_eq!(view.header().message_id(), crate::protocol::MessageId::SD);
+        let _ = sm_port;
+    }
+
+    /// Negative test: a factory that returns
+    /// `Err(TransportError::AddressInUse)` must surface as
+    /// `Err(Error::Transport(TransportError::AddressInUse))` through
+    /// the `?` + `From` conversion chain in
+    /// `bind_with_transport`. Catches regressions in the `#[from]`
+    /// impl on `client::Error` or the return-type plumbing.
+    #[tokio::test]
+    async fn bind_with_transport_propagates_factory_error() {
+        use crate::tokio_transport::TokioSocket;
+        use crate::transport::TransportError;
+
+        struct AlwaysBusyFactory;
+        impl TransportFactory for AlwaysBusyFactory {
+            type Socket = TokioSocket;
+            type BindFuture<'a> = core::pin::Pin<
+                Box<dyn Future<Output = Result<Self::Socket, TransportError>> + Send + 'a>,
+            >;
+            fn bind<'a>(
+                &'a self,
+                _addr: SocketAddrV4,
+                _options: &'a SocketOptions,
+            ) -> Self::BindFuture<'a> {
+                Box::pin(async move { Err(TransportError::AddressInUse) })
+            }
+        }
+
+        let err = TestSocketManager::bind_with_transport(
+            &AlwaysBusyFactory,
+            &TokioSpawner,
+            0,
+            test_registry(),
+        )
+        .await
+        .expect_err("factory returned Err, bind must surface it");
+        match err {
+            Error::Transport(TransportError::AddressInUse) => {}
+            other => {
+                panic!("expected Error::Transport(TransportError::AddressInUse), got {other:?}")
+            }
+        }
+    }
 }
diff --git a/src/e2e/crc.rs b/src/e2e/crc.rs
index 2eb08d7..91e60ca 100644
--- a/src/e2e/crc.rs
+++ b/src/e2e/crc.rs
@@ -115,10 +115,10 @@ mod tests {
     #[test]
     fn test_crc32_p4_basic() {
         // Basic smoke test - verify CRC changes with different inputs
-        let crc1 = compute_crc32_p4(10, 0, 0x12345678, b"test");
-        let crc2 = compute_crc32_p4(10, 1, 0x12345678, b"test");
-        let crc3 = compute_crc32_p4(10, 0, 0x12345679, b"test");
-        let crc4 = compute_crc32_p4(10, 0, 0x12345678, b"Test");
+        let crc1 = compute_crc32_p4(10, 0, 0x1234_5678, b"test");
+        let crc2 = compute_crc32_p4(10, 1, 0x1234_5678, b"test");
+        let crc3 = compute_crc32_p4(10, 0, 0x1234_5679, b"test");
+        let crc4 = compute_crc32_p4(10, 0, 0x1234_5678, b"Test");
 
         assert_ne!(crc1, crc2, "Different counter should produce different CRC");
         assert_ne!(crc1, crc3, "Different data_id should produce different CRC");
@@ -141,8 +141,8 @@ mod tests {
     #[test]
     fn test_crc32_p4_deterministic() {
         // Same inputs should always produce same output
-        let crc1 = compute_crc32_p4(20, 5, 0xABCDEF01, b"payload data");
-        let crc2 = compute_crc32_p4(20, 5, 0xABCDEF01, b"payload data");
+        let crc1 = compute_crc32_p4(20, 5, 0xABCD_EF01, b"payload data");
+        let crc2 = compute_crc32_p4(20, 5, 0xABCD_EF01, b"payload data");
         assert_eq!(crc1, crc2);
     }
 
@@ -157,7 +157,7 @@ mod tests {
     #[test]
     fn test_crc32_p4_empty_payload() {
         // Should work with empty payload
-        let crc = compute_crc32_p4(8, 0, 0x12345678, b"");
+        let crc = compute_crc32_p4(8, 0, 0x1234_5678, b"");
         assert_ne!(crc, 0); // CRC should be non-trivial even for empty payload
     }
 
diff --git a/src/e2e/e2e_checker.rs b/src/e2e/e2e_checker.rs
index 549f744..e8b7377 100644
--- a/src/e2e/e2e_checker.rs
+++ b/src/e2e/e2e_checker.rs
@@ -250,7 +250,7 @@ mod tests {
 
     #[test]
     fn test_check_profile4_valid() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -267,8 +267,8 @@ mod tests {
 
     #[test]
     fn test_check_profile4_wrong_data_id() {
-        let config1 = Profile4Config::new(0x12345678, 15);
-        let config2 = Profile4Config::new(0xDEADBEEF, 15);
+        let config1 = Profile4Config::new(0x1234_5678, 15);
+        let config2 = Profile4Config::new(0xDEAD_BEEF, 15);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -283,7 +283,7 @@ mod tests {
 
     #[test]
     fn test_check_profile4_corrupted_crc() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -300,7 +300,7 @@ mod tests {
 
     #[test]
     fn test_check_profile4_corrupted_payload() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -317,7 +317,7 @@ mod tests {
 
     #[test]
     fn test_check_profile4_wrong_length() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -332,7 +332,7 @@ mod tests {
 
     #[test]
     fn test_check_profile4_too_short() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut check_state = Profile4State::new();
 
         let short = [0u8; 11]; // Less than 12-byte header
@@ -389,7 +389,7 @@ mod tests {
 
     #[test]
     fn test_sequence_repeated() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -409,7 +409,7 @@ mod tests {
 
     #[test]
     fn test_sequence_consecutive() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -425,7 +425,7 @@ mod tests {
 
     #[test]
     fn test_sequence_some_lost() {
-        let config = Profile4Config::new(0x12345678, 10);
+        let config = Profile4Config::new(0x1234_5678, 10);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -450,7 +450,7 @@ mod tests {
 
     #[test]
     fn test_sequence_wrong_sequence() {
-        let config = Profile4Config::new(0x12345678, 3);
+        let config = Profile4Config::new(0x1234_5678, 3);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -475,7 +475,7 @@ mod tests {
 
     #[test]
     fn test_sequence_wraparound() {
-        let config = Profile4Config::new(0x12345678, 5);
+        let config = Profile4Config::new(0x1234_5678, 5);
         let mut protect_state = Profile4State::with_initial_counter(u16::MAX - 2);
         let mut check_state = Profile4State::new();
 
@@ -533,7 +533,7 @@ mod tests {
 
         assert_eq!(result.status, E2ECheckStatus::Ok);
         assert_eq!(result.counter, Some(0));
-        assert_eq!(result.payload.as_deref(), Some(payload.as_slice()));
+        assert_eq!(result.payload, Some(payload.as_slice()));
     }
 
     #[test]
diff --git a/src/e2e/e2e_protector.rs b/src/e2e/e2e_protector.rs
index 90122f8..9a3d48d 100644
--- a/src/e2e/e2e_protector.rs
+++ b/src/e2e/e2e_protector.rs
@@ -196,7 +196,7 @@ mod tests {
 
     #[test]
     fn test_protect_profile4_header_format() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut state = Profile4State::new();
 
         let payload = b"test";
@@ -217,7 +217,7 @@ mod tests {
 
         // Check data_id field (bytes 4-7)
         let data_id = u32::from_be_bytes([protected[4], protected[5], protected[6], protected[7]]);
-        assert_eq!(data_id, 0x12345678);
+        assert_eq!(data_id, 0x1234_5678);
 
         // Check payload at end
         assert_eq!(&protected[12..], b"test");
@@ -225,7 +225,7 @@ mod tests {
 
     #[test]
     fn test_protect_profile4_counter_increment() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut state = Profile4State::new();
 
         let payload = b"test";
@@ -241,7 +241,7 @@ mod tests {
 
     #[test]
     fn test_protect_profile4_counter_wraps() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut state = Profile4State::with_initial_counter(u16::MAX);
 
         let payload = b"test";
@@ -400,7 +400,7 @@ mod tests {
 
     #[test]
     fn test_protect_profile4_buffer_too_small() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut state = Profile4State::new();
 
         let payload = b"test";
@@ -458,7 +458,7 @@ mod tests {
     #[test]
     #[cfg(feature = "std")]
     fn test_protect_profile4_length_overflow() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut state = Profile4State::new();
 
         // payload of 65536 bytes => total = 12 + 65536 = 65548 > u16::MAX
@@ -470,7 +470,7 @@ mod tests {
 
     #[test]
     fn test_protect_profile4_empty_payload() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut state = Profile4State::new();
 
         let mut buf = [0u8; 256];
diff --git a/src/e2e/mod.rs b/src/e2e/mod.rs
index 233db20..02a52b6 100644
--- a/src/e2e/mod.rs
+++ b/src/e2e/mod.rs
@@ -12,7 +12,7 @@
 //!     E2ECheckStatus,
 //! };
 //!
-//! let config = Profile4Config::new(0x12345678, 15);
+//! let config = Profile4Config::new(0x1234_5678, 15);
 //! let mut protect_state = Profile4State::new();
 //! let mut check_state = Profile4State::new();
 //!
@@ -251,7 +251,7 @@ mod tests {
 
     #[test]
     fn test_profile4_roundtrip() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -291,7 +291,7 @@ mod tests {
 
     #[test]
     fn test_profile4_sequence_detection() {
-        let config = Profile4Config::new(0x12345678, 5);
+        let config = Profile4Config::new(0x1234_5678, 5);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -319,7 +319,7 @@ mod tests {
 
     #[test]
     fn test_profile4_some_lost_detection() {
-        let config = Profile4Config::new(0x12345678, 5);
+        let config = Profile4Config::new(0x1234_5678, 5);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -343,7 +343,7 @@ mod tests {
 
     #[test]
     fn test_profile4_wrong_sequence_detection() {
-        let config = Profile4Config::new(0x12345678, 2);
+        let config = Profile4Config::new(0x1234_5678, 2);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -368,7 +368,7 @@ mod tests {
 
     #[test]
     fn test_profile4_crc_error() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut protect_state = Profile4State::new();
         let mut check_state = Profile4State::new();
 
@@ -403,7 +403,7 @@ mod tests {
 
     #[test]
     fn test_profile4_bad_argument_short_message() {
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         let mut check_state = Profile4State::new();
 
         // Message too short (less than 12-byte header)
diff --git a/src/e2e/registry.rs b/src/e2e/registry.rs
index 0dcd8c8..7a7c39b 100644
--- a/src/e2e/registry.rs
+++ b/src/e2e/registry.rs
@@ -85,7 +85,7 @@ mod tests {
     fn register_and_check_profile4() {
         let mut reg = E2ERegistry::new();
         let key = make_key();
-        let config = Profile4Config::new(0x12345678, 15);
+        let config = Profile4Config::new(0x1234_5678, 15);
         reg.register(key, E2EProfile::Profile4(config.clone()));
         assert!(reg.contains_key(&key));
 
diff --git a/src/embassy_channels.rs b/src/embassy_channels.rs
new file mode 100644
index 0000000..3ce35d6
--- /dev/null
+++ b/src/embassy_channels.rs
@@ -0,0 +1,679 @@
+//! [`ChannelFactory`] backed by `embassy-sync::channel::Channel`. Active
+//! when the `embassy_channels` feature is enabled.
+//!
+//! # Heap allocation per call
+//!
+//! Both sender and receiver hold an `Arc<Inner<...>>`, and every
+//! call to [`EmbassySyncChannels::oneshot()`][of], [`bounded()`][bf], or
+//! [`unbounded()`][uf] heap-allocates a fresh `Arc<Inner<...>>`. The
+//! `Client` run-loop calls these per request-response pair — most
+//! notably, every method on `Client` that awaits a server response
+//! constructs a oneshot via this factory, so each such method
+//! triggers one `Arc` allocation.
+//!
+//! [of]: crate::transport::ChannelFactory::oneshot
+//! [bf]: crate::transport::ChannelFactory::bounded
+//! [uf]: crate::transport::ChannelFactory::unbounded
+//!
+//! # Use [`crate::static_channels`] for the no-alloc bare-metal path
+//!
+//! [`crate::static_channels`] ships a no-alloc `ChannelFactory` whose
+//! senders and receivers carry `&'static` references into pre-allocated
+//! [`OneshotPool`] / [`MpscPool`] storage. The
+//! [`define_static_channels!`][dsc] macro generates the per-`T`
+//! `*Pooled<MyChannels>` impls + a [`ChannelFactory`] impl on a unit
+//! struct.
+//!
+//! [`OneshotPool`]: crate::static_channels::OneshotPool
+//! [`MpscPool`]: crate::static_channels::MpscPool
+//! [dsc]: crate::define_static_channels
+//!
+//! `EmbassySyncChannels` remains useful for two cases:
+//!
+//! 1. Bringing up a bare-metal port on `std + alloc` targets where
+//!    you want the trait-surface integration validated before
+//!    declaring static pool sizes.
+//! 2. Demonstrating the `ChannelFactory` integration shape for
+//!    consumers writing their own backend.
+//!
+//! For production firmware targeting "zero heap after
+//! `Client::new` returns", switch to the macro-declared static
+//! pools.
+//!
+//! # Close semantics
+//!
+//! All six channel families honor the close contracts in
+//! [`crate::transport`]:
+//!
+//! - **Oneshot**: sender drop without `send` resolves the receiver's
+//!   `recv()` to `Err(OneshotCancelled)`. Receiver drop causes the
+//!   sender's `send()` to return `Err(value)`.
+//! - **Bounded MPSC**: when the receiver drops, any sender awaiting on
+//!   a full channel is woken and returns `Err(())`. When the last
+//!   sender drops, the receiver's `recv()` resolves to `None`.
+//! - **Unbounded MPSC**: same close contracts as bounded. `send_now`
+//!   returns `Err(value)` if either the channel is full or the
+//!   receiver has dropped.
+//!
+//! Multi-sender contention on a closed bounded channel: the close
+//! signal uses a `MultiWakerRegistration<8>`, so up to 8 awaiting
+//! senders are woken immediately on receiver drop. Beyond that cap
+//! the multi-waker auto-wakes-and-clears on the next register, so
+//! the close path remains correct under any sender count.
+
+use alloc::sync::Arc;
+use core::cell::RefCell;
+use core::future::{Future, poll_fn};
+use core::sync::atomic::{AtomicBool, AtomicUsize, Ordering};
+use core::task::Poll;
+use embassy_sync::blocking_mutex::Mutex as BlockingMutex;
+use embassy_sync::blocking_mutex::raw::CriticalSectionRawMutex;
+use embassy_sync::channel::Channel;
+use embassy_sync::waitqueue::{AtomicWaker, MultiWakerRegistration};
+
+/// Maximum number of distinct waiting senders we wake on receiver drop.
+/// More than this and the multi-waker auto-wakes-and-clears on the next
+/// register, so the close path remains correct under any sender count.
+const SEND_WAKER_CAP: usize = 8;
+
+use crate::transport::{
+    BoundedPooled, ChannelFactory, MpscRecv, MpscSend, OneshotCancelled, OneshotPooled,
+    OneshotRecv, OneshotSend, UnboundedPooled, UnboundedRecv, UnboundedSend,
+};
+
+// ── Oneshot (capacity-1 Channel) ──────────────────────────────────────
+
+struct OneshotInner<T: Send + 'static> {
+    chan: Channel<CriticalSectionRawMutex, T, 1>,
+    /// Cleared when the sender drops without sending; receiver's
+    /// `recv()` then resolves to `Err(OneshotCancelled)`.
+    sender_alive: AtomicBool,
+    /// Cleared when the receiver drops; sender's `send()` then
+    /// returns `Err(value)`.
+    receiver_alive: AtomicBool,
+    /// Wakes the receiver when the sender drops without sending.
+    cancel_waker: AtomicWaker,
+}
+
+impl<T: Send + 'static> OneshotInner<T> {
+    fn new() -> Self {
+        Self {
+            chan: Channel::new(),
+            sender_alive: AtomicBool::new(true),
+            receiver_alive: AtomicBool::new(true),
+            cancel_waker: AtomicWaker::new(),
+        }
+    }
+}
+
+pub struct EmbassySyncOneshotSender<T: Send + 'static> {
+    inner: Arc<OneshotInner<T>>,
+    sent: bool,
+}
+
+pub struct EmbassySyncOneshotReceiver<T: Send + 'static> {
+    inner: Arc<OneshotInner<T>>,
+}
+
+impl<T: Send + 'static> OneshotSend<T> for EmbassySyncOneshotSender<T> {
+    fn send(mut self, value: T) -> Result<(), T> {
+        if !self.inner.receiver_alive.load(Ordering::Acquire) {
+            return Err(value);
+        }
+        match self.inner.chan.try_send(value) {
+            Ok(()) => {
+                self.sent = true;
+                Ok(())
+            }
+            Err(embassy_sync::channel::TrySendError::Full(v)) => Err(v),
+        }
+    }
+}
+
+impl<T: Send + 'static> Drop for EmbassySyncOneshotSender<T> {
+    fn drop(&mut self) {
+        if !self.sent {
+            self.inner.sender_alive.store(false, Ordering::Release);
+            self.inner.cancel_waker.wake();
+        }
+    }
+}
+
+impl<T: Send + 'static> OneshotRecv<T> for EmbassySyncOneshotReceiver<T> {
+    // The complex `poll_fn` body with manual pinning requires an explicit
+    // async block rather than `async fn` syntax.
+    #[allow(clippy::manual_async_fn)]
+    fn recv(self) -> impl Future<Output = Result<T, OneshotCancelled>> + Send {
+        async move {
+            let inner = &self.inner;
+            poll_fn(move |cx| {
+                if let Ok(v) = inner.chan.try_receive() {
+                    return Poll::Ready(Ok(v));
+                }
+                if !inner.sender_alive.load(Ordering::Acquire) {
+                    return Poll::Ready(Err(OneshotCancelled));
+                }
+                inner.cancel_waker.register(cx.waker());
+                // Poll embassy's receive future to register on the
+                // channel's internal waker.
+                let mut fut = inner.chan.receive();
+                // SAFETY: stack-pinned, polled once, dropped before
+                // exiting this scope. No reference escapes.
+                let pinned = unsafe { core::pin::Pin::new_unchecked(&mut fut) };
+                if let Poll::Ready(v) = pinned.poll(cx) {
+                    return Poll::Ready(Ok(v));
+                }
+                // Re-check both signals after registration to close
+                // the lost-wakeup window.
+                if let Ok(v) = inner.chan.try_receive() {
+                    return Poll::Ready(Ok(v));
+                }
+                if !inner.sender_alive.load(Ordering::Acquire) {
+                    return Poll::Ready(Err(OneshotCancelled));
+                }
+                Poll::Pending
+            })
+            .await
+        }
+    }
+}
+
+impl<T: Send + 'static> Drop for EmbassySyncOneshotReceiver<T> {
+    fn drop(&mut self) {
+        self.inner.receiver_alive.store(false, Ordering::Release);
+    }
+}
+
+// ── MPSC Inner (shared by bounded + unbounded) ────────────────────────
+
+struct MpscInner<T: Send + 'static, const N: usize> {
+    chan: Channel<CriticalSectionRawMutex, T, N>,
+    /// Number of live senders (sum of all clones).
+    sender_count: AtomicUsize,
+    /// `true` once either the receiver dropped or the last sender
+    /// dropped. Senders observe this to short-circuit; receivers use
+    /// it as the empty-and-done signal.
+    closed: AtomicBool,
+    /// Wakes the receiver when the last sender drops.
+    recv_waker: AtomicWaker,
+    /// Wakes bounded senders awaiting on a full channel when the
+    /// receiver drops. Multi-slot so cloned senders are all woken,
+    /// not just the most-recently-registered one.
+    send_wakers:
+        BlockingMutex<CriticalSectionRawMutex, RefCell<MultiWakerRegistration<SEND_WAKER_CAP>>>,
+}
+
+impl<T: Send + 'static, const N: usize> MpscInner<T, N> {
+    fn new() -> Self {
+        Self {
+            chan: Channel::new(),
+            sender_count: AtomicUsize::new(1),
+            closed: AtomicBool::new(false),
+            recv_waker: AtomicWaker::new(),
+            send_wakers: BlockingMutex::new(RefCell::new(MultiWakerRegistration::new())),
+        }
+    }
+}
+
+// ── Bounded MPSC ──────────────────────────────────────────────────────
+
+pub struct EmbassySyncBoundedSender<T: Send + 'static, const N: usize> {
+    inner: Arc<MpscInner<T, N>>,
+}
+
+pub struct EmbassySyncBoundedReceiver<T: Send + 'static, const N: usize> {
+    inner: Arc<MpscInner<T, N>>,
+}
+
+impl<T: Send + 'static, const N: usize> Clone for EmbassySyncBoundedSender<T, N> {
+    fn clone(&self) -> Self {
+        self.inner.sender_count.fetch_add(1, Ordering::AcqRel);
+        Self {
+            inner: self.inner.clone(),
+        }
+    }
+}
+
+impl<T: Send + 'static, const N: usize> Drop for EmbassySyncBoundedSender<T, N> {
+    fn drop(&mut self) {
+        let prev = self.inner.sender_count.fetch_sub(1, Ordering::AcqRel);
+        if prev == 1 {
+            // Last sender — close the channel and wake the receiver.
+            self.inner.closed.store(true, Ordering::Release);
+            self.inner.recv_waker.wake();
+        }
+    }
+}
+
+impl<T: Send + 'static, const N: usize> MpscSend<T> for EmbassySyncBoundedSender<T, N> {
+    fn send(&self, value: T) -> impl Future<Output = Result<(), ()>> + Send + '_ {
+        let inner = self.inner.clone();
+        async move {
+            if inner.closed.load(Ordering::Acquire) {
+                drop(value);
+                return Err(());
+            }
+            // Pin embassy's SendFuture on the stack so the captured
+            // value survives across yields. Race against the closed
+            // flag.
+            let mut send_fut = core::pin::pin!(inner.chan.send(value));
+            poll_fn(|cx| {
+                if inner.closed.load(Ordering::Acquire) {
+                    return Poll::Ready(Err(()));
+                }
+                match send_fut.as_mut().poll(cx) {
+                    Poll::Ready(()) => Poll::Ready(Ok(())),
+                    Poll::Pending => {
+                        inner
+                            .send_wakers
+                            .lock(|w| w.borrow_mut().register(cx.waker()));
+                        if inner.closed.load(Ordering::Acquire) {
+                            return Poll::Ready(Err(()));
+                        }
+                        Poll::Pending
+                    }
+                }
+            })
+            .await
+        }
+    }
+}
+
+impl<T: Send + 'static, const N: usize> Drop for EmbassySyncBoundedReceiver<T, N> {
+    fn drop(&mut self) {
+        // Receiver gone — mark closed and wake every awaiting sender.
+        self.inner.closed.store(true, Ordering::Release);
+        self.inner.send_wakers.lock(|w| w.borrow_mut().wake());
+    }
+}
+
+impl<T: Send + 'static, const N: usize> MpscRecv<T> for EmbassySyncBoundedReceiver<T, N> {
+    fn recv(&mut self) -> impl Future<Output = Option<T>> + Send + '_ {
+        let inner = self.inner.clone();
+        async move { mpsc_recv_inner(inner).await }
+    }
+
+    fn poll_recv(&mut self, cx: &mut core::task::Context<'_>) -> core::task::Poll<Option<T>> {
+        mpsc_poll_recv(&self.inner, cx)
+    }
+}
+
+// ── Unbounded MPSC ────────────────────────────────────────────────────
+
+const UNBOUNDED_CAP: usize = 128;
+
+pub struct EmbassySyncUnboundedSender<T: Send + 'static> {
+    inner: Arc<MpscInner<T, UNBOUNDED_CAP>>,
+}
+
+pub struct EmbassySyncUnboundedReceiver<T: Send + 'static> {
+    inner: Arc<MpscInner<T, UNBOUNDED_CAP>>,
+}
+
+impl<T: Send + 'static> Clone for EmbassySyncUnboundedSender<T> {
+    fn clone(&self) -> Self {
+        self.inner.sender_count.fetch_add(1, Ordering::AcqRel);
+        Self {
+            inner: self.inner.clone(),
+        }
+    }
+}
+
+impl<T: Send + 'static> Drop for EmbassySyncUnboundedSender<T> {
+    fn drop(&mut self) {
+        let prev = self.inner.sender_count.fetch_sub(1, Ordering::AcqRel);
+        if prev == 1 {
+            self.inner.closed.store(true, Ordering::Release);
+            self.inner.recv_waker.wake();
+        }
+    }
+}
+
+impl<T: Send + 'static> UnboundedSend<T> for EmbassySyncUnboundedSender<T> {
+    fn send_now(&self, value: T) -> Result<(), T> {
+        if self.inner.closed.load(Ordering::Acquire) {
+            return Err(value);
+        }
+        self.inner.chan.try_send(value).map_err(|e| match e {
+            embassy_sync::channel::TrySendError::Full(v) => v,
+        })
+    }
+}
+
+impl<T: Send + 'static> Drop for EmbassySyncUnboundedReceiver<T> {
+    fn drop(&mut self) {
+        self.inner.closed.store(true, Ordering::Release);
+        self.inner.send_wakers.lock(|w| w.borrow_mut().wake());
+    }
+}
+
+impl<T: Send + 'static> UnboundedRecv<T> for EmbassySyncUnboundedReceiver<T> {
+    fn recv(&mut self) -> impl Future<Output = Option<T>> + Send + '_ {
+        let inner = self.inner.clone();
+        async move { mpsc_recv_inner(inner).await }
+    }
+}
+
+// ── Shared MPSC recv plumbing ─────────────────────────────────────────
+
+async fn mpsc_recv_inner<T: Send + 'static, const N: usize>(
+    inner: Arc<MpscInner<T, N>>,
+) -> Option<T> {
+    poll_fn(move |cx| mpsc_poll_recv(&inner, cx)).await
+}
+
+fn mpsc_poll_recv<T: Send + 'static, const N: usize>(
+    inner: &MpscInner<T, N>,
+    cx: &mut core::task::Context<'_>,
+) -> core::task::Poll<Option<T>> {
+    if let Ok(v) = inner.chan.try_receive() {
+        return Poll::Ready(Some(v));
+    }
+    if inner.closed.load(Ordering::Acquire) {
+        if let Ok(v) = inner.chan.try_receive() {
+            return Poll::Ready(Some(v));
+        }
+        return Poll::Ready(None);
+    }
+    inner.recv_waker.register(cx.waker());
+    // Poll embassy's receive future to register on its internal
+    // waker so per-value sends wake us.
+    let mut fut = inner.chan.receive();
+    // SAFETY: stack-pinned, polled once, dropped before this scope ends.
+    let pinned = unsafe { core::pin::Pin::new_unchecked(&mut fut) };
+    if let Poll::Ready(v) = pinned.poll(cx) {
+        return Poll::Ready(Some(v));
+    }
+    // Re-check both signals after registration.
+    if let Ok(v) = inner.chan.try_receive() {
+        return Poll::Ready(Some(v));
+    }
+    if inner.closed.load(Ordering::Acquire) {
+        if let Ok(v) = inner.chan.try_receive() {
+            return Poll::Ready(Some(v));
+        }
+        return Poll::Ready(None);
+    }
+    Poll::Pending
+}
+
+// ── ChannelFactory impl ───────────────────────────────────────────────
+
+/// [`ChannelFactory`] backed by `embassy-sync::channel::Channel`.
+#[derive(Clone, Copy)]
+pub struct EmbassySyncChannels;
+
+impl ChannelFactory for EmbassySyncChannels {
+    type OneshotSender<T: Send + 'static> = EmbassySyncOneshotSender<T>;
+    type OneshotReceiver<T: Send + 'static> = EmbassySyncOneshotReceiver<T>;
+
+    type BoundedSender<T: Send + 'static, const N: usize> = EmbassySyncBoundedSender<T, N>;
+    type BoundedReceiver<T: Send + 'static, const N: usize> = EmbassySyncBoundedReceiver<T, N>;
+
+    type UnboundedSender<T: Send + 'static> = EmbassySyncUnboundedSender<T>;
+    type UnboundedReceiver<T: Send + 'static> = EmbassySyncUnboundedReceiver<T>;
+}
+
+// Blanket `*Pooled` impls. Embassy-sync still heap-allocates per call
+// (one `Arc<Inner<...>>` per pair); the goal of these blanket impls
+// is API parity with `TokioChannels`, not zero-alloc.
+impl<T: Send + 'static> OneshotPooled<EmbassySyncChannels> for T {
+    fn oneshot_pair() -> (
+        <EmbassySyncChannels as ChannelFactory>::OneshotSender<T>,
+        <EmbassySyncChannels as ChannelFactory>::OneshotReceiver<T>,
+    ) {
+        let inner = Arc::new(OneshotInner::new());
+        (
+            EmbassySyncOneshotSender {
+                inner: inner.clone(),
+                sent: false,
+            },
+            EmbassySyncOneshotReceiver { inner },
+        )
+    }
+}
+
+impl<T: Send + 'static, const N: usize> BoundedPooled<EmbassySyncChannels, N> for T {
+    fn bounded_pair() -> (
+        <EmbassySyncChannels as ChannelFactory>::BoundedSender<T, N>,
+        <EmbassySyncChannels as ChannelFactory>::BoundedReceiver<T, N>,
+    ) {
+        let inner: Arc<MpscInner<T, N>> = Arc::new(MpscInner::new());
+        (
+            EmbassySyncBoundedSender {
+                inner: inner.clone(),
+            },
+            EmbassySyncBoundedReceiver { inner },
+        )
+    }
+}
+
+impl<T: Send + 'static> UnboundedPooled<EmbassySyncChannels> for T {
+    fn unbounded_pair() -> (
+        <EmbassySyncChannels as ChannelFactory>::UnboundedSender<T>,
+        <EmbassySyncChannels as ChannelFactory>::UnboundedReceiver<T>,
+    ) {
+        let inner: Arc<MpscInner<T, UNBOUNDED_CAP>> = Arc::new(MpscInner::new());
+        (
+            EmbassySyncUnboundedSender {
+                inner: inner.clone(),
+            },
+            EmbassySyncUnboundedReceiver { inner },
+        )
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use core::pin::pin;
+    use core::task::{Context, Waker};
+
+    fn poll_once<F: Future + Unpin>(fut: &mut F) -> Poll<F::Output> {
+        let waker = Waker::noop();
+        let mut cx = Context::from_waker(waker);
+        core::pin::Pin::new(fut).poll(&mut cx)
+    }
+
+    #[test]
+    fn oneshot_happy_path() {
+        let (tx, rx) = <u32 as OneshotPooled<EmbassySyncChannels>>::oneshot_pair();
+        tx.send(42).unwrap();
+        let mut fut = pin!(rx.recv());
+        match fut.as_mut().poll(&mut Context::from_waker(Waker::noop())) {
+            Poll::Ready(Ok(42)) => {}
+            other => panic!("expected Ready(Ok(42)), got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn oneshot_send_after_receiver_drop_returns_err() {
+        let (tx, rx) = <u32 as OneshotPooled<EmbassySyncChannels>>::oneshot_pair();
+        drop(rx);
+        match tx.send(7) {
+            Err(7) => {}
+            other => panic!("expected Err(7), got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn oneshot_recv_after_sender_drop_returns_cancelled() {
+        let (tx, rx) = <u32 as OneshotPooled<EmbassySyncChannels>>::oneshot_pair();
+        drop(tx);
+        let mut fut = pin!(rx.recv());
+        match fut.as_mut().poll(&mut Context::from_waker(Waker::noop())) {
+            Poll::Ready(Err(OneshotCancelled)) => {}
+            other => panic!("expected Ready(Err(Cancelled)), got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn unbounded_send_after_receiver_drop_returns_err() {
+        let (tx, rx) = <u32 as UnboundedPooled<EmbassySyncChannels>>::unbounded_pair();
+        drop(rx);
+        match tx.send_now(7) {
+            Err(7) => {}
+            other => panic!("expected Err(7), got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn bounded_recv_returns_none_when_all_senders_drop() {
+        let (tx, mut rx) = <u32 as BoundedPooled<EmbassySyncChannels, 4>>::bounded_pair();
+        let tx2 = tx.clone();
+        drop(tx);
+        // One sender alive — recv must be Pending.
+        {
+            let mut fut = pin!(rx.recv());
+            assert!(matches!(poll_once(&mut fut), Poll::Pending));
+        }
+        drop(tx2);
+        // All senders gone — recv resolves to None.
+        let mut fut = pin!(rx.recv());
+        match poll_once(&mut fut) {
+            Poll::Ready(None) => {}
+            other => panic!("expected Ready(None), got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn bounded_send_after_receiver_drop_returns_err_fast_path() {
+        let (tx, rx) = <u32 as BoundedPooled<EmbassySyncChannels, 4>>::bounded_pair();
+        drop(rx);
+        let mut fut = pin!(tx.send(99));
+        match poll_once(&mut fut) {
+            Poll::Ready(Err(())) => {}
+            other => panic!("expected Ready(Err), got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn bounded_send_unblocks_with_err_when_receiver_drops_mid_await() {
+        let (tx, rx) = <u32 as BoundedPooled<EmbassySyncChannels, 1>>::bounded_pair();
+        // Fill the slot.
+        {
+            let mut fut = pin!(tx.send(1));
+            assert!(matches!(poll_once(&mut fut), Poll::Ready(Ok(()))));
+        }
+        // Next send must wait.
+        let mut send_fut = pin!(tx.send(2));
+        assert!(matches!(poll_once(&mut send_fut), Poll::Pending));
+        // Drop receiver — sender must observe close on next poll.
+        drop(rx);
+        match poll_once(&mut send_fut) {
+            Poll::Ready(Err(())) => {}
+            other => panic!("expected Ready(Err) after receiver drop, got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn bounded_send_recv_happy_path() {
+        let (tx, mut rx) = <u32 as BoundedPooled<EmbassySyncChannels, 4>>::bounded_pair();
+        {
+            let mut fut = pin!(tx.send(42));
+            assert!(matches!(poll_once(&mut fut), Poll::Ready(Ok(()))));
+        }
+        let mut recv_fut = pin!(rx.recv());
+        match poll_once(&mut recv_fut) {
+            Poll::Ready(Some(42)) => {}
+            other => panic!("expected Ready(Some(42)), got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn poll_recv_returns_value_and_pending() {
+        let (tx, mut rx) = <u32 as BoundedPooled<EmbassySyncChannels, 4>>::bounded_pair();
+        let waker = Waker::noop();
+        let mut cx = Context::from_waker(waker);
+
+        // Nothing queued yet — must be Pending.
+        assert!(matches!(rx.poll_recv(&mut cx), Poll::Pending));
+
+        // Send a value; next poll_recv must return it.
+        let mut send_fut = pin!(tx.send(7));
+        assert!(matches!(poll_once(&mut send_fut), Poll::Ready(Ok(()))));
+        assert!(matches!(rx.poll_recv(&mut cx), Poll::Ready(Some(7))));
+    }
+
+    #[test]
+    fn bounded_multi_sender_clone_partial_drop_keeps_channel_open() {
+        let (tx1, mut rx) = <u32 as BoundedPooled<EmbassySyncChannels, 4>>::bounded_pair();
+        let tx2 = tx1.clone();
+
+        // Drop the first sender — channel must still be open (tx2 is alive).
+        drop(tx1);
+        {
+            let mut recv_fut = pin!(rx.recv());
+            assert!(
+                matches!(poll_once(&mut recv_fut), Poll::Pending),
+                "channel must remain open while tx2 is alive"
+            );
+        }
+
+        // Send via the surviving sender and receive successfully.
+        {
+            let mut fut = pin!(tx2.send(99));
+            assert!(matches!(poll_once(&mut fut), Poll::Ready(Ok(()))));
+        }
+        let mut recv_fut2 = pin!(rx.recv());
+        assert!(matches!(poll_once(&mut recv_fut2), Poll::Ready(Some(99))));
+    }
+
+    #[test]
+    fn bounded_recv_drains_queued_items_before_returning_none_on_sender_close() {
+        // Items already in the queue when the last sender drops must be
+        // drained before recv() resolves to None — exercising the
+        // closed-but-items-remain branch in mpsc_poll_recv.
+        let (tx, mut rx) = <u32 as BoundedPooled<EmbassySyncChannels, 4>>::bounded_pair();
+        {
+            let mut f1 = pin!(tx.send(1));
+            let mut f2 = pin!(tx.send(2));
+            assert!(matches!(poll_once(&mut f1), Poll::Ready(Ok(()))));
+            assert!(matches!(poll_once(&mut f2), Poll::Ready(Ok(()))));
+        }
+        drop(tx);
+
+        // First item.
+        {
+            let mut r = pin!(rx.recv());
+            assert!(matches!(poll_once(&mut r), Poll::Ready(Some(1))));
+        }
+        // Second item.
+        {
+            let mut r = pin!(rx.recv());
+            assert!(matches!(poll_once(&mut r), Poll::Ready(Some(2))));
+        }
+        // Queue empty and channel closed — must resolve to None.
+        let mut r = pin!(rx.recv());
+        assert!(matches!(poll_once(&mut r), Poll::Ready(None)));
+    }
+
+    #[test]
+    fn unbounded_send_recv_happy_path() {
+        let (tx, mut rx) = <u32 as UnboundedPooled<EmbassySyncChannels>>::unbounded_pair();
+        assert!(tx.send_now(123).is_ok());
+        let mut recv_fut = pin!(rx.recv());
+        match poll_once(&mut recv_fut) {
+            Poll::Ready(Some(123)) => {}
+            other => panic!("expected Ready(Some(123)), got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn unbounded_recv_returns_none_when_last_sender_drops() {
+        let (tx1, mut rx) = <u32 as UnboundedPooled<EmbassySyncChannels>>::unbounded_pair();
+        let tx2 = tx1.clone();
+
+        // Drop one sender — channel must stay open.
+        drop(tx1);
+        {
+            let mut fut = pin!(rx.recv());
+            assert!(matches!(poll_once(&mut fut), Poll::Pending));
+        }
+
+        // Drop last sender — recv must resolve to None.
+        drop(tx2);
+        let mut fut = pin!(rx.recv());
+        assert!(matches!(poll_once(&mut fut), Poll::Ready(None)));
+    }
+}
diff --git a/src/lib.rs b/src/lib.rs
index 78877b3..39991af 100644
--- a/src/lib.rs
+++ b/src/lib.rs
@@ -19,19 +19,32 @@
 //! | [`protocol`] | Yes | Wire format: headers, messages, message types, return codes, and service discovery (SD) entries/options |
 //! | [`e2e`] | Yes | End-to-End protection — Profile 4 (CRC-32) and Profile 5 (CRC-16) |
 //! | [`WireFormat`] / [`PayloadWireFormat`] | Yes | Traits for serializing messages and defining custom payload types |
-//! | [`client`] | No | Async tokio client — service discovery, subscriptions, and request/response (feature `client`) |
-//! | [`server`] | No | Async tokio server — service offering, event publishing, and subscription management (feature `server`) |
+//! | `client` | No | Async client trait surface — service discovery, subscriptions, request/response (feature `client`; add `client-tokio` for `Client::new`) |
+//! | `server` | No | Async server trait surface — service offering, event publishing, subscription management (feature `server`; add `server-tokio` for `Server::new`) |
 //!
 //! ## Feature Flags
 //!
 //! | Feature | Default | Description |
 //! |---------|---------|-------------|
-//! | `client` | no | Async tokio client; implies `std` + tokio + socket2 |
-//! | `server` | no | Async tokio server; implies `std` + tokio + socket2 |
-//! | `std` | no | Enables std-dependent helpers |
-//!
-//! By default only the `protocol`, trait, and `e2e` modules are compiled, and the crate
-//! builds in `no_std` mode with no allocator requirement.
+//! | `std` | yes | Enables std-dependent helpers (`RawPayload`, `VecSdHeader`, `OfferedEndpoint`) |
+//! | `client` | no | Trait-surface client; implies `std` + futures (no tokio) |
+//! | `client-tokio` | no | Adds the `Client::new` / `TokioSpawner` / `TokioTransport` convenience defaults; implies `client` + tokio + socket2 |
+//! | `server` | no | Trait-surface server; implies `std` + futures (no tokio) |
+//! | `server-tokio` | no | Adds the `Server::new` / `TokioTransport` / `TokioTimer` convenience defaults; implies `server` + tokio + socket2 |
+//! | `bare_metal` | no | Activates embassy-sync, the `static_channels` module (no-alloc `ChannelFactory`), and `AtomicInterfaceHandle`. `StaticE2EHandle` additionally requires `std` because the underlying `E2ERegistry` is currently `std`-only. See `examples/bare_metal_client/` and `examples/bare_metal_server/` for runnable bare-metal integration examples. |
+//! | `embassy_channels` | no | Heap-backed `EmbassySyncChannels` `ChannelFactory`. Implies `bare_metal` and pulls `extern crate alloc;` into the crate; **on `no_std`, downstream consumers must provide a `#[global_allocator]`**. Useful for tests / early prototypes before sizing static pools. |
+//!
+//! The default feature set is `["std"]`, which links `std` and enables
+//! the `RawPayload` / `VecSdHeader` helpers. For a minimal build with
+//! no allocator requirement — the `protocol`, trait, `transport`, and
+//! `e2e` modules only — pass `--no-default-features`. The
+//! trait-surface canary workspace members (`examples/bare_metal_client`,
+//! `examples/bare_metal_server`) depend on the crate with
+//! `default-features = false, features = ["bare_metal", "client"]` /
+//! `["bare_metal", "server"]` and validate that configuration when built
+//! in isolation (`cargo build -p bare_metal_client` /
+//! `cargo build -p bare_metal_server`), rather than as part of a workspace-wide
+//! build where features may be unified across members.
 //!
 //! ## Examples
 //!
@@ -57,17 +70,21 @@
 //! assert_eq!(view.entry_count(), 1);
 //! ```
 //!
-//! ### Async client (requires `feature = "client"`)
+//! ### Async client (requires `feature = "client-tokio"`)
 //!
 //! ```rust,no_run
-//! # #[cfg(feature = "client")]
+//! # #[cfg(feature = "client-tokio")]
 //! # fn wrapper() {
 //! use simple_someip::{Client, ClientUpdate, RawPayload};
 //!
 //! #[tokio::main]
 //! async fn main() {
-//!     // Client::new returns a Clone-able handle and an update stream.
-//!     let (client, mut updates) = Client::<RawPayload>::new([192, 168, 1, 100].into());
+//!     // Client::new returns a Clone-able handle, an update stream, and
+//!     // the run-loop future. Spawn the future on the tokio runtime;
+//!     // the returned future depends on `tokio::select!` / `tokio::time`
+//!     // / tokio sockets, so it is not executor-agnostic today.
+//!     let (client, mut updates, run) = Client::<RawPayload, _, _, _>::new([192, 168, 1, 100].into());
+//!     let _run_task = tokio::spawn(run);
 //!     client.bind_discovery().await.unwrap();
 //!
 //!     while let Some(update) = updates.recv().await {
@@ -92,6 +109,40 @@
 #[cfg(feature = "std")]
 extern crate std;
 
+// `embassy_channels` needs `alloc` for `EmbassySyncChannels`'s
+// `Arc<Channel<...>>` storage (the heap-backed bare-metal channel
+// primitive). The `static_channels` module does NOT need alloc — users
+// who only enable `bare_metal` (without `embassy_channels`) get no-alloc.
+#[cfg(feature = "embassy_channels")]
+extern crate alloc;
+
+/// Maximum size, in bytes, of UDP payloads for `client` / `server` send
+/// paths that serialize into a fixed-size buffer of this size.
+///
+/// Paths currently capped by this constant:
+/// - `client::SocketManager::send` (unicast + SD outbound)
+/// - `server::EventPublisher::publish_event`
+/// - `server::EventPublisher::publish_raw_event`
+///
+/// When one of these paths is actually reached and serialization is
+/// attempted, messages larger than this cap fail with
+/// `client::Error::Capacity("udp_buffer")` or
+/// `server::Error::Capacity("udp_buffer")`, depending on the path.
+/// Paths that return early before
+/// attempting serialization (e.g. `publish_event` when there are no
+/// subscribers) are not affected. Other outbound SD paths (announcement
+/// builders, `SubscribeAck` / `SubscribeNack`) currently still use
+/// heap `Vec` buffers and are not capped by this constant — that is a
+/// known gap, planned alongside the bare-metal `no_alloc` refactor.
+///
+/// Note that this is an application-level UDP payload limit, not an
+/// Ethernet-MTU-safe size: a 1500-byte UDP payload exceeds a 1500-byte
+/// L2 MTU once IP/UDP headers are added (IPv4 leaves 1472 bytes of UDP
+/// payload, IPv6 leaves 1452), so sends at this size may fragment or
+/// fail depending on the network stack. Bare-metal ports targeting a
+/// smaller link MTU may want to lower this by forking.
+pub const UDP_BUFFER_SIZE: usize = 1500;
+
 /// SOME/IP client for discovering services and exchanging messages.
 #[cfg(feature = "client")]
 pub mod client;
@@ -103,9 +154,44 @@ pub mod protocol;
 #[cfg(feature = "std")]
 mod raw_payload;
 /// SOME/IP server for offering services and handling incoming requests.
+///
+/// The engine is generic over [`transport::TransportFactory`] +
+/// [`transport::Timer`] + [`transport::E2ERegistryHandle`] +
+/// [`server::SubscriptionHandle`], so the bare `server` feature exposes the
+/// trait-surface server. The `server-tokio` feature additionally provides
+/// the tokio convenience constructors (`server::Server::new`,
+/// `server::Server::new_with_loopback`, `server::Server::new_passive`)
+/// that default the type parameters to
+/// `Arc<Mutex<E2ERegistry>>` / `Arc<RwLock<SubscriptionManager>>` /
+/// `TokioTransport` / `TokioTimer`.
 #[cfg(feature = "server")]
 pub mod server;
+/// Tokio + `socket2` implementation of the [`transport`] traits. Provided
+/// as the default `std` backend — available whenever `client-tokio` or
+/// `server-tokio` is enabled.
+#[cfg(any(feature = "client-tokio", feature = "server-tokio"))]
+pub mod tokio_transport;
+
+/// `embassy-sync`-backed implementation of [`transport::ChannelFactory`].
+/// Available whenever the `embassy_channels` feature is enabled. Uses
+/// heap allocation (`Arc<Channel<...>>`) — for no-alloc, use
+/// [`static_channels`] instead.
+#[cfg(feature = "embassy_channels")]
+pub mod embassy_channels;
+/// Static-pool no-alloc primitives for [`transport::ChannelFactory`].
+/// Backs the consumer-declared static `OneshotPool` / `MpscPool`
+/// instances that the [`define_static_channels!`] macro
+/// generates per-`T` `*Pooled<MyChannels>` impls against.
+#[cfg(feature = "bare_metal")]
+pub mod static_channels;
 mod traits;
+/// Executor-agnostic UDP transport abstraction used by the client and
+/// server modules. `no_std`-compatible; a default `std + tokio` backend
+/// ships in `tokio_transport` (available under the `client-tokio` /
+/// `server-tokio` features) — the link is rendered as a code literal
+/// because the target module is feature-gated and would break
+/// default-feature rustdoc builds.
+pub mod transport;
 #[cfg(feature = "std")]
 pub use raw_payload::{RawPayload, VecSdHeader};
 #[cfg(feature = "std")]
@@ -113,7 +199,20 @@ pub use traits::OfferedEndpoint;
 pub use traits::{PayloadWireFormat, WireFormat};
 
 #[cfg(feature = "client")]
-pub use client::{Client, ClientUpdate, ClientUpdates, DiscoveryMessage, PendingResponse};
+pub use client::{
+    Client, ClientDeps, ClientUpdate, ClientUpdates, DiscoveryMessage, PendingResponse,
+};
 pub use e2e::{E2ECheckStatus, E2EKey, E2EProfile};
 #[cfg(feature = "server")]
-pub use server::Server;
+pub use server::{Server, ServerDeps, SubscriptionHandle};
+#[cfg(any(feature = "client-tokio", feature = "server-tokio"))]
+pub use tokio_transport::{TokioChannels, TokioSocket, TokioSpawner, TokioTimer, TokioTransport};
+#[cfg(feature = "bare_metal")]
+pub use transport::AtomicInterfaceHandle;
+pub use transport::{
+    ChannelFactory, E2ERegistryHandle, InterfaceHandle, IoErrorKind, LocalSpawner, MpscRecv,
+    MpscSend, OneshotCancelled, OneshotRecv, OneshotSend, ReceivedDatagram, SocketOptions, Spawner,
+    Timer, TransportError, TransportFactory, TransportSocket, UnboundedRecv, UnboundedSend,
+};
+#[cfg(all(feature = "bare_metal", feature = "std"))]
+pub use transport::{StaticE2EHandle, StaticE2EStorage};
diff --git a/src/protocol/byte_order.rs b/src/protocol/byte_order.rs
index 6d1061f..9c41106 100644
--- a/src/protocol/byte_order.rs
+++ b/src/protocol/byte_order.rs
@@ -273,6 +273,10 @@ impl<T: embedded_io::Write> WriteBytesExt for T {
 }
 
 #[cfg(test)]
+// Strict float equality is correct here: these tests verify byte-level
+// round-tripping of `to_be_bytes` / `read_f*_be`, where the result must
+// be bitwise-identical to the input.
+#[allow(clippy::float_cmp)]
 mod tests {
     use super::*;
 
diff --git a/src/protocol/header.rs b/src/protocol/header.rs
index 1a3ca2c..921ee22 100644
--- a/src/protocol/header.rs
+++ b/src/protocol/header.rs
@@ -321,6 +321,23 @@ impl<'a> HeaderView<'a> {
     }
 }
 
+impl WireFormat for Header {
+    fn required_size(&self) -> usize {
+        16
+    }
+
+    fn encode<T: embedded_io::Write>(&self, writer: &mut T) -> Result<usize, Error> {
+        writer.write_u32_be(self.message_id.message_id())?;
+        writer.write_u32_be(self.length)?;
+        writer.write_u32_be(self.request_id)?;
+        writer.write_u8(self.protocol_version)?;
+        writer.write_u8(self.interface_version)?;
+        writer.write_u8(u8::from(self.message_type))?;
+        writer.write_u8(u8::from(self.return_code))?;
+        Ok(16)
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -591,20 +608,3 @@ mod tests {
         assert_eq!(view.to_owned(), h);
     }
 }
-
-impl WireFormat for Header {
-    fn required_size(&self) -> usize {
-        16
-    }
-
-    fn encode<T: embedded_io::Write>(&self, writer: &mut T) -> Result<usize, Error> {
-        writer.write_u32_be(self.message_id.message_id())?;
-        writer.write_u32_be(self.length)?;
-        writer.write_u32_be(self.request_id)?;
-        writer.write_u8(self.protocol_version)?;
-        writer.write_u8(self.interface_version)?;
-        writer.write_u8(u8::from(self.message_type))?;
-        writer.write_u8(u8::from(self.return_code))?;
-        Ok(16)
-    }
-}
diff --git a/src/protocol/message_id.rs b/src/protocol/message_id.rs
index d2815cb..533550b 100644
--- a/src/protocol/message_id.rs
+++ b/src/protocol/message_id.rs
@@ -83,6 +83,17 @@ impl MessageId {
     }
 }
 
+impl core::fmt::Debug for MessageId {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        write!(
+            f,
+            "Message Id: {{ service_id: {:#02X}, method_id: {:#02X} }}",
+            self.service_id(),
+            self.method_id(),
+        )
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -180,14 +191,3 @@ mod tests {
         assert!(buf.contains("method_id"));
     }
 }
-
-impl core::fmt::Debug for MessageId {
-    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
-        write!(
-            f,
-            "Message Id: {{ service_id: {:#02X}, method_id: {:#02X} }}",
-            self.service_id(),
-            self.method_id(),
-        )
-    }
-}
diff --git a/src/protocol/sd/header.rs b/src/protocol/sd/header.rs
index b513152..2321a31 100644
--- a/src/protocol/sd/header.rs
+++ b/src/protocol/sd/header.rs
@@ -234,7 +234,7 @@ mod tests {
             service_id: 0x1234,
             instance_id: 0x0001,
             major_version: 1,
-            ttl: 0xFFFFFF,
+            ttl: 0xFF_FFFF,
             index_first_options_run: 0,
             index_second_options_run: 0,
             options_count: OptionsCount::new(1, 0),
@@ -264,7 +264,7 @@ mod tests {
     #[test]
     fn subscribe_ack_round_trips() {
         let entry = Entry::SubscribeAckEventGroup(EventGroupEntry::new(
-            0xAAAA, 0x0001, 1, 0xFFFFFF, 0x0010,
+            0xAAAA, 0x0001, 1, 0xFF_FFFF, 0x0010,
         ));
         let entries = [entry];
         let h = Header::new(Flags::new_sd(RebootFlag::RecentlyRebooted), &entries, &[]);
@@ -281,7 +281,7 @@ mod tests {
             service_id: 0x1234,
             instance_id: 0x0001,
             major_version: 1,
-            ttl: 0xFFFFFF,
+            ttl: 0xFF_FFFF,
             index_first_options_run: 0,
             index_second_options_run: 0,
             options_count: OptionsCount::new(1, 0),
diff --git a/src/protocol/sd/options.rs b/src/protocol/sd/options.rs
index 8286649..96fd9a6 100644
--- a/src/protocol/sd/options.rs
+++ b/src/protocol/sd/options.rs
@@ -241,7 +241,7 @@ impl Options {
     ///
     /// # Panics
     ///
-    /// Panics if the option size minus [`OPTION_LENGTH_SIZE_DELTA`] exceeds `u16::MAX`
+    /// Panics if the option size minus `OPTION_LENGTH_SIZE_DELTA` exceeds `u16::MAX`
     /// (unreachable in practice).
     pub fn write<T: embedded_io::Write>(
         &self,
@@ -353,7 +353,7 @@ impl<'a> OptionView<'a> {
         OptionType::try_from(self.0[OPTION_TYPE_OFFSET])
     }
 
-    /// Total wire size of this option (length field value + [`OPTION_LENGTH_SIZE_DELTA`]).
+    /// Total wire size of this option (length field value + `OPTION_LENGTH_SIZE_DELTA`).
     #[must_use]
     pub fn wire_size(&self) -> usize {
         let length = u16::from_be_bytes([self.0[0], self.0[1]]);
diff --git a/src/server/README.md b/src/server/README.md
index cb78f05..effa13b 100644
--- a/src/server/README.md
+++ b/src/server/README.md
@@ -55,8 +55,9 @@ async fn main() -> Result<(), Box<dyn std::error::Error>> {
     // Create the server
     let mut server = Server::new(config).await?;
 
-    // Start announcing the service (sends OfferService every 1s)
-    server.start_announcing()?;
+    // Start announcing the service (sends OfferService every 1s).
+    // Spawn the announcement loop future on the Tokio runtime.
+    tokio::spawn(server.announcement_loop()?);
 
     // Get event publisher for sending events
     let publisher = server.publisher();
@@ -90,7 +91,7 @@ The server periodically sends **OfferService** messages to the multicast group `
 
 ```
 SD Message Structure:
-├─ Flags: Reboot=true, Unicast=false
+├─ Flags: Reboot=Recently/Continuous (per session-counter wrap), Unicast=true
 ├─ Entry: OfferService
 │  ├─ Service ID
 │  ├─ Instance ID
@@ -152,10 +153,10 @@ Configuration for a SOME/IP service provider:
 
 Main server struct:
 
-- `new(config: ServerConfig) -> Result<Self>` - Create new server
-- `start_announcing() -> Result<()>` - Start SD announcements
+- `new(config: ServerConfig) -> Result<Self, Error>` - Create new server
+- `announcement_loop() -> Result<impl Future<Output = ()> + Send + 'static, Error>` - Build the SD announcement future; caller spawns on the Tokio runtime
 - `publisher() -> Arc<EventPublisher>` - Get event publisher
-- `run() -> Result<()>` - Run event loop (handles subscriptions)
+- `run() -> Result<(), Error>` - Run event loop (handles subscriptions)
 - `register_e2e(key, profile)` - Register E2E protection for a message key
 - `unregister_e2e(key)` - Remove E2E protection for a message key
 
@@ -170,6 +171,11 @@ Publishes events to subscribers:
 - `publish_raw_event(service_id, instance_id, event_group_id, event_id, session_id, protocol_version, interface_version, payload) -> Result<usize>`
   - Low-level event publishing using raw bytes
   - Returns number of subscribers that received the event
+- `register_subscriber(service_id, instance_id, event_group_id, subscriber_addr) -> Result<(), SubscribeError>`
+  - Manually register a subscriber (advanced use; the built-in SD loop calls this for you)
+  - Capacity-rejects with `SubscribeError::*` so external dispatchers can emit a `SubscribeNack`
+- `remove_subscriber(service_id, instance_id, event_group_id, subscriber_addr)`
+  - Manually remove a subscriber
 - `has_subscribers(service_id, instance_id, event_group_id) -> bool`
   - Check if any subscribers exist for an event group
 - `subscriber_count(service_id, instance_id, event_group_id) -> usize`
@@ -179,10 +185,12 @@ Publishes events to subscribers:
 
 Manages event group subscriptions:
 
-- `subscribe(service_id, instance_id, event_group_id, subscriber_addr)` - Add subscriber (deduplicates automatically)
+- `subscribe(service_id, instance_id, event_group_id, subscriber_addr) -> Result<(), SubscribeError>` - Add subscriber (deduplicates automatically); returns `Err` when a fixed-capacity bound (`SUBSCRIBERS_PER_GROUP` or `EVENT_GROUPS_CAP`) is exhausted
 - `unsubscribe(service_id, instance_id, event_group_id, subscriber_addr)` - Remove subscriber
 - `get_subscribers(service_id, instance_id, event_group_id) -> Vec<Subscriber>` - Get all subscribers
 
+External dispatchers (those calling `EventPublisher::register_subscriber` directly) must NACK on `Err(SubscribeError::*)`; the server's built-in SD loop already does this automatically.
+
 ## Troubleshooting
 
 ### No subscribers
diff --git a/src/server/error.rs b/src/server/error.rs
index 9d80d9a..7b6a187 100644
--- a/src/server/error.rs
+++ b/src/server/error.rs
@@ -1,6 +1,10 @@
 use thiserror::Error;
 
 /// Errors that can occur during SOME/IP server operations.
+///
+/// Not marked `#[non_exhaustive]`: downstream crates that match on this
+/// enum rely on exhaustiveness. Variant additions are breaking changes
+/// and require a `SemVer` bump.
 #[derive(Error, Debug)]
 pub enum Error {
     /// A SOME/IP protocol-level error.
@@ -9,9 +13,20 @@ pub enum Error {
     /// An I/O error from the underlying network transport.
     #[error(transparent)]
     Io(#[from] std::io::Error),
+    /// A transport-layer error from a [`crate::transport::TransportFactory`]
+    /// or [`crate::transport::TransportSocket`] operation.
+    #[error("transport error: {0}")]
+    Transport(#[from] crate::transport::TransportError),
     /// An E2E protection or checking error occurred.
     #[error(transparent)]
     E2e(#[from] crate::e2e::Error),
+    /// A fixed-capacity internal structure is full (e.g. a stack send
+    /// buffer smaller than the outgoing message). The argument is a
+    /// lowercase `snake_case` tag naming the resource; grep the crate for
+    /// the tag to find the compile-time constant that governs it. Current
+    /// tags: `"udp_buffer"` (→ `crate::UDP_BUFFER_SIZE`).
+    #[error("internal capacity exceeded: {0}")]
+    Capacity(&'static str),
 }
 
 impl From<crate::protocol::sd::Error> for Error {
diff --git a/src/server/event_publisher.rs b/src/server/event_publisher.rs
index c32470f..3bb850e 100644
--- a/src/server/event_publisher.rs
+++ b/src/server/event_publisher.rs
@@ -1,30 +1,49 @@
 //! Event publishing functionality
 
 use super::Error;
-use super::subscription_manager::SubscriptionManager;
-use crate::e2e::{E2EKey, E2ERegistry, PROFILE4_HEADER_SIZE};
+use super::subscription_manager::{SUBSCRIBERS_PER_GROUP, SubscriptionHandle};
+use crate::UDP_BUFFER_SIZE;
+use crate::e2e::E2EKey;
 use crate::protocol::{Header, Message};
 use crate::traits::{PayloadWireFormat, WireFormat};
-use std::sync::{Arc, Mutex};
-use std::vec;
-use std::vec::Vec;
-use tokio::net::UdpSocket;
-use tokio::sync::RwLock;
-
-/// Publishes events to subscribers
-pub struct EventPublisher {
-    subscriptions: Arc<RwLock<SubscriptionManager>>,
-    socket: Arc<UdpSocket>,
-    e2e_registry: Arc<Mutex<E2ERegistry>>,
+use crate::transport::{E2ERegistryHandle, TransportSocket};
+use core::net::SocketAddrV4;
+use heapless::Vec as HeaplessVec;
+use std::sync::Arc;
+
+/// The publish snapshot buffer is sized to `SUBSCRIBERS_PER_GROUP` so
+/// `for_each_subscriber` can never overflow it. If a future refactor
+/// changes the manager's per-group cap independently, this assert
+/// catches the divergence at compile time.
+const _: () = assert!(
+    SUBSCRIBERS_PER_GROUP >= 1,
+    "SUBSCRIBERS_PER_GROUP must be >= 1 for the publish snapshot to fit any subscribers"
+);
+
+/// Publishes events to subscribers.
+///
+/// Generic over `T: TransportSocket` (the socket primitive — `TokioSocket`
+/// in the std/tokio path, a bare-metal embassy / smoltcp wrapper on
+/// firmware), `R: E2ERegistryHandle`, and `S: SubscriptionHandle`.
+pub struct EventPublisher<R, S, T>
+where
+    R: E2ERegistryHandle,
+    S: SubscriptionHandle,
+    T: TransportSocket + Send + Sync + 'static,
+{
+    subscriptions: S,
+    socket: Arc<T>,
+    e2e_registry: R,
 }
 
-impl EventPublisher {
+impl<R, S, T> EventPublisher<R, S, T>
+where
+    R: E2ERegistryHandle,
+    S: SubscriptionHandle,
+    T: TransportSocket + Send + Sync + 'static,
+{
     /// Create a new event publisher
-    pub fn new(
-        subscriptions: Arc<RwLock<SubscriptionManager>>,
-        socket: Arc<UdpSocket>,
-        e2e_registry: Arc<Mutex<E2ERegistry>>,
-    ) -> Self {
+    pub fn new(subscriptions: S, socket: Arc<T>, e2e_registry: R) -> Self {
         Self {
             subscriptions,
             socket,
@@ -46,7 +65,9 @@ impl EventPublisher {
     ///
     /// # Panics
     ///
-    /// Panics if the E2E registry mutex is poisoned.
+    /// May panic if the underlying [`E2ERegistryHandle`](crate::transport::E2ERegistryHandle)
+    /// implementation panics (e.g., `Arc<Mutex<E2ERegistry>>` on mutex poison).
+    #[allow(clippy::too_many_lines)]
     pub async fn publish_event<P: PayloadWireFormat>(
         &self,
         service_id: u16,
@@ -54,11 +75,23 @@ impl EventPublisher {
         event_group_id: u16,
         message: &Message<P>,
     ) -> Result<usize, Error> {
-        // Get subscribers
-        let subscribers = {
-            let mgr = self.subscriptions.read().await;
-            mgr.get_subscribers(service_id, instance_id, event_group_id)
-        };
+        // Snapshot subscriber addresses into a stack-allocated buffer so
+        // we can release the subscription read lock before doing async
+        // sends. This avoids a per-event heap allocation that the old
+        // `get_subscribers -> Vec<Subscriber>` API forced.
+        //
+        // The buffer cap matches the manager's per-group cap so push()
+        // is provably infallible — see the `const _` guard below.
+        let mut subscribers: HeaplessVec<SocketAddrV4, SUBSCRIBERS_PER_GROUP> = HeaplessVec::new();
+        let _total = self
+            .subscriptions
+            .for_each_subscriber(service_id, instance_id, event_group_id, |sub| {
+                // push() can never fail here: SUBSCRIBERS_PER_GROUP is
+                // both the manager's per-group cap and this buffer's
+                // cap, so the manager will never feed us more than fits.
+                let _ = subscribers.push(sub.address);
+            })
+            .await;
 
         if subscribers.is_empty() {
             tracing::trace!(
@@ -70,56 +103,97 @@ impl EventPublisher {
             return Ok(0);
         }
 
-        // Serialize the message once
-        let mut buffer = Vec::new();
-        message.encode(&mut buffer)?;
+        // Fail fast with the capacity error rather than letting
+        // `encode_to_slice` report a less-actionable protocol I/O error
+        // when it runs out of buffer. Matches the raw-event path below
+        // and the client socket_manager path.
+        let required_size = message.required_size();
+        if required_size > UDP_BUFFER_SIZE {
+            tracing::error!(
+                "Message size ({} bytes) exceeds UDP_BUFFER_SIZE ({}); dropping publish",
+                required_size,
+                UDP_BUFFER_SIZE
+            );
+            return Err(Error::Capacity("udp_buffer"));
+        }
 
-        // Apply E2E protect if configured
+        // Serialize the message into a fixed-size buffer of
+        // `UDP_BUFFER_SIZE` bytes. (In this `async fn` the buffer lives
+        // in the future state, not literally on the stack; "MTU-sized"
+        // is a misleading description since the cap is a UDP payload
+        // limit, not an Ethernet MTU — see `UDP_BUFFER_SIZE` docs.)
+        let mut buffer = [0u8; UDP_BUFFER_SIZE];
+        let mut message_length = message.encode_to_slice(&mut buffer)?;
+
+        // Apply E2E protect if configured. The `protected` stack buffer is
+        // disjoint from `buffer`, so we can read the unprotected payload
+        // directly out of `buffer[16..]` without a separate copy.
         {
             let key = E2EKey::from_message_id(message.header().message_id());
-            let mut registry = self
-                .e2e_registry
-                .lock()
-                .expect("e2e registry lock poisoned");
-            if registry.contains_key(&key) {
-                let message_length = buffer.len();
-                let original_payload = buffer[16..message_length].to_vec();
+            if self.e2e_registry.contains_key(&key) {
                 let upper_header: [u8; 8] = buffer[8..16].try_into().expect("upper header slice");
-                let mut protected = vec![0u8; original_payload.len() + PROFILE4_HEADER_SIZE];
-                match registry.protect(key, &original_payload, upper_header, &mut protected) {
+                let mut protected = [0u8; UDP_BUFFER_SIZE];
+                let result = self.e2e_registry.protect(
+                    key,
+                    &buffer[16..message_length],
+                    upper_header,
+                    &mut protected,
+                );
+                match result {
                     Some(Ok(protected_len)) => {
+                        if 16 + protected_len > UDP_BUFFER_SIZE {
+                            tracing::error!(
+                                "E2E-protected datagram ({} bytes, header + protected payload) \
+                                 exceeds UDP_BUFFER_SIZE ({}); dropping publish",
+                                16 + protected_len,
+                                UDP_BUFFER_SIZE
+                            );
+                            return Err(Error::Capacity("udp_buffer"));
+                        }
                         #[allow(clippy::cast_possible_truncation)]
                         let new_length: u32 = 8 + protected_len as u32;
                         buffer[4..8].copy_from_slice(&new_length.to_be_bytes());
-                        buffer.resize(16 + protected_len, 0);
                         buffer[16..16 + protected_len].copy_from_slice(&protected[..protected_len]);
+                        message_length = 16 + protected_len;
                     }
                     Some(Err(e)) => {
-                        tracing::error!("E2E protect error: {:?}", e);
+                        // Surface protect failures as `Err(Error::E2e(_))`
+                        // rather than logging-and-falling-through, which
+                        // would silently send the UNPROTECTED payload
+                        // claiming an E2E-protected channel and break the
+                        // receiver's CRC/counter checks. Counter
+                        // exhaustion, key-lookup races, and similar
+                        // backend errors all funnel here.
+                        tracing::error!("E2E protect error: {:?}; dropping publish", e);
+                        return Err(Error::E2e(e));
                     }
                     None => unreachable!("contains_key was true"),
                 }
             }
         }
 
-        // Send to all subscribers
-        let mut sent_count = 0;
-        for subscriber in &subscribers {
-            match self.socket.send_to(&buffer, subscriber.address).await {
-                Ok(_) => {
+        let datagram = &buffer[..message_length];
+
+        // Send to all snapshotted subscribers. Track the last
+        // transport error so we can surface "every send failed" as
+        // `Err(Transport(_))` rather than masking total failure as
+        // `Ok(0)` — which would be indistinguishable from "no
+        // subscribers" to the caller.
+        let mut sent_count = 0usize;
+        let mut last_err: Option<crate::transport::TransportError> = None;
+        for addr in &subscribers {
+            match self.socket.send_to(datagram, *addr).await {
+                Ok(()) => {
                     sent_count += 1;
                     tracing::trace!(
                         "Sent event to subscriber {} ({} bytes)",
-                        subscriber.address,
-                        buffer.len()
+                        addr,
+                        message_length
                     );
                 }
                 Err(e) => {
-                    tracing::error!(
-                        "Failed to send event to subscriber {}: {:?}",
-                        subscriber.address,
-                        e
-                    );
+                    tracing::error!("Failed to send event to subscriber {}: {:?}", addr, e);
+                    last_err = Some(e);
                 }
             }
         }
@@ -131,6 +205,14 @@ impl EventPublisher {
             service_id
         );
 
+        if sent_count == 0 {
+            // Every send failed (subscribers was non-empty above, so
+            // last_err is necessarily Some). Surface the most recent
+            // transport error so the caller can react.
+            return Err(Error::Transport(
+                last_err.unwrap_or(crate::transport::TransportError::Unsupported),
+            ));
+        }
         Ok(sent_count)
     }
 
@@ -153,16 +235,36 @@ impl EventPublisher {
         interface_version: u8,
         payload: &[u8],
     ) -> Result<usize, Error> {
-        // Get subscribers
-        let subscribers = {
-            let mgr = self.subscriptions.read().await;
-            mgr.get_subscribers(service_id, instance_id, event_group_id)
-        };
+        // Snapshot subscriber addresses into a stack buffer (see
+        // publish_event for rationale).
+        let mut subscribers: HeaplessVec<SocketAddrV4, SUBSCRIBERS_PER_GROUP> = HeaplessVec::new();
+        let _total = self
+            .subscriptions
+            .for_each_subscriber(service_id, instance_id, event_group_id, |sub| {
+                let _ = subscribers.push(sub.address);
+            })
+            .await;
 
         if subscribers.is_empty() {
             return Ok(0);
         }
 
+        // Pre-build size check. Fail fast with `Error::Capacity` BEFORE
+        // calling `Header::new_event`, which `assert!`s on payloads
+        // larger than `u32::MAX as usize - 8`. The earlier
+        // `checked_add(header_len, payload.len())` guard below was dead
+        // for that reason; keeping it for defence-in-depth on platforms
+        // where `Header::SIZE + payload` could overflow `usize`. The
+        // `16` here is the SOME/IP header size in bytes.
+        if payload.len() > UDP_BUFFER_SIZE.saturating_sub(16) {
+            tracing::error!(
+                "raw event payload ({} bytes) + 16-byte header exceeds UDP_BUFFER_SIZE ({}); dropping publish",
+                payload.len(),
+                UDP_BUFFER_SIZE
+            );
+            return Err(Error::Capacity("udp_buffer"));
+        }
+
         // Build SOME/IP header
         let header = Header::new_event(
             service_id,
@@ -173,28 +275,55 @@ impl EventPublisher {
             payload.len(),
         );
 
-        // Serialize header + payload
-        let mut buffer = Vec::new();
-        header.encode(&mut buffer)?;
-        buffer.extend_from_slice(payload);
-
-        // Send to all subscribers
-        let mut sent_count = 0;
-        for subscriber in &subscribers {
-            match self.socket.send_to(&buffer, subscriber.address).await {
-                Ok(_) => {
+        // Serialize header + payload into a fixed-size buffer of
+        // `UDP_BUFFER_SIZE` bytes. See note in `publish_event` above.
+        let mut buffer = [0u8; UDP_BUFFER_SIZE];
+        let header_len = header.encode_to_slice(&mut buffer)?;
+        let Some(total_len) = header_len.checked_add(payload.len()) else {
+            tracing::error!(
+                "raw event length computation overflowed usize (header_len={}, payload.len()={}); dropping publish",
+                header_len,
+                payload.len()
+            );
+            return Err(Error::Capacity("udp_buffer"));
+        };
+        // Defence-in-depth: the pre-build guard above already rejects
+        // oversize payloads, but a future caller adding optional
+        // post-encode tail bytes (e.g. another protect profile) would
+        // need this branch. Cheap to keep.
+        if total_len > UDP_BUFFER_SIZE {
+            tracing::error!(
+                "raw event ({} bytes) exceeds UDP_BUFFER_SIZE ({}); dropping publish",
+                total_len,
+                UDP_BUFFER_SIZE
+            );
+            return Err(Error::Capacity("udp_buffer"));
+        }
+        buffer[header_len..total_len].copy_from_slice(payload);
+        let datagram = &buffer[..total_len];
+
+        // Send to all snapshotted subscribers; surface total-failure
+        // as `Err(Transport(_))` rather than `Ok(0)` (see
+        // `publish_event`).
+        let mut sent_count = 0usize;
+        let mut last_err: Option<crate::transport::TransportError> = None;
+        for addr in &subscribers {
+            match self.socket.send_to(datagram, *addr).await {
+                Ok(()) => {
                     sent_count += 1;
                 }
                 Err(e) => {
-                    tracing::error!(
-                        "Failed to send raw event to {}: {:?}",
-                        subscriber.address,
-                        e
-                    );
+                    tracing::error!("Failed to send raw event to {}: {:?}", addr, e);
+                    last_err = Some(e);
                 }
             }
         }
 
+        if sent_count == 0 {
+            return Err(Error::Transport(
+                last_err.unwrap_or(crate::transport::TransportError::Unsupported),
+            ));
+        }
         Ok(sent_count)
     }
 
@@ -213,9 +342,10 @@ impl EventPublisher {
         instance_id: u16,
         event_group_id: u16,
     ) -> bool {
-        let mgr = self.subscriptions.read().await;
-        !mgr.get_subscribers(service_id, instance_id, event_group_id)
-            .is_empty()
+        self.subscriptions
+            .for_each_subscriber(service_id, instance_id, event_group_id, |_| {})
+            .await
+            > 0
     }
 
     /// Register a subscriber for an event group.
@@ -226,7 +356,7 @@ impl EventPublisher {
     ///
     /// Calling this method with the same `(service_id, instance_id,
     /// event_group_id, subscriber_addr)` tuple is idempotent — the
-    /// underlying [`SubscriptionManager`] deduplicates — so external
+    /// underlying [`super::SubscriptionManager`] deduplicates — so external
     /// dispatchers can safely call it on every incoming
     /// `SubscribeEventGroup` (including TTL refreshes) without growing
     /// the subscriber list.
@@ -242,15 +372,33 @@ impl EventPublisher {
     /// `remove_subscriber` when no refresh has arrived within the
     /// advertised TTL — otherwise subscribers accumulate for the
     /// lifetime of the process.
+    ///
+    /// # Errors
+    ///
+    /// Returns [`crate::server::SubscribeError`] when the underlying
+    /// [`super::SubscriptionManager`] cannot record the subscription because a
+    /// bounded capacity was hit:
+    /// - `SubscribersPerGroupFull` — the per-event-group subscriber list
+    ///   is full.
+    /// - `EventGroupsFull` — the outer event-group map is full.
+    ///
+    /// On `Err`, the subscriber was **not** registered and no events
+    /// will be delivered to `subscriber_addr` for this event group.
+    /// External dispatchers should treat this the same way the server's
+    /// own `run()` loop does: emit a `SubscribeNack` (or equivalent
+    /// upstream notification) so the peer does not assume it is
+    /// subscribed. A duplicate registration for an already-subscribed
+    /// address returns `Ok(())` (deduplicated).
     pub async fn register_subscriber(
         &self,
         service_id: u16,
         instance_id: u16,
         event_group_id: u16,
         subscriber_addr: std::net::SocketAddrV4,
-    ) {
-        let mut mgr = self.subscriptions.write().await;
-        mgr.subscribe(service_id, instance_id, event_group_id, subscriber_addr);
+    ) -> Result<(), crate::server::SubscribeError> {
+        self.subscriptions
+            .subscribe(service_id, instance_id, event_group_id, subscriber_addr)
+            .await
     }
 
     /// Remove a previously-registered subscriber from an event group.
@@ -270,8 +418,9 @@ impl EventPublisher {
         event_group_id: u16,
         subscriber_addr: std::net::SocketAddrV4,
     ) {
-        let mut mgr = self.subscriptions.write().await;
-        mgr.unsubscribe(service_id, instance_id, event_group_id, subscriber_addr);
+        self.subscriptions
+            .unsubscribe(service_id, instance_id, event_group_id, subscriber_addr)
+            .await;
     }
 
     /// Get the current number of subscribers for a specific event group
@@ -281,26 +430,58 @@ impl EventPublisher {
         instance_id: u16,
         event_group_id: u16,
     ) -> usize {
-        let mgr = self.subscriptions.read().await;
-        mgr.get_subscribers(service_id, instance_id, event_group_id)
-            .len()
+        self.subscriptions
+            .for_each_subscriber(service_id, instance_id, event_group_id, |_| {})
+            .await
     }
 }
 
-#[cfg(test)]
+#[cfg(all(test, feature = "server-tokio"))]
 mod tests {
     use super::*;
+    use crate::e2e::E2ERegistry;
     use crate::protocol::sd::test_support::{TestPayload, empty_sd_header};
+    use crate::server::SubscriptionManager;
+    use crate::tokio_transport::TokioSocket;
     use std::net::{Ipv4Addr, SocketAddrV4};
+    use std::sync::Mutex;
+    use std::vec;
+    use std::vec::Vec;
+    use tokio::net::UdpSocket;
+    use tokio::sync::RwLock;
+
+    /// Type alias bringing the tokio-flavor concrete type parameters back
+    /// into scope so tests can spell `TestEventPublisher` without
+    /// chasing the three-type-parameter signature on every call site.
+    type TestEventPublisher =
+        EventPublisher<Arc<Mutex<E2ERegistry>>, Arc<RwLock<SubscriptionManager>>, TokioSocket>;
 
     fn test_registry() -> Arc<Mutex<E2ERegistry>> {
         Arc::new(Mutex::new(E2ERegistry::new()))
     }
 
+    /// Bind a `TokioSocket` for tests. The publisher path under
+    /// `server-tokio` already depends on `tokio_transport`, so we use it
+    /// directly rather than constructing a `tokio::net::UdpSocket` and
+    /// adapting it.
+    async fn bind_tokio_socket() -> Arc<TokioSocket> {
+        use crate::transport::{SocketOptions, TransportFactory};
+        let factory = crate::tokio_transport::TokioTransport;
+        Arc::new(
+            factory
+                .bind(
+                    SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0),
+                    &SocketOptions::new(),
+                )
+                .await
+                .expect("bind tokio socket for test"),
+        )
+    }
+
     async fn make_publisher(
         subscriptions: Arc<RwLock<SubscriptionManager>>,
-    ) -> (EventPublisher, Arc<UdpSocket>) {
-        let socket = Arc::new(UdpSocket::bind("127.0.0.1:0").await.unwrap());
+    ) -> (TestEventPublisher, Arc<TokioSocket>) {
+        let socket = bind_tokio_socket().await;
         let publisher = EventPublisher::new(subscriptions, Arc::clone(&socket), test_registry());
         (publisher, socket)
     }
@@ -312,11 +493,7 @@ mod tests {
     #[tokio::test]
     async fn test_event_publisher_creation() {
         let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
-        let socket = Arc::new(
-            UdpSocket::bind("127.0.0.1:0")
-                .await
-                .expect("Failed to bind socket"),
-        );
+        let socket = bind_tokio_socket().await;
 
         let publisher = EventPublisher::new(subscriptions, socket, test_registry());
         assert!(std::mem::size_of_val(&publisher) > 0);
@@ -337,15 +514,14 @@ mod tests {
 
         // Create a receiver socket to act as subscriber
         let receiver = UdpSocket::bind("127.0.0.1:0").await.unwrap();
-        let recv_addr = match receiver.local_addr().unwrap() {
-            std::net::SocketAddr::V4(a) => a,
-            _ => panic!("expected v4"),
+        let std::net::SocketAddr::V4(recv_addr) = receiver.local_addr().unwrap() else {
+            panic!("expected v4 source address");
         };
 
         // Add subscriber
         {
             let mut mgr = subscriptions.write().await;
-            mgr.subscribe(0x5B, 1, 0x01, recv_addr);
+            mgr.subscribe(0x5B, 1, 0x01, recv_addr).unwrap();
         }
 
         let (publisher, _) = make_publisher(subscriptions).await;
@@ -376,19 +552,286 @@ mod tests {
         assert_eq!(count, 0);
     }
 
+    #[tokio::test]
+    async fn test_publish_raw_event_exceeds_udp_buffer_returns_capacity_error() {
+        let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
+        let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 9999);
+        {
+            let mut mgr = subscriptions.write().await;
+            mgr.subscribe(0x5B, 1, 0x01, addr).unwrap();
+        }
+        let (publisher, _) = make_publisher(subscriptions).await;
+
+        // Payload = UDP_BUFFER_SIZE forces total (header + payload) over the cap.
+        let too_big = vec![0u8; UDP_BUFFER_SIZE];
+        let err = publisher
+            .publish_raw_event(0x5B, 1, 0x01, 0x8001, 0x0001, 0x01, 0x01, &too_big)
+            .await
+            .expect_err("oversize payload must error, not report Ok(0)");
+        match err {
+            Error::Capacity(tag) => assert_eq!(tag, "udp_buffer"),
+            other => panic!("expected Error::Capacity(\"udp_buffer\"), got {other:?}"),
+        }
+    }
+
+    /// Regression for H12: when there ARE subscribers but every
+    /// `send_to` fails, `publish_event` must surface the underlying
+    /// transport error instead of masking the failure as `Ok(0)` —
+    /// which is indistinguishable from "no subscribers" to the caller.
+    ///
+    /// Uses a mock `TransportSocket` whose `send_to` always returns
+    /// `Err(TransportError::Io(IoErrorKind::NetworkUnreachable))`.
+    #[tokio::test]
+    async fn publish_event_returns_err_when_every_send_fails() {
+        use crate::transport::{IoErrorKind, ReceivedDatagram, TransportError, TransportSocket};
+        use core::future::{Future, Ready, ready};
+        use core::pin::Pin;
+        use core::task::{Context, Poll};
+
+        struct AlwaysFailSocket;
+
+        struct AlwaysFailSend;
+        impl Future for AlwaysFailSend {
+            type Output = Result<(), TransportError>;
+            fn poll(self: Pin<&mut Self>, _cx: &mut Context<'_>) -> Poll<Self::Output> {
+                Poll::Ready(Err(TransportError::Io(IoErrorKind::NetworkUnreachable)))
+            }
+        }
+
+        impl TransportSocket for AlwaysFailSocket {
+            type SendFuture<'a> = AlwaysFailSend;
+            type RecvFuture<'a> = Ready<Result<ReceivedDatagram, TransportError>>;
+
+            fn send_to<'a>(&'a self, _buf: &'a [u8], _t: SocketAddrV4) -> Self::SendFuture<'a> {
+                AlwaysFailSend
+            }
+            fn recv_from<'a>(&'a self, _buf: &'a mut [u8]) -> Self::RecvFuture<'a> {
+                ready(Err(TransportError::Unsupported))
+            }
+            fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+                Ok(SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0))
+            }
+            fn join_multicast_v4(&self, _g: Ipv4Addr, _i: Ipv4Addr) -> Result<(), TransportError> {
+                Ok(())
+            }
+            fn leave_multicast_v4(&self, _g: Ipv4Addr, _i: Ipv4Addr) -> Result<(), TransportError> {
+                Ok(())
+            }
+        }
+
+        let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
+        let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 9999);
+        {
+            let mut mgr = subscriptions.write().await;
+            mgr.subscribe(0x5B, 1, 0x01, addr).unwrap();
+        }
+        let publisher: EventPublisher<
+            Arc<Mutex<E2ERegistry>>,
+            Arc<RwLock<SubscriptionManager>>,
+            AlwaysFailSocket,
+        > = EventPublisher::new(subscriptions, Arc::new(AlwaysFailSocket), test_registry());
+
+        let msg = make_test_message();
+        let err = publisher
+            .publish_event(0x5B, 1, 0x01, &msg)
+            .await
+            .expect_err("total-failure path must surface Err, not Ok(0)");
+        match err {
+            Error::Transport(TransportError::Io(IoErrorKind::NetworkUnreachable)) => {}
+            other => panic!(
+                "expected Transport(Io(NetworkUnreachable)) from total-failure send, got {other:?}"
+            ),
+        }
+    }
+
+    /// Same H12 path through `publish_raw_event`.
+    #[tokio::test]
+    async fn publish_raw_event_returns_err_when_every_send_fails() {
+        use crate::transport::{IoErrorKind, ReceivedDatagram, TransportError, TransportSocket};
+        use core::future::{Future, Ready, ready};
+        use core::pin::Pin;
+        use core::task::{Context, Poll};
+
+        struct AlwaysFailSocket;
+        struct AlwaysFailSend;
+        impl Future for AlwaysFailSend {
+            type Output = Result<(), TransportError>;
+            fn poll(self: Pin<&mut Self>, _cx: &mut Context<'_>) -> Poll<Self::Output> {
+                Poll::Ready(Err(TransportError::Io(IoErrorKind::ConnectionRefused)))
+            }
+        }
+        impl TransportSocket for AlwaysFailSocket {
+            type SendFuture<'a> = AlwaysFailSend;
+            type RecvFuture<'a> = Ready<Result<ReceivedDatagram, TransportError>>;
+            fn send_to<'a>(&'a self, _buf: &'a [u8], _t: SocketAddrV4) -> Self::SendFuture<'a> {
+                AlwaysFailSend
+            }
+            fn recv_from<'a>(&'a self, _buf: &'a mut [u8]) -> Self::RecvFuture<'a> {
+                ready(Err(TransportError::Unsupported))
+            }
+            fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+                Ok(SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0))
+            }
+            fn join_multicast_v4(&self, _g: Ipv4Addr, _i: Ipv4Addr) -> Result<(), TransportError> {
+                Ok(())
+            }
+            fn leave_multicast_v4(&self, _g: Ipv4Addr, _i: Ipv4Addr) -> Result<(), TransportError> {
+                Ok(())
+            }
+        }
+
+        let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
+        let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 9999);
+        {
+            let mut mgr = subscriptions.write().await;
+            mgr.subscribe(0x5B, 1, 0x01, addr).unwrap();
+        }
+        let publisher: EventPublisher<
+            Arc<Mutex<E2ERegistry>>,
+            Arc<RwLock<SubscriptionManager>>,
+            AlwaysFailSocket,
+        > = EventPublisher::new(subscriptions, Arc::new(AlwaysFailSocket), test_registry());
+
+        let err = publisher
+            .publish_raw_event(0x5B, 1, 0x01, 0x8001, 0x0001, 0x01, 0x01, &[0xAA, 0xBB])
+            .await
+            .expect_err("total-failure path must surface Err, not Ok(0)");
+        match err {
+            Error::Transport(TransportError::Io(IoErrorKind::ConnectionRefused)) => {}
+            other => panic!("expected Transport(Io(ConnectionRefused)), got {other:?}"),
+        }
+    }
+
+    /// Regression guard against 343da67: without the pre-check, an oversize
+    /// message would fail with a less-actionable protocol I/O error from
+    /// `encode_to_slice`'s slice writer running out of buffer, rather than
+    /// the explicit `Error::Capacity("udp_buffer")` the new branch returns.
+    ///
+    /// Note: a subscriber must be registered first — the pre-check sits
+    /// after the `subscribers.is_empty()` early return, so without one the
+    /// function would return `Ok(0)` and never touch the new branch,
+    /// giving a false positive.
+    #[tokio::test]
+    async fn publish_event_pre_encode_exceeds_udp_buffer_returns_capacity_error() {
+        use crate::RawPayload;
+        use crate::protocol::{Header, MessageId, MessageType, MessageTypeField, ReturnCode};
+
+        let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
+        let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 9999);
+        {
+            let mut mgr = subscriptions.write().await;
+            mgr.subscribe(0x5B, 1, 0x01, addr).unwrap();
+        }
+        let (publisher, _) = make_publisher(subscriptions).await;
+
+        // Build a payload that exceeds the UDP cap by one byte based on
+        // `UDP_BUFFER_SIZE` instead of a hardcoded fixture length, so the
+        // test stays correct if the constant is retuned. Mirrors the
+        // client-side oversize fixture in
+        // `send_raw_message_exceeding_udp_buffer_returns_capacity_error`.
+        let message_id = MessageId::new_from_service_and_method(0x1234, 0x5678);
+        let payload_len = UDP_BUFFER_SIZE - 16 + 1  /* SOME/IP header is 16 bytes */;
+        let payload_bytes = vec![0u8; payload_len];
+        let payload = RawPayload::from_payload_bytes(message_id, &payload_bytes).unwrap();
+        let header = Header::new(
+            message_id,
+            0x0001_0001,
+            0x01,
+            0x01,
+            MessageTypeField::new(MessageType::Request, false),
+            ReturnCode::Ok,
+            payload_bytes.len(),
+        );
+        let message = Message::new(header, payload);
+        assert!(
+            message.required_size() > UDP_BUFFER_SIZE,
+            "fixture must exceed cap",
+        );
+
+        let err = publisher
+            .publish_event(0x5B, 1, 0x01, &message)
+            .await
+            .expect_err("oversize message must error, not report Ok(_)");
+        match err {
+            Error::Capacity(tag) => assert_eq!(tag, "udp_buffer"),
+            other => panic!("expected Error::Capacity(\"udp_buffer\"), got {other:?}"),
+        }
+    }
+
+    /// Messages whose raw encoded size fits `UDP_BUFFER_SIZE` but whose
+    /// E2E-protected size does not must be rejected with
+    /// `Error::Capacity("udp_buffer")` — guarding the post-protect branch
+    /// added alongside the raw-size pre-check.
+    #[tokio::test]
+    async fn test_publish_event_e2e_protected_exceeds_udp_buffer_returns_capacity_error() {
+        use crate::RawPayload;
+        use crate::e2e::{E2EProfile, Profile4Config};
+        use crate::protocol::MessageId;
+
+        // Register an E2E profile so the protect branch actually runs.
+        let message_id = MessageId::new_from_service_and_method(0x5B, 0x8001);
+        let key = E2EKey::from_message_id(message_id);
+        let mut reg = E2ERegistry::new();
+        reg.register(key, E2EProfile::Profile4(Profile4Config::new(0, 15)));
+        let e2e_registry = Arc::new(Mutex::new(reg));
+
+        // Pre-register a subscriber so we don't short-circuit on the
+        // "no subscribers" branch before reaching the E2E guard.
+        let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
+        {
+            let mut mgr = subscriptions.write().await;
+            mgr.subscribe(0x5B, 1, 0x01, SocketAddrV4::new(Ipv4Addr::LOCALHOST, 9999))
+                .unwrap();
+        }
+
+        let socket = bind_tokio_socket().await;
+        let publisher = EventPublisher::new(subscriptions, socket, e2e_registry);
+
+        // Size the payload from `UDP_BUFFER_SIZE` and `PROFILE4_HEADER_SIZE`
+        // so the raw message fits exactly within the cap — leaving Profile4
+        // protection to push the encoded message over the limit and
+        // exercise the post-protect guard — regardless of how
+        // `UDP_BUFFER_SIZE` is retuned.
+        let payload_len = UDP_BUFFER_SIZE - 16; // raw total == UDP_BUFFER_SIZE; SOME/IP header = 16
+        let payload_bytes = vec![0u8; payload_len];
+        let payload = RawPayload::from_payload_bytes(message_id, &payload_bytes).unwrap();
+        let header = Header::new_event(
+            message_id.service_id(),
+            message_id.method_id(),
+            0x0001_0001,
+            0x01,
+            0x01,
+            payload_bytes.len(),
+        );
+        let message = Message::new(header, payload);
+        assert!(
+            message.required_size() <= UDP_BUFFER_SIZE,
+            "fixture's raw size must fit the cap so the pre-encode check passes and \
+             we actually exercise the post-protect guard",
+        );
+
+        let err = publisher
+            .publish_event(0x5B, 1, 0x01, &message)
+            .await
+            .expect_err("E2E-protected oversize message must error, not report Ok(n)");
+        match err {
+            Error::Capacity(tag) => assert_eq!(tag, "udp_buffer"),
+            other => panic!("expected Error::Capacity(\"udp_buffer\"), got {other:?}"),
+        }
+    }
+
     #[tokio::test]
     async fn test_publish_raw_event_with_subscriber() {
         let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
 
         let receiver = UdpSocket::bind("127.0.0.1:0").await.unwrap();
-        let recv_addr = match receiver.local_addr().unwrap() {
-            std::net::SocketAddr::V4(a) => a,
-            _ => panic!("expected v4"),
+        let std::net::SocketAddr::V4(recv_addr) = receiver.local_addr().unwrap() else {
+            panic!("expected v4 source address");
         };
 
         {
             let mut mgr = subscriptions.write().await;
-            mgr.subscribe(0x5B, 1, 0x01, recv_addr);
+            mgr.subscribe(0x5B, 1, 0x01, recv_addr).unwrap();
         }
 
         let (publisher, _) = make_publisher(subscriptions).await;
@@ -417,13 +860,13 @@ mod tests {
     #[tokio::test]
     async fn test_subscriber_count() {
         let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
-        let addr1 = SocketAddrV4::new(Ipv4Addr::new(127, 0, 0, 1), 9001);
-        let addr2 = SocketAddrV4::new(Ipv4Addr::new(127, 0, 0, 1), 9002);
+        let addr1 = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 9001);
+        let addr2 = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 9002);
 
         {
             let mut mgr = subscriptions.write().await;
-            mgr.subscribe(0x5B, 1, 0x01, addr1);
-            mgr.subscribe(0x5B, 1, 0x01, addr2);
+            mgr.subscribe(0x5B, 1, 0x01, addr1).unwrap();
+            mgr.subscribe(0x5B, 1, 0x01, addr2).unwrap();
         }
 
         let (publisher, _) = make_publisher(subscriptions).await;
@@ -439,12 +882,8 @@ mod tests {
 
         {
             let mut mgr = subscriptions.write().await;
-            mgr.subscribe(
-                0x5B,
-                1,
-                0x01,
-                SocketAddrV4::new(Ipv4Addr::new(127, 0, 0, 1), 9001),
-            );
+            mgr.subscribe(0x5B, 1, 0x01, SocketAddrV4::new(Ipv4Addr::LOCALHOST, 9001))
+                .unwrap();
         }
 
         assert!(publisher.has_subscribers(0x5B, 1, 0x01).await);
@@ -466,7 +905,10 @@ mod tests {
         let (publisher, _) = make_publisher(Arc::clone(&subscriptions)).await;
 
         assert!(!publisher.has_subscribers(0x5B, 1, 0x01).await);
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_A).await;
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_A)
+            .await
+            .unwrap();
         assert!(publisher.has_subscribers(0x5B, 1, 0x01).await);
         assert_eq!(publisher.subscriber_count(0x5B, 1, 0x01).await, 1);
     }
@@ -478,9 +920,18 @@ mod tests {
 
         // Simulate TTL refreshes — the same (tuple, addr) called repeatedly
         // must not grow the subscriber list.
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_A).await;
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_A).await;
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_A).await;
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_A)
+            .await
+            .unwrap();
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_A)
+            .await
+            .unwrap();
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_A)
+            .await
+            .unwrap();
 
         assert_eq!(publisher.subscriber_count(0x5B, 1, 0x01).await, 1);
     }
@@ -490,8 +941,14 @@ mod tests {
         let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
         let (publisher, _) = make_publisher(Arc::clone(&subscriptions)).await;
 
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_A).await;
-        publisher.register_subscriber(0x5B, 1, 0x02, ADDR_A).await;
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_A)
+            .await
+            .unwrap();
+        publisher
+            .register_subscriber(0x5B, 1, 0x02, ADDR_A)
+            .await
+            .unwrap();
 
         assert_eq!(publisher.subscriber_count(0x5B, 1, 0x01).await, 1);
         assert_eq!(publisher.subscriber_count(0x5B, 1, 0x02).await, 1);
@@ -504,7 +961,10 @@ mod tests {
         let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
         let (publisher, _) = make_publisher(Arc::clone(&subscriptions)).await;
 
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_A).await;
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_A)
+            .await
+            .unwrap();
         assert!(publisher.has_subscribers(0x5B, 1, 0x01).await);
 
         publisher.remove_subscriber(0x5B, 1, 0x01, ADDR_A).await;
@@ -517,9 +977,18 @@ mod tests {
         let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
         let (publisher, _) = make_publisher(Arc::clone(&subscriptions)).await;
 
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_A).await;
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_B).await;
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_C).await;
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_A)
+            .await
+            .unwrap();
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_B)
+            .await
+            .unwrap();
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_C)
+            .await
+            .unwrap();
         assert_eq!(publisher.subscriber_count(0x5B, 1, 0x01).await, 3);
 
         publisher.remove_subscriber(0x5B, 1, 0x01, ADDR_B).await;
@@ -544,7 +1013,10 @@ mod tests {
         assert_eq!(publisher.subscriber_count(0x5B, 1, 0x01).await, 0);
 
         // Register one subscriber, then remove a different address.
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_A).await;
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_A)
+            .await
+            .unwrap();
         publisher.remove_subscriber(0x5B, 1, 0x01, ADDR_B).await;
         assert_eq!(publisher.subscriber_count(0x5B, 1, 0x01).await, 1);
 
@@ -558,8 +1030,14 @@ mod tests {
         let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
         let (publisher, _) = make_publisher(Arc::clone(&subscriptions)).await;
 
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_A).await;
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_B).await;
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_A)
+            .await
+            .unwrap();
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_B)
+            .await
+            .unwrap();
         assert!(publisher.has_subscribers(0x5B, 1, 0x01).await);
 
         publisher.remove_subscriber(0x5B, 1, 0x01, ADDR_A).await;
@@ -576,9 +1054,15 @@ mod tests {
         let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
         let (publisher, _) = make_publisher(Arc::clone(&subscriptions)).await;
 
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_A).await;
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_A)
+            .await
+            .unwrap();
         publisher.remove_subscriber(0x5B, 1, 0x01, ADDR_A).await;
-        publisher.register_subscriber(0x5B, 1, 0x01, ADDR_A).await;
+        publisher
+            .register_subscriber(0x5B, 1, 0x01, ADDR_A)
+            .await
+            .unwrap();
 
         assert_eq!(publisher.subscriber_count(0x5B, 1, 0x01).await, 1);
     }
diff --git a/src/server/mod.rs b/src/server/mod.rs
index 1532b98..04b2d84 100644
--- a/src/server/mod.rs
+++ b/src/server/mod.rs
@@ -8,25 +8,39 @@
 
 mod error;
 mod event_publisher;
+mod sd_state;
 mod service_info;
 mod subscription_manager;
 
 pub use error::Error;
 pub use event_publisher::EventPublisher;
-pub use service_info::{EventGroupInfo, ServiceInfo};
-pub use subscription_manager::SubscriptionManager;
+pub use service_info::{EventGroupInfo, ServiceInfo, Subscriber};
+pub use subscription_manager::{SubscribeError, SubscriptionHandle, SubscriptionManager};
 
-use crate::e2e::{E2EKey, E2EProfile, E2ERegistry};
+use sd_state::SdStateManager;
+
+use core::sync::atomic::{AtomicBool, Ordering};
+
+use crate::Timer;
+use crate::e2e::{E2EKey, E2EProfile};
 use crate::protocol::sd::{self, Entry, Flags, OptionsCount, ServiceEntry, TransportProtocol};
-use core::sync::atomic::Ordering;
+use crate::transport::{E2ERegistryHandle, SocketOptions, TransportFactory, TransportSocket};
+use futures::{FutureExt, pin_mut, select};
+#[cfg(test)]
+use std::vec::Vec;
 use std::{
     format,
-    net::{IpAddr, Ipv4Addr, SocketAddrV4},
-    sync::{Arc, Mutex, atomic::AtomicU16},
+    net::{Ipv4Addr, SocketAddrV4},
+    sync::Arc,
     vec,
-    vec::Vec,
 };
-use tokio::{net::UdpSocket, sync::RwLock};
+
+#[cfg(feature = "server-tokio")]
+use crate::e2e::E2ERegistry;
+#[cfg(feature = "server-tokio")]
+use std::sync::Mutex;
+#[cfg(feature = "server-tokio")]
+use tokio::sync::RwLock;
 
 /// Configuration for a SOME/IP service provider
 #[derive(Debug, Clone)]
@@ -45,9 +59,21 @@ pub struct ServerConfig {
     pub minor_version: u32,
     /// Service Discovery TTL (time to live)
     pub ttl: u32,
+    /// Event-group IDs the server publishes to. Used by the SD
+    /// `Subscribe` handler to NACK subscriptions for unknown groups
+    /// (per AUTOSAR SOME/IP-SD: an event group must be known before
+    /// subscription is granted). When empty, any event-group ID is
+    /// accepted — preserves back-compat for callers that have not
+    /// enumerated their groups; populate to opt into validation.
+    pub event_group_ids: heapless::Vec<u16, { ServerConfig::EVENT_GROUP_IDS_CAP }>,
 }
 
 impl ServerConfig {
+    /// Maximum number of event-group IDs trackable in
+    /// [`Self::event_group_ids`]. Matches `EVENT_GROUPS_CAP` in the
+    /// subscription manager.
+    pub const EVENT_GROUP_IDS_CAP: usize = 32;
+
     /// Create a new server configuration
     #[must_use]
     pub fn new(interface: Ipv4Addr, local_port: u16, service_id: u16, instance_id: u16) -> Self {
@@ -59,34 +85,114 @@ impl ServerConfig {
             major_version: 1,
             minor_version: 0,
             ttl: 3, // 3 seconds is typical for SOME/IP
+            event_group_ids: heapless::Vec::new(),
         }
     }
+
+    /// Returns `true` if `event_group_id` is registered, OR
+    /// [`Self::event_group_ids`] is empty (validation disabled).
+    #[must_use]
+    pub fn accepts_event_group(&self, event_group_id: u16) -> bool {
+        self.event_group_ids.is_empty() || self.event_group_ids.contains(&event_group_id)
+    }
 }
 
-/// SOME/IP Server that can offer services and publish events
-pub struct Server {
+/// Bundle of pluggable infrastructure passed to [`Server::new_with_deps`].
+/// Mirrors `crate::ClientDeps` (under `client`) but with the server's
+/// smaller surface
+/// — no `Spawner` (server has no internal task spawning), no
+/// `InterfaceHandle` (interface lives in [`ServerConfig`]).
+///
+/// All four fields are public so callers can construct the struct
+/// inline.
+pub struct ServerDeps<F, Tm, R, S>
+where
+    F: TransportFactory,
+    Tm: Timer,
+    R: E2ERegistryHandle,
+    S: SubscriptionHandle,
+{
+    /// Transport factory used to bind the unicast and SD sockets.
+    pub factory: F,
+    /// Async sleep primitive used by the announcement loop's 1-second tick.
+    pub timer: Tm,
+    /// Shared E2E registry handle for runtime E2E configuration.
+    pub e2e_registry: R,
+    /// Shared subscription manager handle. The convenience constructor
+    /// `Server::new` (under `server-tokio`) builds an
+    /// `Arc<RwLock<SubscriptionManager>>` for this; bare-metal callers
+    /// supply their own [`SubscriptionHandle`] impl.
+    pub subscriptions: S,
+}
+
+/// SOME/IP Server that can offer services and publish events.
+///
+/// Generic over the four pluggable infrastructure types bundled in
+/// [`ServerDeps`]:
+/// - `R: E2ERegistryHandle` — runtime E2E configuration registry
+/// - `S: SubscriptionHandle` — event-group subscription state
+/// - `F: TransportFactory` — socket primitive (carried as a stored
+///   unit-struct in the tokio path; bare-metal impls may carry state)
+/// - `Tm: Timer` — async sleep used by the announcement loop
+///
+/// The convenience constructors `Self::new` / `Self::new_with_loopback`
+/// / `Self::new_passive` (under the `server-tokio` feature) instantiate
+/// these as `Arc<Mutex<E2ERegistry>>` / `Arc<RwLock<SubscriptionManager>>`
+/// / `TokioTransport` / `TokioTimer`. Bare-metal callers use
+/// [`Self::new_with_deps`] (under `server`) and supply their own.
+pub struct Server<R, S, F, Tm>
+where
+    R: E2ERegistryHandle,
+    S: SubscriptionHandle,
+    F: TransportFactory + Send + Sync + 'static,
+    F::Socket: Send + Sync + 'static,
+    Tm: Timer + Clone + Send + Sync + 'static,
+{
     config: ServerConfig,
     /// Socket for receiving subscription requests
-    unicast_socket: Arc<UdpSocket>,
+    unicast_socket: Arc<F::Socket>,
     /// Socket for sending SD announcements
-    sd_socket: Arc<UdpSocket>,
+    sd_socket: Arc<F::Socket>,
     /// Subscription manager
-    subscriptions: Arc<RwLock<SubscriptionManager>>,
+    subscriptions: S,
     /// Event publisher
-    publisher: Arc<EventPublisher>,
-    /// Incrementing session ID for SD messages
-    sd_session_id: Arc<AtomicU16>,
+    publisher: Arc<EventPublisher<R, S, F::Socket>>,
+    /// SD session-ID counter and announcement emitter
+    sd_state: Arc<SdStateManager>,
     /// Shared E2E registry for runtime E2E configuration
-    e2e_registry: Arc<Mutex<E2ERegistry>>,
-    /// `true` if this server was constructed via [`Server::new_passive`].
+    e2e_registry: R,
+    /// Transport factory. Used at construction time to bind sockets;
+    /// retained on the struct so bare-metal factories that carry state
+    /// (e.g. an embassy-net `Stack` handle) survive the constructor.
+    /// On `server-tokio` builds this is a zero-sized `TokioTransport`.
+    #[allow(dead_code)]
+    factory: F,
+    /// Async sleep primitive used by [`Self::announcement_loop`]'s
+    /// 1-second tick. On `server-tokio` builds this is `TokioTimer`
+    /// (wrapping `tokio::time::sleep`).
+    timer: Tm,
+    /// `true` if this server was constructed via `Server::new_passive`.
     /// Passive servers have no real SD socket bound to port 30490; their
-    /// SD handling is managed externally. Calling [`Self::start_announcing`]
+    /// SD handling is managed externally. Calling [`Self::announcement_loop`]
     /// or [`Self::run`] on a passive server is a programming error and
     /// returns an [`Error::Io`] with [`std::io::ErrorKind::InvalidInput`].
     is_passive: bool,
+    /// Set the first time [`Self::announcement_loop`] is called. A
+    /// second call returns `Err(Error::Io(InvalidInput))` so two
+    /// independent futures cannot race on the same SD socket and
+    /// session counter.
+    announcement_loop_started: AtomicBool,
 }
 
-impl Server {
+#[cfg(feature = "server-tokio")]
+impl
+    Server<
+        Arc<Mutex<E2ERegistry>>,
+        Arc<RwLock<SubscriptionManager>>,
+        crate::tokio_transport::TokioTransport,
+        crate::tokio_transport::TokioTimer,
+    >
+{
     /// Create a new SOME/IP server
     ///
     /// # Errors
@@ -125,175 +231,285 @@ impl Server {
         config: ServerConfig,
         multicast_loopback: bool,
     ) -> Result<Self, Error> {
-        // Bind unicast socket for receiving subscriptions
+        let deps = ServerDeps {
+            factory: crate::tokio_transport::TokioTransport,
+            timer: crate::tokio_transport::TokioTimer,
+            e2e_registry: Arc::new(Mutex::new(E2ERegistry::new())),
+            subscriptions: Arc::new(RwLock::new(SubscriptionManager::new())),
+        };
+        Self::new_with_deps(deps, config, multicast_loopback).await
+    }
+
+    /// Create a passive SOME/IP server.
+    ///
+    /// A passive server binds its unicast socket at `config.local_port` as
+    /// usual (so `publish_raw_event` has a real source port matching the
+    /// endpoint advertised in external `OfferService` messages), but binds
+    /// its SD socket to an ephemeral port instead of the SOME/IP SD port
+    /// (30490). The passive server is therefore **not** part of the
+    /// `SO_REUSEPORT` group at 30490, and the kernel will never deliver SD
+    /// traffic destined for 30490 to it.
+    ///
+    /// Passive servers are intended for use with an external SD dispatcher
+    /// (for example, a `Client` whose discovery socket receives all
+    /// incoming `SubscribeEventGroup` / `FindService` messages and routes
+    /// them to the right `EventPublisher` via
+    /// [`EventPublisher::register_subscriber`]). Do **not** call
+    /// [`Server::announcement_loop`] or spawn [`Server::run`] on a passive
+    /// server — the external dispatcher owns those responsibilities.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if binding either socket fails.
+    pub async fn new_passive(config: ServerConfig) -> Result<Self, Error> {
+        let deps = ServerDeps {
+            factory: crate::tokio_transport::TokioTransport,
+            timer: crate::tokio_transport::TokioTimer,
+            e2e_registry: Arc::new(Mutex::new(E2ERegistry::new())),
+            subscriptions: Arc::new(RwLock::new(SubscriptionManager::new())),
+        };
+        Self::new_passive_with_deps(deps, config).await
+    }
+}
+
+impl<R, S, F, Tm> Server<R, S, F, Tm>
+where
+    R: E2ERegistryHandle,
+    S: SubscriptionHandle,
+    F: TransportFactory + Send + Sync + 'static,
+    F::Socket: Send + Sync + 'static,
+    for<'a> <F::Socket as TransportSocket>::SendFuture<'a>: Send,
+    for<'a> <F::Socket as TransportSocket>::RecvFuture<'a>: Send,
+    Tm: Timer + Clone + Send + Sync + 'static,
+{
+    /// Bare-metal-friendly constructor that takes every dependency
+    /// explicitly via a [`ServerDeps`] bundle. The `server-tokio`
+    /// convenience constructors (`Self::new`, `Self::new_with_loopback`,
+    /// `Self::new_passive`) ultimately delegate here.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if binding the unicast or SD socket via
+    /// [`TransportFactory::bind`] fails, or if joining the SD multicast
+    /// group fails.
+    pub async fn new_with_deps(
+        deps: ServerDeps<F, Tm, R, S>,
+        mut config: ServerConfig,
+        multicast_loopback: bool,
+    ) -> Result<Self, Error> {
+        let ServerDeps {
+            factory,
+            timer,
+            e2e_registry,
+            subscriptions,
+        } = deps;
+
+        // Bind unicast socket for receiving subscriptions.
         let unicast_addr = SocketAddrV4::new(config.interface, config.local_port);
-        let unicast_socket = Arc::new(UdpSocket::bind(unicast_addr).await?);
+        let unicast_socket = Arc::new(factory.bind(unicast_addr, &SocketOptions::new()).await?);
+        // If the caller passed local_port = 0, the kernel picked an
+        // ephemeral port. Back-fill the config so SD offers and event
+        // publishers advertise the actual bound port instead of 0.
+        let bound_port = unicast_socket.local_addr()?.port();
+        config.local_port = bound_port;
         tracing::info!(
-            "Server bound to {} for service 0x{:04X}",
-            unicast_addr,
+            "Server bound to {}:{} for service 0x{:04X}",
+            config.interface,
+            bound_port,
             config.service_id
         );
 
-        // Bind SD socket for sending/receiving SD messages (must use SD port 30490)
-        let expected_sd_port = sd::MULTICAST_PORT;
-        let sd_bind_addr =
-            std::net::SocketAddr::new(IpAddr::V4(config.interface), expected_sd_port);
-        let sd_raw_socket = socket2::Socket::new(
-            socket2::Domain::IPV4,
-            socket2::Type::DGRAM,
-            Some(socket2::Protocol::UDP),
-        )?;
-        sd_raw_socket.set_reuse_address(true)?;
-        #[cfg(unix)]
-        sd_raw_socket.set_reuse_port(true)?;
-        sd_raw_socket.set_multicast_if_v4(&config.interface)?;
-        sd_raw_socket.set_multicast_loop_v4(multicast_loopback)?;
-        sd_raw_socket.bind(&sd_bind_addr.into())?;
-        sd_raw_socket.set_nonblocking(true)?;
-        let sd_std_socket: std::net::UdpSocket = sd_raw_socket.into();
-        let sd_socket = UdpSocket::from_std(sd_std_socket)?;
-
-        // Join SD multicast group to receive FindService and SubscribeEventGroup
+        // Bind SD socket for sending/receiving SD messages (must use SD port 30490).
+        let mut sd_opts = SocketOptions::new();
+        sd_opts.reuse_address = true;
+        sd_opts.reuse_port = true;
+        sd_opts.multicast_if_v4 = Some(config.interface);
+        sd_opts.multicast_loop_v4 = Some(multicast_loopback);
+        let sd_addr = SocketAddrV4::new(config.interface, sd::MULTICAST_PORT);
+        let sd_socket = factory.bind(sd_addr, &sd_opts).await?;
         sd_socket.join_multicast_v4(sd::MULTICAST_IP, config.interface)?;
-        let actual_sd_addr = sd_socket.local_addr()?;
+        let sd_socket = Arc::new(sd_socket);
         tracing::info!(
             "Server SD socket bound to {} (expected port {}), joined multicast {}",
-            actual_sd_addr,
-            expected_sd_port,
+            sd_addr,
+            sd::MULTICAST_PORT,
             sd::MULTICAST_IP
         );
-        if let std::net::SocketAddr::V4(v4) = actual_sd_addr
-            && v4.port() != expected_sd_port
-        {
-            tracing::error!(
-                "SD socket port mismatch! Expected {}, got {}. Offers will use wrong source port.",
-                expected_sd_port,
-                v4.port()
-            );
-        }
 
-        let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
-        let e2e_registry = Arc::new(Mutex::new(E2ERegistry::new()));
         let publisher = Arc::new(EventPublisher::new(
-            Arc::clone(&subscriptions),
+            subscriptions.clone(),
             Arc::clone(&unicast_socket),
-            Arc::clone(&e2e_registry),
+            e2e_registry.clone(),
         ));
 
         Ok(Self {
             config,
             unicast_socket,
-            sd_socket: Arc::new(sd_socket),
+            sd_socket,
             subscriptions,
             publisher,
-            sd_session_id: Arc::new(AtomicU16::new(1)),
+            sd_state: Arc::new(SdStateManager::new()),
             e2e_registry,
+            factory,
+            timer,
             is_passive: false,
+            announcement_loop_started: AtomicBool::new(false),
         })
     }
 
-    /// Create a passive SOME/IP server.
+    /// Bare-metal-friendly passive-server constructor.
     ///
-    /// A passive server binds its unicast socket at `config.local_port` as
-    /// usual (so `publish_raw_event` has a real source port matching the
-    /// endpoint advertised in external `OfferService` messages), but binds
-    /// its SD socket to an ephemeral port instead of the SOME/IP SD port
-    /// (30490). The passive server is therefore **not** part of the
-    /// `SO_REUSEPORT` group at 30490, and the kernel will never deliver SD
-    /// traffic destined for 30490 to it.
-    ///
-    /// Passive servers are intended for use with an external SD dispatcher
-    /// (for example, a `Client` whose discovery socket receives all
-    /// incoming `SubscribeEventGroup` / `FindService` messages and routes
-    /// them to the right `EventPublisher` via
-    /// [`EventPublisher::register_subscriber`]). Do **not** call
-    /// [`Server::start_announcing`] or spawn [`Server::run`] on a passive
-    /// server — the external dispatcher owns those responsibilities.
+    /// Passive servers bind a unicast socket as usual but bind their SD
+    /// socket to an ephemeral port (port 0) instead of the SOME/IP SD
+    /// port — see `Server::new_passive` under `server-tokio` for the
+    /// full explanation. Calling [`Self::announcement_loop`] or
+    /// [`Self::run`] on the result is a programming error.
     ///
     /// # Errors
     ///
     /// Returns an error if binding either socket fails.
-    pub async fn new_passive(config: ServerConfig) -> Result<Self, Error> {
-        // Bind unicast socket at the configured local_port — the passive
-        // server still needs a real source port so published events appear
-        // to come from the endpoint advertised in the external OfferService.
+    pub async fn new_passive_with_deps(
+        deps: ServerDeps<F, Tm, R, S>,
+        mut config: ServerConfig,
+    ) -> Result<Self, Error> {
+        let ServerDeps {
+            factory,
+            timer,
+            e2e_registry,
+            subscriptions,
+        } = deps;
+
+        // Bind unicast socket at the configured local_port.
         let unicast_addr = SocketAddrV4::new(config.interface, config.local_port);
-        let unicast_socket = Arc::new(UdpSocket::bind(unicast_addr).await?);
+        let unicast_socket = Arc::new(factory.bind(unicast_addr, &SocketOptions::new()).await?);
+        // Back-fill the actual bound port if the caller passed 0.
+        let bound_port = unicast_socket.local_addr()?.port();
+        config.local_port = bound_port;
         tracing::info!(
-            "Passive server bound to {} for service 0x{:04X}",
-            unicast_addr,
+            "Passive server bound to {}:{} for service 0x{:04X}",
+            config.interface,
+            bound_port,
             config.service_id
         );
 
-        // Bind a placeholder SD socket on an ephemeral port. Nothing will
-        // route to it (neither multicast nor unicast on 30490), and neither
-        // `start_announcing` nor `run` should be called for a passive
-        // server. We still allocate it so the `Server` struct shape is
-        // identical to the full-server path.
-        let sd_placeholder_addr = std::net::SocketAddr::new(IpAddr::V4(config.interface), 0);
-        let sd_socket = UdpSocket::bind(sd_placeholder_addr).await?;
-        // Log the bound address using `Debug` on the `Result<SocketAddr>`
-        // so a hypothetical `local_addr` failure does not propagate as a
-        // construction error and we do not introduce an unreachable Err
-        // arm purely for defensive logging.
+        // Placeholder SD socket on an ephemeral port — no multicast options,
+        // no group join. Nothing should route to it.
+        let sd_placeholder_addr = SocketAddrV4::new(config.interface, 0);
+        let sd_socket = Arc::new(
+            factory
+                .bind(sd_placeholder_addr, &SocketOptions::new())
+                .await?,
+        );
         tracing::info!(
-            "Passive server SD placeholder socket bound to {:?} (not in SD reuseport group)",
-            sd_socket.local_addr()
+            "Passive server SD placeholder socket bound near {} (not in SD reuseport group)",
+            sd_placeholder_addr
         );
 
-        let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
-        let e2e_registry = Arc::new(Mutex::new(E2ERegistry::new()));
         let publisher = Arc::new(EventPublisher::new(
-            Arc::clone(&subscriptions),
+            subscriptions.clone(),
             Arc::clone(&unicast_socket),
-            Arc::clone(&e2e_registry),
+            e2e_registry.clone(),
         ));
 
         Ok(Self {
             config,
             unicast_socket,
-            sd_socket: Arc::new(sd_socket),
+            sd_socket,
             subscriptions,
             publisher,
-            sd_session_id: Arc::new(AtomicU16::new(1)),
+            sd_state: Arc::new(SdStateManager::new()),
             e2e_registry,
+            factory,
+            timer,
             is_passive: true,
+            announcement_loop_started: AtomicBool::new(false),
         })
     }
+}
 
-    /// Start announcing the service via Service Discovery
+impl<R, S, F, Tm> Server<R, S, F, Tm>
+where
+    R: E2ERegistryHandle,
+    S: SubscriptionHandle,
+    F: TransportFactory + Send + Sync + 'static,
+    F::Socket: Send + Sync + 'static,
+    for<'a> F::BindFuture<'a>: Send,
+    for<'a> <F::Socket as TransportSocket>::SendFuture<'a>: Send,
+    for<'a> <F::Socket as TransportSocket>::RecvFuture<'a>: Send,
+    Tm: Timer + Clone + Send + Sync + 'static,
+    for<'a> Tm::SleepFuture<'a>: Send,
+{
+    /// Build the periodic-SD-announcement future.
     ///
-    /// This sends periodic `OfferService` messages to the SD multicast group
+    /// Returns a future that sends an `OfferService` message to the SD
+    /// multicast group every second. The caller must drive the future
+    /// (typically via `tokio::spawn`) for announcements to fire; this
+    /// function does no work on its own.
     ///
-    /// # Errors
+    /// ```no_run
+    /// # #[cfg(feature = "server-tokio")] {
+    /// # use simple_someip::server::{Server, ServerConfig};
+    /// # use std::net::Ipv4Addr;
+    /// # async fn demo() -> Result<(), simple_someip::server::Error> {
+    /// # let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 30490, 0, 0);
+    /// # let server = Server::new(config).await?;
+    /// let announce_fut = server.announcement_loop()?;
+    /// tokio::spawn(announce_fut);
+    /// # Ok(())
+    /// # }
+    /// # }
+    /// ```
     ///
-    /// Returns [`Error::Io`] with [`std::io::ErrorKind::InvalidInput`] if
-    /// called on a server constructed via [`Server::new_passive`] — passive
-    /// servers have no real SD socket bound to port 30490, so any
-    /// announcements would go out with an incorrect source port.
+    /// # Errors
     ///
-    /// Otherwise currently always returns `Ok(())`; SD send failures are
-    /// logged internally.
-    pub fn start_announcing(&self) -> Result<(), Error> {
+    /// Returns [`Error::Io`] with [`std::io::ErrorKind::InvalidInput`] if:
+    /// - called on a server constructed via `Server::new_passive` — passive
+    ///   servers have no real SD socket bound to port 30490, so any
+    ///   announcements would go out with an incorrect source port; or
+    /// - called twice on the same server. Two announcement futures
+    ///   driving the same SD socket and session counter would double the
+    ///   announcement rate and race on the wrap-flag latch. Drop the
+    ///   first future to disable announcements before requesting a new
+    ///   one (which currently still requires a fresh `Server`).
+    #[must_use = "the returned announcement-loop future must be spawned (e.g. tokio::spawn) or awaited for the server to emit SD announcements; dropping it silently disables announcements"]
+    pub fn announcement_loop(
+        &self,
+    ) -> Result<impl core::future::Future<Output = ()> + Send + 'static, Error> {
         if self.is_passive {
             return Err(Error::Io(std::io::Error::new(
                 std::io::ErrorKind::InvalidInput,
                 format!(
-                    "start_announcing called on passive Server for service 0x{:04X}; \
+                    "announcement_loop called on passive Server for service 0x{:04X}; \
                      announcements must be driven externally (e.g. via \
-                     `simple_someip::Client::start_sd_announcements`)",
+                     `simple_someip::Client::sd_announcements_loop`)",
+                    self.config.service_id
+                ),
+            )));
+        }
+        if self
+            .announcement_loop_started
+            .compare_exchange(false, true, Ordering::AcqRel, Ordering::Acquire)
+            .is_err()
+        {
+            return Err(Error::Io(std::io::Error::new(
+                std::io::ErrorKind::InvalidInput,
+                format!(
+                    "announcement_loop already started for service 0x{:04X}; \
+                     two announcement futures cannot share the same SD socket \
+                     and session counter",
                     self.config.service_id
                 ),
             )));
         }
         let config = self.config.clone();
         let sd_socket = Arc::clone(&self.sd_socket);
-        let sd_session_id = Arc::clone(&self.sd_session_id);
+        let sd_state = Arc::clone(&self.sd_state);
+        let timer = self.timer.clone();
 
-        tokio::spawn(async move {
+        Ok(async move {
             let mut announcement_count = 0u32;
             loop {
-                match Self::send_offer_service(&config, &sd_socket, &sd_session_id).await {
+                match sd_state.send_offer_service(&config, &*sd_socket).await {
                     Ok(()) => {
                         announcement_count += 1;
                         if announcement_count == 1 {
@@ -314,86 +530,13 @@ impl Server {
                     }
                 }
 
-                // Send announcements every 1 second
-                tokio::time::sleep(tokio::time::Duration::from_secs(1)).await;
+                // Send announcements every 1 second. Sleep goes through
+                // the `Timer` trait so bare-metal consumers can swap in
+                // a different timer impl; today it resolves to
+                // `TokioTimer` under the `server-tokio` feature.
+                timer.sleep(core::time::Duration::from_secs(1)).await;
             }
-        });
-
-        Ok(())
-    }
-
-    /// Send an `OfferService` message via Service Discovery
-    async fn send_offer_service(
-        config: &ServerConfig,
-        socket: &UdpSocket,
-        session_id: &AtomicU16,
-    ) -> Result<(), Error> {
-        use crate::protocol::Header as SomeIpHeader;
-        use crate::traits::WireFormat;
-
-        // Create OfferService entry
-        let entry = Entry::OfferService(ServiceEntry {
-            index_first_options_run: 0,
-            index_second_options_run: 0,
-            options_count: OptionsCount::new(1, 0),
-            service_id: config.service_id,
-            instance_id: config.instance_id,
-            major_version: config.major_version,
-            ttl: config.ttl,
-            minor_version: config.minor_version,
-        });
-
-        // Create IPv4 endpoint option
-        let option = sd::Options::IpV4Endpoint {
-            ip: config.interface,
-            port: config.local_port,
-            protocol: TransportProtocol::Udp,
-        };
-
-        let entries = [entry];
-        let options = [option];
-        let sd_payload = sd::Header::new(Flags::new(true, true), &entries, &options);
-
-        // Encode SD payload
-        let mut sd_data = Vec::new();
-        sd_payload.encode(&mut sd_data)?;
-
-        // Increment session ID (wrapping from 0xFFFF back to 0x0001, skipping 0)
-        let prev = session_id
-            .fetch_update(Ordering::Relaxed, Ordering::Relaxed, |v| {
-                let next = v.wrapping_add(1);
-                Some(if next == 0 { 1 } else { next })
-            })
-            .unwrap();
-        let next = prev.wrapping_add(1);
-        let sid = u32::from(if next == 0 { 1 } else { next });
-
-        // Wrap in SOME/IP header for SD (service 0xFFFF, method 0x8100)
-        let someip_header = SomeIpHeader::new_sd(sid, sd_data.len());
-
-        // Encode complete SOME/IP-SD message
-        let mut buffer = Vec::new();
-        someip_header.encode(&mut buffer)?;
-        buffer.extend_from_slice(&sd_data);
-
-        let multicast_addr = SocketAddrV4::new(sd::MULTICAST_IP, sd::MULTICAST_PORT);
-
-        tracing::trace!(
-            "Sending OfferService: service=0x{:04X}, instance={}, port={}, size={} bytes",
-            config.service_id,
-            config.instance_id,
-            config.local_port,
-            buffer.len()
-        );
-        tracing::trace!(
-            "OfferService data: {:02X?}",
-            &buffer[..buffer.len().min(64)]
-        );
-
-        socket.send_to(&buffer, multicast_addr).await?;
-        tracing::trace!("Sent to {}", multicast_addr);
-
-        Ok(())
+        })
     }
 
     /// Send a unicast `OfferService` to a specific address (in response to `FindService`)
@@ -420,19 +563,22 @@ impl Server {
 
         let entries = [entry];
         let options = [option];
-        let sd_payload = sd::Header::new(Flags::new(true, true), &entries, &options);
-
-        let mut sd_data = Vec::new();
-        sd_payload.encode(&mut sd_data)?;
-
-        let sid = self.next_sd_session_id();
-        let someip_header = SomeIpHeader::new_sd(sid, sd_data.len());
-
-        let mut buffer = Vec::new();
-        someip_header.encode(&mut buffer)?;
-        buffer.extend_from_slice(&sd_data);
-
-        self.sd_socket.send_to(&buffer, target).await?;
+        // Atomic (sid, reboot_flag) pair so concurrent emissions cannot
+        // race around the wrap boundary — see
+        // `SdStateManager::next_session_id_with_reboot_flag` docs.
+        let (sid, reboot_flag) = self.sd_state.next_session_id_with_reboot_flag();
+        let sd_payload = sd::Header::new(Flags::new_sd(reboot_flag), &entries, &options);
+
+        let mut buffer = [0u8; crate::UDP_BUFFER_SIZE];
+        let sd_data_len = sd_payload.encode_to_slice(&mut buffer[16..])?;
+        let someip_header = SomeIpHeader::new_sd(sid, sd_data_len);
+        someip_header.encode_to_slice(&mut buffer[..16])?;
+        let total_len = 16 + sd_data_len;
+
+        let target_v4 = socket_addr_v4(target)?;
+        self.sd_socket
+            .send_to(&buffer[..total_len], target_v4)
+            .await?;
         tracing::debug!(
             "Sent unicast OfferService to {} for service 0x{:04X}",
             target,
@@ -442,23 +588,9 @@ impl Server {
         Ok(())
     }
 
-    /// Get the next SD session ID (`client_id=0`, `session_id` incrementing), skipping 0
-    fn next_sd_session_id(&self) -> u32 {
-        let prev = self
-            .sd_session_id
-            .fetch_update(Ordering::Relaxed, Ordering::Relaxed, |v| {
-                let next = v.wrapping_add(1);
-                Some(if next == 0 { 1 } else { next })
-            })
-            .unwrap();
-        // fetch_update returns the previous value; compute the same next value
-        let next = prev.wrapping_add(1);
-        u32::from(if next == 0 { 1 } else { next })
-    }
-
     /// Get the event publisher for sending events
     #[must_use]
-    pub fn publisher(&self) -> Arc<EventPublisher> {
+    pub fn publisher(&self) -> Arc<EventPublisher<R, S, F::Socket>> {
         Arc::clone(&self.publisher)
     }
 
@@ -467,8 +599,11 @@ impl Server {
     /// # Errors
     ///
     /// Returns an error if the socket's local address cannot be retrieved.
-    pub fn unicast_local_addr(&self) -> Result<std::net::SocketAddr, std::io::Error> {
-        self.unicast_socket.local_addr()
+    pub fn unicast_local_addr(&self) -> Result<std::net::SocketAddr, Error> {
+        match self.unicast_socket.local_addr() {
+            Ok(v4) => Ok(std::net::SocketAddr::V4(v4)),
+            Err(e) => Err(Error::Transport(e)),
+        }
     }
 
     /// Update the configured local port (useful after binding to ephemeral port 0).
@@ -480,27 +615,13 @@ impl Server {
     ///
     /// Once registered, outgoing events published via [`EventPublisher::publish_event`]
     /// will have E2E protection applied automatically.
-    ///
-    /// # Panics
-    ///
-    /// Panics if the E2E registry mutex is poisoned.
     pub fn register_e2e(&self, key: E2EKey, profile: E2EProfile) {
-        self.e2e_registry
-            .lock()
-            .expect("e2e registry lock poisoned")
-            .register(key, profile);
+        self.e2e_registry.register(key, profile);
     }
 
     /// Remove E2E configuration for the given key.
-    ///
-    /// # Panics
-    ///
-    /// Panics if the E2E registry mutex is poisoned.
     pub fn unregister_e2e(&self, key: &E2EKey) {
-        self.e2e_registry
-            .lock()
-            .expect("e2e registry lock poisoned")
-            .unregister(key);
+        self.e2e_registry.unregister(key);
     }
 
     /// Run the server event loop
@@ -512,7 +633,7 @@ impl Server {
     /// # Errors
     ///
     /// Returns [`Error::Io`] with [`std::io::ErrorKind::InvalidInput`] if
-    /// called on a server constructed via [`Server::new_passive`] — passive
+    /// called on a server constructed via `Server::new_passive` — passive
     /// servers have no real SD socket to read from, so the run loop would
     /// block forever on the ephemeral placeholder socket.
     ///
@@ -534,21 +655,68 @@ impl Server {
             )));
         }
 
+        // Incoming-peer buffers sized to the IP datagram limit (64 KiB - 1).
+        // Do NOT shrink to `UDP_BUFFER_SIZE` (1500): peer SD messages are
+        // bounded by the link MTU but `recv_from` here is a server-side
+        // sink for any peer datagram landing on the SD/unicast port, and
+        // larger-than-MTU peer messages must surface (or be cleanly
+        // truncated by the kernel) rather than being silently capped at
+        // 1500 by an undersized buffer. Out-going `EventPublisher` paths
+        // do use the smaller `UDP_BUFFER_SIZE` because we control the
+        // wire size of what we emit; that asymmetry is intentional.
         let mut unicast_buf = vec![0u8; 65535];
         let mut sd_buf = vec![0u8; 65535];
 
         loop {
-            let (data, len, addr, source) = tokio::select! {
-                result = self.unicast_socket.recv_from(&mut unicast_buf) => {
-                    let (len, addr) = result?;
-                    (&unicast_buf[..], len, addr, "unicast")
-                }
-                result = self.sd_socket.recv_from(&mut sd_buf) => {
-                    let (len, addr) = result?;
-                    (&sd_buf[..], len, addr, "sd-multicast")
+            // `select!` (not `select_biased!`) gives pseudo-random fairness
+            // across ready arms each poll — matches the prior
+            // `tokio::select!` behavior and avoids starving either the
+            // unicast or SD-multicast arm under sustained one-sided load.
+            //
+            // SAFETY: both arms call `TransportSocket::recv_from`. The
+            // `TokioSocket` backend is cancel-safe per tokio docs — a
+            // non-selected arm can be dropped without losing in-flight
+            // kernel state. Custom transport backends MUST provide the
+            // same guarantee. A future contributor adding a
+            // non-cancel-safe `FusedFuture` arm here would silently lose
+            // state when the arm is dropped on a select win. Both futures
+            // must therefore stay `Send + FusedFuture + Unpin` *and*
+            // cancel-safe.
+            //
+            // Fresh futures are constructed each iteration so the borrows
+            // of `unicast_buf` / `sd_buf` / the sockets end when the
+            // select macro returns, freeing the buffer we index into
+            // below.
+            let (len, addr, source, from_unicast) = {
+                let unicast_fut = self.unicast_socket.recv_from(&mut unicast_buf).fuse();
+                let sd_fut = self.sd_socket.recv_from(&mut sd_buf).fuse();
+                pin_mut!(unicast_fut, sd_fut);
+                select! {
+                    result = unicast_fut => {
+                        let datagram = result?;
+                        (
+                            datagram.bytes_received,
+                            std::net::SocketAddr::V4(datagram.source),
+                            "unicast",
+                            true,
+                        )
+                    }
+                    result = sd_fut => {
+                        let datagram = result?;
+                        (
+                            datagram.bytes_received,
+                            std::net::SocketAddr::V4(datagram.source),
+                            "sd-multicast",
+                            false,
+                        )
+                    }
                 }
             };
-            let data = &data[..len];
+            let data = if from_unicast {
+                &unicast_buf[..len]
+            } else {
+                &sd_buf[..len]
+            };
 
             // By default IP_MULTICAST_LOOP=false suppresses own multicast
             // messages on the SD socket, so no source-IP filtering is needed.
@@ -602,6 +770,7 @@ impl Server {
     }
 
     /// Handle a Service Discovery message
+    #[allow(clippy::too_many_lines)]
     async fn handle_sd_message(
         &mut self,
         sd_view: &sd::SdHeaderView<'_>,
@@ -628,7 +797,7 @@ impl Server {
                             self.config.service_id,
                             entry_view.service_id()
                         );
-                        self.send_subscribe_nack_from_view(&entry_view, sender, "Wrong service ID")
+                        self.send_subscribe_nack_from_view(&entry_view, sender, "wrong_service_id")
                             .await?;
                     } else if entry_view.instance_id() != self.config.instance_id {
                         tracing::warn!(
@@ -639,9 +808,54 @@ impl Server {
                         self.send_subscribe_nack_from_view(
                             &entry_view,
                             sender,
-                            "Wrong instance ID",
+                            "wrong_instance_id",
                         )
                         .await?;
+                    } else if entry_view.major_version() != self.config.major_version {
+                        // Per AUTOSAR SOME/IP-SD: a Subscribe whose
+                        // major_version disagrees with the server's
+                        // configured major must be NACKed (TTL=0). Without
+                        // this arm a client probing for a v2 service
+                        // against a v1 server would get an Ack and start
+                        // sending traffic that the application stack
+                        // would silently mis-decode.
+                        tracing::warn!(
+                            "Subscribe for wrong major_version: expected {}, got {}",
+                            self.config.major_version,
+                            entry_view.major_version()
+                        );
+                        if let Err(e) = self
+                            .send_subscribe_nack_from_view(
+                                &entry_view,
+                                sender,
+                                "wrong_major_version",
+                            )
+                            .await
+                        {
+                            tracing::warn!(error = %e, "SubscribeNack send failed");
+                        }
+                    } else if !self.config.accepts_event_group(entry_view.event_group_id()) {
+                        // Per AUTOSAR SOME/IP-SD, the event group must
+                        // be known to the server before subscription
+                        // can be granted. If `event_group_ids` is
+                        // populated and the request is for an
+                        // unrecognised group, NACK so the client
+                        // doesn't believe it's subscribed.
+                        tracing::warn!(
+                            "Subscribe for unknown event_group_id 0x{:04X} (service 0x{:04X})",
+                            entry_view.event_group_id(),
+                            entry_view.service_id()
+                        );
+                        if let Err(e) = self
+                            .send_subscribe_nack_from_view(
+                                &entry_view,
+                                sender,
+                                "unknown_event_group",
+                            )
+                            .await
+                        {
+                            tracing::warn!(error = %e, "SubscribeNack send failed");
+                        }
                     } else {
                         // Extract the subscriber endpoint from the entry's
                         // own options run. Each SD entry describes two runs
@@ -653,32 +867,82 @@ impl Server {
                         let first_count = entry_view.options_count().first_options_count as usize;
                         let second_index = entry_view.index_second_options_run() as usize;
                         let second_count = entry_view.options_count().second_options_count as usize;
-                        if let Some(endpoint_addr) = Self::extract_subscriber_endpoint(
+                        if let Some(endpoint_addr) = extract_subscriber_endpoint(
                             &sd_view.options(),
                             first_index,
                             first_count,
                             second_index,
                             second_count,
                         ) {
-                            let mut subs = self.subscriptions.write().await;
-                            subs.subscribe(
-                                entry_view.service_id(),
-                                entry_view.instance_id(),
-                                entry_view.event_group_id(),
-                                endpoint_addr,
-                            );
-
-                            // Send SubscribeAck
-                            self.send_subscribe_ack_from_view(&entry_view, sender)
-                                .await?;
+                            let subscribe_result = self
+                                .subscriptions
+                                .subscribe(
+                                    entry_view.service_id(),
+                                    entry_view.instance_id(),
+                                    entry_view.event_group_id(),
+                                    endpoint_addr,
+                                )
+                                .await;
+
+                            match subscribe_result {
+                                Ok(()) => {
+                                    // ACK the just-committed subscription. If the
+                                    // ACK send fails (transient transport error),
+                                    // roll back the subscription so we don't leak
+                                    // a committed-but-unacked entry — and log
+                                    // rather than propagate, so a single SD-socket
+                                    // hiccup doesn't tear down `run()`.
+                                    if let Err(e) =
+                                        self.send_subscribe_ack_from_view(&entry_view, sender).await
+                                    {
+                                        tracing::warn!(
+                                            error = %e,
+                                            service_id = entry_view.service_id(),
+                                            instance_id = entry_view.instance_id(),
+                                            event_group_id = entry_view.event_group_id(),
+                                            "SubscribeAck send failed; rolling back subscription"
+                                        );
+                                        self.subscriptions
+                                            .unsubscribe(
+                                                entry_view.service_id(),
+                                                entry_view.instance_id(),
+                                                entry_view.event_group_id(),
+                                                endpoint_addr,
+                                            )
+                                            .await;
+                                    }
+                                }
+                                Err(e) => {
+                                    // Capacity-rejected subscription: NACK so
+                                    // the client doesn't believe it's
+                                    // subscribed.
+                                    let reason: &'static str = match e {
+                                        SubscribeError::SubscribersPerGroupFull => {
+                                            "subscribers_per_group_full"
+                                        }
+                                        SubscribeError::EventGroupsFull => "event_groups_full",
+                                    };
+                                    tracing::debug!("Subscription rejected: {reason}");
+                                    if let Err(e) = self
+                                        .send_subscribe_nack_from_view(&entry_view, sender, reason)
+                                        .await
+                                    {
+                                        tracing::warn!(error = %e, "SubscribeNack send failed");
+                                    }
+                                }
+                            }
                         } else {
                             tracing::warn!("No endpoint found in Subscribe message options");
-                            self.send_subscribe_nack_from_view(
-                                &entry_view,
-                                sender,
-                                "No endpoint in options",
-                            )
-                            .await?;
+                            if let Err(e) = self
+                                .send_subscribe_nack_from_view(
+                                    &entry_view,
+                                    sender,
+                                    "no_endpoint_in_options",
+                                )
+                                .await
+                            {
+                                tracing::warn!(error = %e, "SubscribeNack send failed");
+                            }
                         }
                     }
                 }
@@ -692,7 +956,9 @@ impl Server {
                             find_service_id,
                             self.config.service_id
                         );
-                        self.send_unicast_offer(sender).await?;
+                        if let Err(e) = self.send_unicast_offer(sender).await {
+                            tracing::warn!(error = %e, "Unicast OfferService send failed");
+                        }
                     } else {
                         tracing::trace!(
                             "Ignoring FindService for service 0x{:04X} (not ours)",
@@ -708,94 +974,100 @@ impl Server {
 
         Ok(())
     }
+}
 
-    /// Extract a single subscriber endpoint from the options runs
-    /// associated with an SD entry.
-    ///
-    /// Each SD entry owns up to two options runs. A run is a contiguous
-    /// slice of the options array starting at `index_*_options_run` with
-    /// `*_options_count` entries. This helper walks both runs, collects
-    /// every `IpV4Endpoint` option it finds, returns the first, and logs
-    /// a `warn!` if more than one endpoint is present (we do not yet
-    /// support multi-endpoint subscribers — e.g. TCP+UDP — and will pick
-    /// an arbitrary one).
-    ///
-    /// Returns `None` if no `IpV4Endpoint` is found in either run.
-    fn extract_subscriber_endpoint(
-        options: &sd::OptionIter<'_>,
-        first_index: usize,
-        first_count: usize,
-        second_index: usize,
-        second_count: usize,
-    ) -> Option<SocketAddrV4> {
-        // Walk each run by cloning the iterator — `OptionIter` is a
-        // cheap view over borrowed bytes so `clone` is free. Taking
-        // `options` by reference lets the caller keep ownership and
-        // keeps the clippy `needless_pass_by_value` lint quiet.
-        //
-        // We only ever return the first `IpV4Endpoint` found, so rather
-        // than collect into a `Vec` (heap alloc on every Subscribe) we
-        // track the first hit in an `Option` and keep a count so the
-        // multi-endpoint warn path still reports how many additional
-        // endpoints were present. This keeps the SD receive loop
-        // allocation-free on the happy path.
-        let mut first_endpoint: Option<SocketAddrV4> = None;
-        let mut endpoint_count: usize = 0;
-        let mut ignored_other: usize = 0;
-
-        let mut walk_run = |index: usize, count: usize| {
-            if count == 0 {
-                return;
-            }
-            for option_view in options.clone().skip(index).take(count) {
-                match option_view.option_type() {
-                    Ok(sd::OptionType::IpV4Endpoint) => {
-                        if let Ok((ip, _, port)) = option_view.as_ipv4() {
-                            endpoint_count += 1;
-                            if first_endpoint.is_none() {
-                                first_endpoint = Some(SocketAddrV4::new(ip, port));
-                            }
+/// Convert a [`std::net::SocketAddr`] into a [`SocketAddrV4`] for the
+/// transport layer. SOME/IP-SD is IPv4-only at this layer; if a V6
+/// address ever surfaces here it indicates a misconfiguration upstream
+/// (a V6 socket binding the SD port, or a V6 source address surfaced
+/// by a transport that should not produce one). Returns
+/// [`TransportError::Unsupported`](crate::transport::TransportError::Unsupported)
+/// in that case so the caller can log and drop the message instead of panicking.
+fn socket_addr_v4(addr: std::net::SocketAddr) -> Result<SocketAddrV4, Error> {
+    match addr {
+        std::net::SocketAddr::V4(v4) => Ok(v4),
+        std::net::SocketAddr::V6(_) => Err(Error::Transport(
+            crate::transport::TransportError::Unsupported,
+        )),
+    }
+}
+
+/// Extract a single subscriber endpoint from the options runs associated with
+/// an SD entry. Walks both option runs, returns the first `IpV4Endpoint`
+/// found, and logs a `warn!` if more than one is present.
+fn extract_subscriber_endpoint(
+    options: &sd::OptionIter<'_>,
+    first_index: usize,
+    first_count: usize,
+    second_index: usize,
+    second_count: usize,
+) -> Option<SocketAddrV4> {
+    let mut first_endpoint: Option<SocketAddrV4> = None;
+    let mut endpoint_count: usize = 0;
+    let mut ignored_other: usize = 0;
+
+    let mut walk_run = |index: usize, count: usize| {
+        if count == 0 {
+            return;
+        }
+        for option_view in options.clone().skip(index).take(count) {
+            match option_view.option_type() {
+                Ok(sd::OptionType::IpV4Endpoint) => {
+                    if let Ok((ip, _, port)) = option_view.as_ipv4() {
+                        endpoint_count += 1;
+                        if first_endpoint.is_none() {
+                            first_endpoint = Some(SocketAddrV4::new(ip, port));
                         }
                     }
-                    Ok(_) | Err(_) => ignored_other += 1,
                 }
+                Ok(_) | Err(_) => ignored_other += 1,
             }
-        };
+        }
+    };
 
-        walk_run(first_index, first_count);
-        walk_run(second_index, second_count);
+    walk_run(first_index, first_count);
+    walk_run(second_index, second_count);
 
-        match endpoint_count {
-            0 => {
-                tracing::warn!(
-                    "No IPv4 endpoint in options runs \
-                     (first: idx={first_index}, count={first_count}; \
-                     second: idx={second_index}, count={second_count}; \
-                     ignored={ignored_other})"
-                );
-                None
-            }
-            1 => {
-                // Unwrap is safe: count == 1 implies we set `first_endpoint`.
-                let ep = first_endpoint.expect("endpoint_count=1 implies first_endpoint is Some");
-                tracing::trace!("Found IPv4 endpoint {}", ep);
-                Some(ep)
-            }
-            n => {
-                let ep = first_endpoint.expect("endpoint_count>=1 implies first_endpoint is Some");
-                tracing::warn!(
-                    "{} IPv4 endpoints found in subscribe options runs; \
-                     using first ({}) and ignoring {} additional. \
-                     Multi-endpoint (e.g. TCP+UDP) subscribers are not yet supported.",
-                    n,
-                    ep,
-                    n - 1
-                );
-                Some(ep)
-            }
+    match endpoint_count {
+        0 => {
+            tracing::warn!(
+                "No IPv4 endpoint in options runs \
+                 (first: idx={first_index}, count={first_count}; \
+                 second: idx={second_index}, count={second_count}; \
+                 ignored={ignored_other})"
+            );
+            None
+        }
+        1 => {
+            let ep = first_endpoint.expect("endpoint_count=1 implies first_endpoint is Some");
+            tracing::trace!("Found IPv4 endpoint {}", ep);
+            Some(ep)
+        }
+        n => {
+            let ep = first_endpoint.expect("endpoint_count>=1 implies first_endpoint is Some");
+            tracing::warn!(
+                "{} IPv4 endpoints found in subscribe options runs; \
+                 using first ({}) and ignoring {} additional. \
+                 Multi-endpoint (e.g. TCP+UDP) subscribers are not yet supported.",
+                n,
+                ep,
+                n - 1
+            );
+            Some(ep)
         }
     }
+}
 
+impl<R, S, F, Tm> Server<R, S, F, Tm>
+where
+    R: E2ERegistryHandle,
+    S: SubscriptionHandle,
+    F: TransportFactory + Send + Sync + 'static,
+    F::Socket: Send + Sync + 'static,
+    for<'a> <F::Socket as TransportSocket>::SendFuture<'a>: Send,
+    for<'a> <F::Socket as TransportSocket>::RecvFuture<'a>: Send,
+    Tm: Timer + Clone + Send + Sync + 'static,
+{
     /// Send `SubscribeAck` from an entry view
     async fn send_subscribe_ack_from_view(
         &self,
@@ -818,19 +1090,21 @@ impl Server {
         });
 
         let entries = [ack_entry];
-        let sd_payload = sd::Header::new(Flags::new(true, true), &entries, &[]);
-
-        let mut sd_data = Vec::new();
-        sd_payload.encode(&mut sd_data)?;
-
-        let sid = self.next_sd_session_id();
-        let someip_header = SomeIpHeader::new_sd(sid, sd_data.len());
-
-        let mut buffer = Vec::new();
-        someip_header.encode(&mut buffer)?;
-        buffer.extend_from_slice(&sd_data);
-
-        self.sd_socket.send_to(&buffer, subscriber).await?;
+        // Atomic (sid, reboot_flag) pair — see
+        // `SdStateManager::next_session_id_with_reboot_flag`.
+        let (sid, reboot_flag) = self.sd_state.next_session_id_with_reboot_flag();
+        let sd_payload = sd::Header::new(Flags::new_sd(reboot_flag), &entries, &[]);
+
+        let mut buffer = [0u8; crate::UDP_BUFFER_SIZE];
+        let sd_data_len = sd_payload.encode_to_slice(&mut buffer[16..])?;
+        let someip_header = SomeIpHeader::new_sd(sid, sd_data_len);
+        someip_header.encode_to_slice(&mut buffer[..16])?;
+        let total_len = 16 + sd_data_len;
+
+        let subscriber_v4 = socket_addr_v4(subscriber)?;
+        self.sd_socket
+            .send_to(&buffer[..total_len], subscriber_v4)
+            .await?;
 
         tracing::debug!(
             "Sent SubscribeAck to {} for service 0x{:04X}, eventgroup 0x{:04X}",
@@ -865,19 +1139,21 @@ impl Server {
         });
 
         let entries = [nack_entry];
-        let sd_payload = sd::Header::new(Flags::new(true, true), &entries, &[]);
-
-        let mut sd_data = Vec::new();
-        sd_payload.encode(&mut sd_data)?;
-
-        let sid = self.next_sd_session_id();
-        let someip_header = SomeIpHeader::new_sd(sid, sd_data.len());
-
-        let mut buffer = Vec::new();
-        someip_header.encode(&mut buffer)?;
-        buffer.extend_from_slice(&sd_data);
-
-        self.sd_socket.send_to(&buffer, subscriber).await?;
+        // Atomic (sid, reboot_flag) pair — see
+        // `SdStateManager::next_session_id_with_reboot_flag`.
+        let (sid, reboot_flag) = self.sd_state.next_session_id_with_reboot_flag();
+        let sd_payload = sd::Header::new(Flags::new_sd(reboot_flag), &entries, &[]);
+
+        let mut buffer = [0u8; crate::UDP_BUFFER_SIZE];
+        let sd_data_len = sd_payload.encode_to_slice(&mut buffer[16..])?;
+        let someip_header = SomeIpHeader::new_sd(sid, sd_data_len);
+        someip_header.encode_to_slice(&mut buffer[..16])?;
+        let total_len = 16 + sd_data_len;
+
+        let subscriber_v4 = socket_addr_v4(subscriber)?;
+        self.sd_socket
+            .send_to(&buffer[..total_len], subscriber_v4)
+            .await?;
 
         tracing::warn!(
             "Sent SubscribeNack to {} for service 0x{:04X}, eventgroup 0x{:04X} (reason: {})",
@@ -891,41 +1167,230 @@ impl Server {
     }
 }
 
-#[cfg(test)]
+#[cfg(all(test, feature = "server-tokio"))]
 mod tests {
     use super::*;
     use crate::protocol::{
         Header as SomeIpHeader, MessageType, MessageTypeField, MessageView, ReturnCode,
     };
+    use crate::tokio_transport::{TokioTimer, TokioTransport};
     use crate::traits::WireFormat;
     use std::format;
+    use std::net::IpAddr;
+    use tokio::net::UdpSocket;
+
+    /// Type alias bringing the tokio-flavor concrete type parameters back
+    /// into scope so tests can spell `TestServer::new(...)` without
+    /// chasing the four-type-parameter signature on every call site.
+    /// Mirrors the `TestClient` pattern from `tests/client_server.rs`.
+    type TestServer = Server<
+        Arc<Mutex<E2ERegistry>>,
+        Arc<RwLock<SubscriptionManager>>,
+        TokioTransport,
+        TokioTimer,
+    >;
 
     #[tokio::test]
     async fn test_server_creation() {
-        let config = ServerConfig::new(Ipv4Addr::new(127, 0, 0, 1), 30682, 0x5B, 1);
+        let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 30682, 0x5B, 1);
 
-        let server: Result<Server, _> = Server::new(config).await;
+        let server: Result<TestServer, _> = TestServer::new(config).await;
         assert!(server.is_ok());
     }
 
+    /// Regression for H5: `ServerConfig::accepts_event_group` must
+    /// accept any group when `event_group_ids` is empty (back-compat:
+    /// servers that have not enumerated their groups must keep
+    /// working) and validate strictly when populated.
+    #[test]
+    fn server_config_accepts_event_group_empty_means_any() {
+        let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 30490, 0x5B, 1);
+        assert!(config.event_group_ids.is_empty());
+        // Empty list: every group accepted.
+        assert!(config.accepts_event_group(0x0001));
+        assert!(config.accepts_event_group(0xBEEF));
+        assert!(config.accepts_event_group(0xFFFF));
+    }
+
+    #[test]
+    fn server_config_accepts_event_group_populated_validates() {
+        let mut config = ServerConfig::new(Ipv4Addr::LOCALHOST, 30490, 0x5B, 1);
+        config.event_group_ids.push(0x0001).unwrap();
+        config.event_group_ids.push(0x0042).unwrap();
+        assert!(config.accepts_event_group(0x0001));
+        assert!(config.accepts_event_group(0x0042));
+        assert!(!config.accepts_event_group(0x0002));
+        assert!(!config.accepts_event_group(0xBEEF));
+    }
+
+    /// Regression for H3: when `subscribe` succeeds but the
+    /// `SubscribeAck` send fails (transient transport error), the
+    /// just-committed subscription must be rolled back so the
+    /// manager isn't left holding a slot for a peer that never
+    /// received its ACK. `handle_sd_message` must also NOT propagate
+    /// the error via `?` — a single SD-socket hiccup tearing down
+    /// `run()` was the original bug.
+    #[tokio::test]
+    async fn handle_sd_message_rolls_back_subscription_on_failed_ack_send() {
+        use crate::transport::{IoErrorKind, ReceivedDatagram, TransportError};
+        use core::future::{Future, Ready, ready};
+        use core::pin::Pin;
+        use core::task::{Context, Poll};
+        use std::pin::Pin as StdPin;
+
+        // Socket whose `send_to` always fails. `recv_from` is never
+        // called by this test (we drive `handle_sd_message` directly).
+        struct FailingSocket {
+            local: SocketAddrV4,
+        }
+        struct FailingSend;
+        impl Future for FailingSend {
+            type Output = Result<(), TransportError>;
+            fn poll(self: Pin<&mut Self>, _cx: &mut Context<'_>) -> Poll<Self::Output> {
+                Poll::Ready(Err(TransportError::Io(IoErrorKind::NetworkUnreachable)))
+            }
+        }
+        impl TransportSocket for FailingSocket {
+            type SendFuture<'a> = FailingSend;
+            type RecvFuture<'a> = Ready<Result<ReceivedDatagram, TransportError>>;
+            fn send_to<'a>(&'a self, _b: &'a [u8], _t: SocketAddrV4) -> Self::SendFuture<'a> {
+                FailingSend
+            }
+            fn recv_from<'a>(&'a self, _b: &'a mut [u8]) -> Self::RecvFuture<'a> {
+                ready(Err(TransportError::Unsupported))
+            }
+            fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+                Ok(self.local)
+            }
+            fn join_multicast_v4(&self, _g: Ipv4Addr, _i: Ipv4Addr) -> Result<(), TransportError> {
+                Ok(())
+            }
+            fn leave_multicast_v4(&self, _g: Ipv4Addr, _i: Ipv4Addr) -> Result<(), TransportError> {
+                Ok(())
+            }
+        }
+
+        struct FailingFactory {
+            next_port: Arc<Mutex<u16>>,
+        }
+        impl TransportFactory for FailingFactory {
+            type Socket = FailingSocket;
+            type BindFuture<'a> = StdPin<
+                std::boxed::Box<
+                    dyn Future<Output = Result<Self::Socket, TransportError>> + Send + 'a,
+                >,
+            >;
+            fn bind<'a>(
+                &'a self,
+                addr: SocketAddrV4,
+                _options: &'a SocketOptions,
+            ) -> Self::BindFuture<'a> {
+                let port = if addr.port() == 0 {
+                    let mut p = self.next_port.lock().unwrap();
+                    *p = p.saturating_add(1);
+                    50000u16.saturating_add(*p)
+                } else {
+                    addr.port()
+                };
+                let local = SocketAddrV4::new(*addr.ip(), port);
+                std::boxed::Box::pin(async move { Ok(FailingSocket { local }) })
+            }
+        }
+
+        let factory = FailingFactory {
+            next_port: Arc::new(Mutex::new(0)),
+        };
+        let subscriptions = Arc::new(RwLock::new(SubscriptionManager::new()));
+        let deps = ServerDeps {
+            factory,
+            timer: TokioTimer,
+            e2e_registry: Arc::new(Mutex::new(E2ERegistry::new())),
+            subscriptions: subscriptions.clone(),
+        };
+        let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 0, 0x5B, 1);
+        let mut server = Server::new_with_deps(deps, config, false)
+            .await
+            .expect("create failing-socket server");
+
+        // Build a valid Subscribe; our service id/instance/major
+        // match the config's defaults, so the only failure point
+        // will be the ACK send.
+        let bytes = make_subscription_header(
+            0x5B,
+            1,
+            1,
+            3,
+            0x01,
+            Ipv4Addr::LOCALHOST,
+            sd::TransportProtocol::Udp,
+            45000,
+        );
+        let view = MessageView::parse(&bytes).expect("parse Subscribe");
+        let sd_view = view.sd_header().expect("Subscribe has SD header");
+        let sender = std::net::SocketAddr::V4(SocketAddrV4::new(Ipv4Addr::LOCALHOST, 45000));
+
+        // The H3 fix: handle_sd_message must NOT bubble the ACK send
+        // failure as Err — it logs and continues.
+        let result = server.handle_sd_message(&sd_view, sender).await;
+        assert!(
+            result.is_ok(),
+            "handle_sd_message must not propagate transient SD-socket I/O errors; got {result:?}"
+        );
+
+        // The H3 fix: a committed-but-unacked subscription must be
+        // rolled back, so the manager has 0 entries.
+        let subs = subscriptions.read().await;
+        assert_eq!(
+            subs.subscription_count(),
+            0,
+            "subscription must be rolled back after failed ACK send"
+        );
+    }
+
+    /// Regression for H4: `announcement_loop` must be idempotent.
+    /// Calling it a second time returns `Err(Error::Io(InvalidInput))`
+    /// so two announcement futures cannot race on the same SD socket
+    /// and session counter.
+    #[tokio::test]
+    async fn announcement_loop_second_call_returns_invalid_input() {
+        let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 30683, 0x5BB4, 1);
+        let server = TestServer::new(config).await.expect("create server");
+        let _first = server
+            .announcement_loop()
+            .expect("first announcement_loop call must succeed");
+        let second = server.announcement_loop();
+        match second {
+            Err(Error::Io(io_err)) => {
+                assert_eq!(io_err.kind(), std::io::ErrorKind::InvalidInput);
+                let msg = format!("{io_err}");
+                assert!(
+                    msg.contains("already started"),
+                    "expected the diagnostic to say 'already started', got: {msg}"
+                );
+            }
+            Ok(_) => panic!("second announcement_loop must error, got Ok"),
+            Err(other) => panic!("expected Error::Io(InvalidInput), got {other:?}"),
+        }
+    }
+
     #[tokio::test]
     async fn test_server_creation_with_loopback_enabled() {
         // Use a unicast port distinct from other tests to avoid EADDRINUSE
         // when the test binary runs tests in parallel. The SD socket binds
         // the SD multicast port (30490) and relies on SO_REUSEPORT, the same
         // as `test_server_creation`.
-        let config = ServerConfig::new(Ipv4Addr::new(127, 0, 0, 1), 30683, 0x5C, 1);
+        let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 30683, 0x5C, 1);
 
-        let server = Server::new_with_loopback(config, true)
+        let server = TestServer::new_with_loopback(config, true)
             .await
             .expect("new_with_loopback(true) should succeed on localhost");
 
         // Confirm the SD socket was actually configured with IP_MULTICAST_LOOP
         // enabled — this is the behavior the new code path is supposed to
         // produce and is what makes same-host testing possible.
-        let sock_ref = socket2::SockRef::from(&*server.sd_socket);
         assert!(
-            sock_ref
+            server
+                .sd_socket
                 .multicast_loop_v4()
                 .expect("multicast_loop_v4 getter should succeed"),
             "multicast loopback should be enabled on the SD socket",
@@ -960,19 +1425,22 @@ mod tests {
     }
 
     /// Helper: create a server on an ephemeral port and return (Server, port)
-    async fn create_test_server(service_id: u16, instance_id: u16) -> (Server, u16) {
+    async fn create_test_server(service_id: u16, instance_id: u16) -> (TestServer, u16) {
         // Use port 0 to get an ephemeral port
-        let config = ServerConfig::new(Ipv4Addr::new(127, 0, 0, 1), 0, service_id, instance_id);
-        let mut server = Server::new(config).await.expect("Failed to create server");
+        let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 0, service_id, instance_id);
+        let mut server = TestServer::new(config)
+            .await
+            .expect("Failed to create server");
         let port = match server.unicast_local_addr().unwrap() {
             std::net::SocketAddr::V4(addr) => addr.port(),
-            _ => panic!("Expected IPv4 address"),
+            std::net::SocketAddr::V6(_) => panic!("expected IPv4 address"),
         };
         // Update config to reflect actual bound port
         server.set_local_port(port);
         (server, port)
     }
 
+    #[allow(clippy::too_many_arguments)]
     fn make_subscription_header(
         service_id: u16,
         instance_id: u16,
@@ -1018,21 +1486,23 @@ mod tests {
             1,
             3,
             0x01,
-            Ipv4Addr::new(127, 0, 0, 1),
+            Ipv4Addr::LOCALHOST,
             sd::TransportProtocol::Udp,
             server_port,
         );
 
         // Send to the server
         client_socket
-            .send_to(&message, format!("127.0.0.1:{}", server_port))
+            .send_to(&message, format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
         // Run server to process one message (with a timeout)
         let server_handle = tokio::spawn(async move {
             let mut buf = vec![0u8; 65535];
-            let (len, addr) = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let datagram = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let len = datagram.bytes_received;
+            let addr = std::net::SocketAddr::V4(datagram.source);
             let data = &buf[..len];
             let view = MessageView::parse(data).unwrap();
             let sd_view = view.sd_header().unwrap();
@@ -1056,7 +1526,7 @@ mod tests {
         .unwrap();
 
         let ttl = parse_subscribe_ack_ttl(&resp_buf[..resp_len]);
-        assert!(ttl > 0, "Expected ACK (TTL > 0), got TTL={}", ttl);
+        assert!(ttl > 0, "Expected ACK (TTL > 0), got TTL={ttl}");
 
         server_handle.await.unwrap();
     }
@@ -1072,19 +1542,21 @@ mod tests {
             1,
             3,
             0x01,
-            Ipv4Addr::new(127, 0, 0, 1),
+            Ipv4Addr::LOCALHOST,
             sd::TransportProtocol::Udp,
             server_port,
         );
         client_socket
-            .send_to(&message, format!("127.0.0.1:{}", server_port))
+            .send_to(&message, format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
         // Process the message
         let server_handle = tokio::spawn(async move {
             let mut buf = vec![0u8; 65535];
-            let (len, addr) = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let datagram = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let len = datagram.bytes_received;
+            let addr = std::net::SocketAddr::V4(datagram.source);
             let data = &buf[..len];
             let view = MessageView::parse(data).unwrap();
             let sd_view = view.sd_header().unwrap();
@@ -1106,7 +1578,7 @@ mod tests {
         .unwrap();
 
         let ttl = parse_subscribe_ack_ttl(&resp_buf[..resp_len]);
-        assert_eq!(ttl, 0, "Expected NACK (TTL=0), got TTL={}", ttl);
+        assert_eq!(ttl, 0, "Expected NACK (TTL=0), got TTL={ttl}");
 
         server_handle.await.unwrap();
     }
@@ -1122,18 +1594,20 @@ mod tests {
             1,
             3,
             0x01,
-            Ipv4Addr::new(127, 0, 0, 1),
+            Ipv4Addr::LOCALHOST,
             sd::TransportProtocol::Udp,
             server_port,
         );
         client_socket
-            .send_to(&message, format!("127.0.0.1:{}", server_port))
+            .send_to(&message, format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
         let server_handle = tokio::spawn(async move {
             let mut buf = vec![0u8; 65535];
-            let (len, addr) = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let datagram = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let len = datagram.bytes_received;
+            let addr = std::net::SocketAddr::V4(datagram.source);
             let data = &buf[..len];
             let view = MessageView::parse(data).unwrap();
             let sd_view = view.sd_header().unwrap();
@@ -1153,7 +1627,7 @@ mod tests {
         .unwrap();
 
         let ttl = parse_subscribe_ack_ttl(&resp_buf[..resp_len]);
-        assert_eq!(ttl, 0, "Expected NACK (TTL=0), got TTL={}", ttl);
+        assert_eq!(ttl, 0, "Expected NACK (TTL=0), got TTL={ttl}");
 
         server_handle.await.unwrap();
     }
@@ -1173,14 +1647,16 @@ mod tests {
         );
         let message = build_sd_message(&sd_header);
         client_socket
-            .send_to(&message, format!("127.0.0.1:{}", server_port))
+            .send_to(&message, format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
         // Process the message on the unicast socket
         let server_handle = tokio::spawn(async move {
             let mut buf = vec![0u8; 65535];
-            let (len, addr) = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let datagram = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let len = datagram.bytes_received;
+            let addr = std::net::SocketAddr::V4(datagram.source);
             let data = &buf[..len];
             let view = MessageView::parse(data).unwrap();
             let sd_view = view.sd_header().unwrap();
@@ -1224,13 +1700,15 @@ mod tests {
         );
         let message = build_sd_message(&sd_header);
         client_socket
-            .send_to(&message, format!("127.0.0.1:{}", server_port))
+            .send_to(&message, format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
         let server_handle = tokio::spawn(async move {
             let mut buf = vec![0u8; 65535];
-            let (len, addr) = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let datagram = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let len = datagram.bytes_received;
+            let addr = std::net::SocketAddr::V4(datagram.source);
             let data = &buf[..len];
             let view = MessageView::parse(data).unwrap();
             let sd_view = view.sd_header().unwrap();
@@ -1271,13 +1749,15 @@ mod tests {
         );
         let message = build_sd_message(&sd_header);
         client_socket
-            .send_to(&message, format!("127.0.0.1:{}", server_port))
+            .send_to(&message, format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
         let server_handle = tokio::spawn(async move {
             let mut buf = vec![0u8; 65535];
-            let (len, addr) = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let datagram = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let len = datagram.bytes_received;
+            let addr = std::net::SocketAddr::V4(datagram.source);
             let data = &buf[..len];
             let view = MessageView::parse(data).unwrap();
             let sd_view = view.sd_header().unwrap();
@@ -1311,13 +1791,15 @@ mod tests {
         let message = build_sd_message(&sd_header);
 
         client_socket
-            .send_to(&message, format!("127.0.0.1:{}", server_port))
+            .send_to(&message, format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
         let server_handle = tokio::spawn(async move {
             let mut buf = vec![0u8; 65535];
-            let (len, addr) = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let datagram = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let len = datagram.bytes_received;
+            let addr = std::net::SocketAddr::V4(datagram.source);
             let data = &buf[..len];
             let view = MessageView::parse(data).unwrap();
             let sd_view = view.sd_header().unwrap();
@@ -1339,7 +1821,7 @@ mod tests {
         .unwrap();
 
         let ttl = parse_subscribe_ack_ttl(&resp_buf[..resp_len]);
-        assert_eq!(ttl, 0, "Expected NACK (TTL=0), got TTL={}", ttl);
+        assert_eq!(ttl, 0, "Expected NACK (TTL=0), got TTL={ttl}");
 
         server_handle.await.unwrap();
     }
@@ -1376,10 +1858,19 @@ mod tests {
         assert_eq!(entry.service_id(), 0x5B);
         assert_eq!(entry.instance_id(), 1);
 
-        // Also test that start_announcing doesn't error
+        // Also test that announcement_loop builds a future without error.
         drop(server);
         let (server2, _) = create_test_server(0x5B, 1).await;
-        assert!(server2.start_announcing().is_ok());
+        let fut = server2
+            .announcement_loop()
+            .expect("announcement_loop on a regular server must build");
+        // Intentionally do not poll or spawn the future: we only care
+        // that constructing it returned Ok. If this future were
+        // spawned, the announcer would loop indefinitely and emit
+        // multicast until explicitly aborted or the Tokio runtime
+        // shut down at end-of-test, which could interfere with
+        // parallel tests using the same multicast group.
+        drop(fut);
     }
 
     #[tokio::test]
@@ -1388,7 +1879,7 @@ mod tests {
         let client_socket = UdpSocket::bind("127.0.0.1:0").await.unwrap();
         let client_port = match client_socket.local_addr().unwrap() {
             std::net::SocketAddr::V4(a) => a.port(),
-            _ => panic!("expected v4"),
+            std::net::SocketAddr::V6(_) => panic!("expected v4 source address"),
         };
 
         let subscriptions = Arc::clone(&server.subscriptions);
@@ -1410,7 +1901,7 @@ mod tests {
         let mut non_sd_buf = Vec::new();
         non_sd_header.encode(&mut non_sd_buf).unwrap();
         client_socket
-            .send_to(&non_sd_buf, format!("127.0.0.1:{}", server_port))
+            .send_to(&non_sd_buf, format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
@@ -1422,12 +1913,12 @@ mod tests {
             1,
             3,
             0x01,
-            Ipv4Addr::new(127, 0, 0, 1),
+            Ipv4Addr::LOCALHOST,
             sd::TransportProtocol::Udp,
             client_port,
         );
         client_socket
-            .send_to(&message, format!("127.0.0.1:{}", server_port))
+            .send_to(&message, format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
@@ -1442,7 +1933,7 @@ mod tests {
         .unwrap();
 
         let ttl = parse_subscribe_ack_ttl(&resp_buf[..resp_len]);
-        assert!(ttl > 0, "Expected ACK (TTL > 0), got TTL={}", ttl);
+        assert!(ttl > 0, "Expected ACK (TTL > 0), got TTL={ttl}");
 
         // Verify subscription was added (non-SD message was ignored)
         let subs = subscriptions.read().await;
@@ -1457,7 +1948,7 @@ mod tests {
         let client_socket = UdpSocket::bind("127.0.0.1:0").await.unwrap();
         let client_port = match client_socket.local_addr().unwrap() {
             std::net::SocketAddr::V4(a) => a.port(),
-            _ => panic!("expected v4"),
+            std::net::SocketAddr::V6(_) => panic!("expected v4 source address"),
         };
 
         let subscriptions = Arc::clone(&server.subscriptions);
@@ -1468,7 +1959,7 @@ mod tests {
 
         // Send garbage bytes
         client_socket
-            .send_to(&[0xFF, 0xFE, 0xFD], format!("127.0.0.1:{}", server_port))
+            .send_to(&[0xFF, 0xFE, 0xFD], format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
@@ -1480,12 +1971,12 @@ mod tests {
             1,
             3,
             0x01,
-            Ipv4Addr::new(127, 0, 0, 1),
+            Ipv4Addr::LOCALHOST,
             sd::TransportProtocol::Udp,
             client_port,
         );
         client_socket
-            .send_to(&message, format!("127.0.0.1:{}", server_port))
+            .send_to(&message, format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
@@ -1500,7 +1991,7 @@ mod tests {
         .unwrap();
 
         let ttl = parse_subscribe_ack_ttl(&resp_buf[..resp_len]);
-        assert!(ttl > 0, "Expected ACK (TTL > 0), got TTL={}", ttl);
+        assert!(ttl > 0, "Expected ACK (TTL > 0), got TTL={ttl}");
 
         let subs = subscriptions.read().await;
         assert_eq!(subs.subscription_count(), 1);
@@ -1508,22 +1999,6 @@ mod tests {
         server_handle.abort();
     }
 
-    #[tokio::test]
-    async fn test_next_sd_session_id_wraps() {
-        let (server, _) = create_test_server(0x5B, 1).await;
-
-        // Set session ID to 0xFFFE
-        server.sd_session_id.store(0xFFFE, Ordering::Relaxed);
-
-        // First call: 0xFFFE -> 0xFFFF, returns 0xFFFF
-        let sid1 = server.next_sd_session_id();
-        assert_eq!(sid1, 0xFFFF);
-
-        // Second call: 0xFFFF -> wraps to 0x0001 (skipping 0), returns 0x0001
-        let sid2 = server.next_sd_session_id();
-        assert_eq!(sid2, 0x0001);
-    }
-
     #[tokio::test]
     async fn test_handle_sd_other_entry_type() {
         let (mut server, _) = create_test_server(0x5B, 1).await;
@@ -1565,18 +2040,20 @@ mod tests {
             1,
             3,
             0x01,
-            Ipv4Addr::new(127, 0, 0, 1),
+            Ipv4Addr::LOCALHOST,
             sd::TransportProtocol::Udp,
             server_port.wrapping_add(1), // Subscriber's port, different from server
         );
         client_socket
-            .send_to(&message, format!("127.0.0.1:{}", server_port))
+            .send_to(&message, format!("127.0.0.1:{server_port}"))
             .await
             .unwrap();
 
         let server_handle = tokio::spawn(async move {
             let mut buf = vec![0u8; 65535];
-            let (len, addr) = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let datagram = server.unicast_socket.recv_from(&mut buf).await.unwrap();
+            let len = datagram.bytes_received;
+            let addr = std::net::SocketAddr::V4(datagram.source);
             let data = &buf[..len];
             let view = MessageView::parse(data).unwrap();
             let sd_view = view.sd_header().unwrap();
@@ -1597,7 +2074,7 @@ mod tests {
         .unwrap();
 
         let ttl = parse_subscribe_ack_ttl(&resp_buf[..resp_len]);
-        assert!(ttl > 0, "Expected ACK (TTL > 0), got TTL={}", ttl);
+        assert!(ttl > 0, "Expected ACK (TTL > 0), got TTL={ttl}");
 
         server_handle.await.unwrap();
     }
@@ -1653,7 +2130,7 @@ mod tests {
         let total = fill_ipv4_endpoints(&mut buf, 1, 30000);
         let iter = sd::OptionIter::new(&buf[..total]);
 
-        let got = Server::extract_subscriber_endpoint(&iter, 0, 1, 0, 0);
+        let got = extract_subscriber_endpoint(&iter, 0, 1, 0, 0);
         assert_eq!(
             got,
             Some(SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 30000))
@@ -1663,7 +2140,7 @@ mod tests {
     #[test]
     fn extract_endpoint_zero_options_in_both_runs_returns_none() {
         let iter = sd::OptionIter::new(&[]);
-        assert_eq!(Server::extract_subscriber_endpoint(&iter, 0, 0, 0, 0), None);
+        assert_eq!(extract_subscriber_endpoint(&iter, 0, 0, 0, 0), None);
     }
 
     #[test]
@@ -1675,7 +2152,7 @@ mod tests {
         let total = fill_ipv4_endpoints(&mut buf, 2, 30100);
         let iter = sd::OptionIter::new(&buf[..total]);
 
-        assert_eq!(Server::extract_subscriber_endpoint(&iter, 1, 0, 0, 0), None);
+        assert_eq!(extract_subscriber_endpoint(&iter, 1, 0, 0, 0), None);
     }
 
     #[test]
@@ -1687,7 +2164,7 @@ mod tests {
         let total = fill_ipv4_endpoints(&mut buf, 2, 30200);
         let iter = sd::OptionIter::new(&buf[..total]);
 
-        let got = Server::extract_subscriber_endpoint(&iter, 0, 2, 0, 0);
+        let got = extract_subscriber_endpoint(&iter, 0, 2, 0, 0);
         assert_eq!(
             got,
             Some(SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 30200))
@@ -1706,7 +2183,7 @@ mod tests {
         let total = fill_ipv4_endpoints(&mut buf, 3, 30300);
         let iter = sd::OptionIter::new(&buf[..total]);
 
-        let got = Server::extract_subscriber_endpoint(&iter, 0, 1, 2, 1);
+        let got = extract_subscriber_endpoint(&iter, 0, 1, 2, 1);
         assert_eq!(
             got,
             Some(SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 30300))
@@ -1721,7 +2198,7 @@ mod tests {
         let total = fill_ipv4_endpoints(&mut buf, 4, 30400);
         let iter = sd::OptionIter::new(&buf[..total]);
 
-        let got = Server::extract_subscriber_endpoint(&iter, 2, 1, 0, 0);
+        let got = extract_subscriber_endpoint(&iter, 2, 1, 0, 0);
         assert_eq!(
             got,
             Some(SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 30402))
@@ -1737,7 +2214,7 @@ mod tests {
         let iter = sd::OptionIter::new(&buf[..total]);
 
         // Take only 1 option starting at index 1 -> port 30501.
-        let got = Server::extract_subscriber_endpoint(&iter, 1, 1, 0, 0);
+        let got = extract_subscriber_endpoint(&iter, 1, 1, 0, 0);
         assert_eq!(
             got,
             Some(SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 30501))
@@ -1761,7 +2238,7 @@ mod tests {
         offset += write_load_balancing_option(&mut buf[offset..], 3, 4);
         let iter = sd::OptionIter::new(&buf[..offset]);
 
-        let got = Server::extract_subscriber_endpoint(&iter, 0, 3, 0, 0);
+        let got = extract_subscriber_endpoint(&iter, 0, 3, 0, 0);
         assert_eq!(
             got,
             Some(SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 30600))
@@ -1776,7 +2253,7 @@ mod tests {
         offset += write_load_balancing_option(&mut buf[offset..], 3, 4);
         let iter = sd::OptionIter::new(&buf[..offset]);
 
-        assert_eq!(Server::extract_subscriber_endpoint(&iter, 0, 2, 0, 0), None);
+        assert_eq!(extract_subscriber_endpoint(&iter, 0, 2, 0, 0), None);
     }
 
     #[test]
@@ -1787,7 +2264,7 @@ mod tests {
         let total = fill_ipv4_endpoints(&mut buf, 2, 30700);
         let iter = sd::OptionIter::new(&buf[..total]);
 
-        let got = Server::extract_subscriber_endpoint(&iter, 0, 0, 1, 1);
+        let got = extract_subscriber_endpoint(&iter, 0, 0, 1, 1);
         assert_eq!(
             got,
             Some(SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 30701))
@@ -1862,20 +2339,19 @@ mod tests {
         // datagram. We drive `handle_sd_message` directly rather than
         // `server.run()` so we can assert state after the call.
         let client_socket = UdpSocket::bind("127.0.0.1:0").await.unwrap();
-        let sd_addr = match server.sd_socket.local_addr().unwrap() {
-            std::net::SocketAddr::V4(v4) => v4,
-            std::net::SocketAddr::V6(_) => panic!("expected v4 sd socket"),
-        };
+        let sd_addr = server.sd_socket.local_addr().unwrap();
         client_socket.send_to(&message, sd_addr).await.unwrap();
 
         let mut buf = vec![0u8; 65_535];
-        let (len, sender) = tokio::time::timeout(
+        let datagram = tokio::time::timeout(
             std::time::Duration::from_secs(2),
             server.sd_socket.recv_from(&mut buf),
         )
         .await
         .expect("timeout receiving combined SD packet")
         .unwrap();
+        let len = datagram.bytes_received;
+        let sender = std::net::SocketAddr::V4(datagram.source);
         let view = MessageView::parse(&buf[..len]).unwrap();
         let sd_view = view.sd_header().unwrap();
         server.handle_sd_message(&sd_view, sender).await.unwrap();
@@ -1913,9 +2389,9 @@ mod tests {
 
     /// Construct a passive server on loopback with an ephemeral unicast
     /// port. Tests use this as a standard fixture.
-    async fn make_passive_server(service_id: u16, instance_id: u16) -> Server {
+    async fn make_passive_server(service_id: u16, instance_id: u16) -> TestServer {
         let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 0, service_id, instance_id);
-        Server::new_passive(config)
+        TestServer::new_passive(config)
             .await
             .expect("new_passive should succeed")
     }
@@ -1944,16 +2420,11 @@ mod tests {
         // the same module.
         let server = make_passive_server(0x005C, 0x0001).await;
         let sd_addr = server.sd_socket.local_addr().unwrap();
-        match sd_addr {
-            std::net::SocketAddr::V4(v4) => {
-                assert_ne!(
-                    v4.port(),
-                    30490,
-                    "passive SD socket must not bind the SOME/IP SD port"
-                );
-            }
-            std::net::SocketAddr::V6(_) => panic!("expected IPv4 SD address"),
-        }
+        assert_ne!(
+            sd_addr.port(),
+            30490,
+            "passive SD socket must not bind the SOME/IP SD port"
+        );
     }
 
     #[tokio::test]
@@ -1969,7 +2440,8 @@ mod tests {
         let subscriber = SocketAddrV4::new(Ipv4Addr::new(127, 0, 0, 2), 40_000);
         publisher
             .register_subscriber(0x005C, 0x0001, 0x0001, subscriber)
-            .await;
+            .await
+            .unwrap();
 
         assert!(publisher.has_subscribers(0x005C, 0x0001, 0x0001).await);
         assert_eq!(publisher.subscriber_count(0x005C, 0x0001, 0x0001).await, 1);
@@ -1982,11 +2454,12 @@ mod tests {
     }
 
     #[tokio::test]
-    async fn start_announcing_on_passive_returns_invalid_input() {
+    async fn announcement_loop_on_passive_returns_invalid_input() {
         let server = make_passive_server(0x005C, 0x0001).await;
         let err = server
-            .start_announcing()
-            .expect_err("start_announcing on a passive server must fail");
+            .announcement_loop()
+            .err()
+            .expect("announcement_loop on a passive server must fail");
         match err {
             Error::Io(io_err) => {
                 assert_eq!(io_err.kind(), std::io::ErrorKind::InvalidInput);
@@ -2029,18 +2502,114 @@ mod tests {
     }
 
     #[tokio::test]
-    async fn start_announcing_on_regular_server_still_succeeds() {
-        // Regression guard: the new is_passive check must not break the
+    async fn announcement_loop_on_regular_server_still_succeeds() {
+        // Regression guard: the is_passive check must not break the
         // standard non-passive path.
         let (server, _port) = create_test_server(0x005C, 0x0001).await;
-        server
-            .start_announcing()
-            .expect("start_announcing on a regular server must still succeed");
-        // The announcer task runs forever; the test succeeds as soon as
-        // start_announcing returns Ok. The spawned task is cleaned up
-        // when the Tokio test runtime shuts down at the end of this
-        // test — `tokio::spawn` tasks are not aborted by dropping
-        // unrelated handles, they ride the runtime lifecycle.
+        let fut = server
+            .announcement_loop()
+            .expect("announcement_loop on a regular server must build");
+        // The announcer loops forever; the test succeeds as soon as
+        // construction returns Ok.
+        // Do not poll or spawn the future: doing so would leave the
+        // announcer running and emitting multicast for the rest of the
+        // test binary's lifetime, interfering with parallel tests that
+        // bind the same multicast group. We only care that construction
+        // returned Ok, so drop the future without polling it.
+        drop(fut);
+    }
+
+    /// Direct test that `announcement_loop` actually emits an SD
+    /// announcement when driven. Explicit coverage for the primary entry
+    /// point (avoids regressions where only the deleted shim was exercised).
+    #[ignore = "requires MULTICAST on loopback; consistent with the \
+                #[ignore]-gated sd_state.rs tests. Runs in any environment \
+                where loopback multicast is available."]
+    #[tokio::test]
+    async fn announcement_loop_sends_offer_service_when_driven() {
+        use crate::protocol::MessageId;
+
+        // Use service/instance IDs not used elsewhere in this test module
+        // so parallel tests joined to the same SD multicast group cannot
+        // produce false matches.
+        const SID: u16 = 0xAA01;
+        const IID: u16 = 0xFF01;
+
+        // Bind a receiver on the SD multicast port with loopback so we
+        // actually see the outgoing announcement. Use a dedicated
+        // receiver socket via socket2 to match the SD bind pattern.
+        let iface = std::net::Ipv4Addr::LOCALHOST;
+        let recv = {
+            let s = socket2::Socket::new(
+                socket2::Domain::IPV4,
+                socket2::Type::DGRAM,
+                Some(socket2::Protocol::UDP),
+            )
+            .unwrap();
+            s.set_reuse_address(true).unwrap();
+            #[cfg(unix)]
+            s.set_reuse_port(true).unwrap();
+            s.bind(&std::net::SocketAddr::new(IpAddr::V4(iface), sd::MULTICAST_PORT).into())
+                .unwrap();
+            s.set_nonblocking(true).unwrap();
+            let std_s: std::net::UdpSocket = s.into();
+            let rs = tokio::net::UdpSocket::from_std(std_s).unwrap();
+            rs.join_multicast_v4(sd::MULTICAST_IP, iface).unwrap();
+            rs
+        };
+
+        let config = ServerConfig::new(iface, 30501, SID, IID);
+        let server = TestServer::new_with_loopback(config, true).await.unwrap();
+        let fut = server.announcement_loop().expect("build loop");
+        let handle = tokio::spawn(fut);
+
+        // Filter out any stray SD traffic from other parallel tests
+        // until we see one whose OfferService entry carries OUR sid/iid.
+        // Bounded by a single outer timeout so a totally-silent server
+        // (the regression we actually care about) still fails the test.
+        let mut buf = [0u8; 1500];
+        let offer_fields = tokio::time::timeout(std::time::Duration::from_secs(3), async {
+            loop {
+                let (n, _src) = recv.recv_from(&mut buf).await.expect("recv failed");
+                let Ok(view) = crate::protocol::MessageView::parse(&buf[..n]) else {
+                    continue;
+                };
+                if view.header().message_id() != MessageId::SD {
+                    continue;
+                }
+                let Ok(sd_view) = view.sd_header() else {
+                    continue;
+                };
+                let Some(entry) = sd_view.entries().next() else {
+                    continue;
+                };
+                if !matches!(entry.entry_type(), Ok(sd::EntryType::OfferService)) {
+                    continue;
+                }
+                if entry.service_id() != SID || entry.instance_id() != IID {
+                    continue;
+                }
+                break (
+                    entry.service_id(),
+                    entry.instance_id(),
+                    entry.major_version(),
+                    entry.ttl(),
+                );
+            }
+        })
+        .await
+        .expect("timed out waiting for our OfferService");
+
+        let (svc, inst, major, ttl) = offer_fields;
+        assert_eq!(svc, SID, "emitted service_id must match server config");
+        assert_eq!(inst, IID, "emitted instance_id must match server config");
+        assert_eq!(major, 1, "default major_version from ServerConfig::new");
+        assert!(
+            ttl > 0,
+            "OfferService TTL must be non-zero (TTL=0 means StopOffering)",
+        );
+
+        handle.abort();
     }
 
     #[tokio::test]
@@ -2057,12 +2626,8 @@ mod tests {
         // Different placeholder ports.
         assert_ne!(addr_a, addr_b);
         // And neither is 30490.
-        if let std::net::SocketAddr::V4(v4) = addr_a {
-            assert_ne!(v4.port(), 30490);
-        }
-        if let std::net::SocketAddr::V4(v4) = addr_b {
-            assert_ne!(v4.port(), 30490);
-        }
+        assert_ne!(addr_a.port(), 30490);
+        assert_ne!(addr_b.port(), 30490);
     }
 
     #[tokio::test]
@@ -2079,11 +2644,17 @@ mod tests {
         };
 
         let config = ServerConfig::new(Ipv4Addr::LOCALHOST, blocker_port, 0x005C, 0x0001);
-        let result = Server::new_passive(config).await;
+        let result = TestServer::new_passive(config).await;
         let Err(err) = result else {
             panic!("new_passive must fail when the unicast port is taken");
         };
         match err {
+            // The bind path goes through the `TransportFactory` trait,
+            // so port collisions surface as
+            // `Error::Transport(TransportError::AddressInUse)` instead
+            // of `Error::Io`. Both variants are accepted to keep the
+            // test stable across future transport-error refactors.
+            Error::Transport(crate::transport::TransportError::AddressInUse) => {}
             Error::Io(io_err) => {
                 assert!(
                     matches!(
@@ -2094,7 +2665,7 @@ mod tests {
                     io_err.kind()
                 );
             }
-            other => panic!("expected Error::Io, got {other:?}"),
+            other => panic!("expected Error::Io or Error::Transport(AddressInUse), got {other:?}"),
         }
         drop(blocker);
     }
@@ -2155,17 +2726,14 @@ mod tests {
         with_default(subscriber, || {
             // 0 endpoints → warn! "No IPv4 endpoint" branch.
             let iter_empty = sd::OptionIter::new(&[]);
-            assert_eq!(
-                Server::extract_subscriber_endpoint(&iter_empty, 0, 0, 0, 0),
-                None
-            );
+            assert_eq!(extract_subscriber_endpoint(&iter_empty, 0, 0, 0, 0), None);
 
             // 1 endpoint → trace! "Found IPv4 endpoint" branch.
             let mut buf_one = [0u8; 32];
             let len_one = fill_ipv4_endpoints(&mut buf_one, 1, 31000);
             let iter_one = sd::OptionIter::new(&buf_one[..len_one]);
             assert_eq!(
-                Server::extract_subscriber_endpoint(&iter_one, 0, 1, 0, 0),
+                extract_subscriber_endpoint(&iter_one, 0, 1, 0, 0),
                 Some(SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 31000))
             );
 
@@ -2174,9 +2742,89 @@ mod tests {
             let len_many = fill_ipv4_endpoints(&mut buf_many, 3, 31100);
             let iter_many = sd::OptionIter::new(&buf_many[..len_many]);
             assert_eq!(
-                Server::extract_subscriber_endpoint(&iter_many, 0, 3, 0, 0),
+                extract_subscriber_endpoint(&iter_many, 0, 3, 0, 0),
                 Some(SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 31100))
             );
         });
     }
+
+    /// Smoke test for [`Server::announcement_loop`]: a loopback server
+    /// with `multicast_loop` enabled should emit at least one
+    /// `OfferService` on the SD multicast group within a couple of
+    /// seconds.
+    ///
+    /// `#[ignore]`d for the same reason as the `sd_state` tests — hosts
+    /// without the MULTICAST flag on `lo` drop the packet silently. The
+    /// announcer task is captured and aborted at the end of the test so
+    /// it does not leak multicast traffic into other parallel tests.
+    #[ignore = "requires loopback multicast support (MULTICAST on lo)"]
+    #[tokio::test]
+    async fn announcement_loop_emits_first_offer_within_timeout() {
+        use crate::protocol::MessageView;
+        use crate::protocol::sd::EntryType;
+
+        let interface = Ipv4Addr::LOCALHOST;
+        // Pick a service_id and unicast port that do not collide with
+        // the other loopback-enabled server test in this file.
+        let service_id = 0xFE02;
+        let config = ServerConfig::new(interface, 30684, service_id, 0x43);
+
+        // Receiver joined to the SD multicast group on loopback.
+        let raw_rx = socket2::Socket::new(
+            socket2::Domain::IPV4,
+            socket2::Type::DGRAM,
+            Some(socket2::Protocol::UDP),
+        )
+        .unwrap();
+        raw_rx.set_reuse_address(true).unwrap();
+        #[cfg(unix)]
+        raw_rx.set_reuse_port(true).unwrap();
+        raw_rx.set_multicast_loop_v4(true).unwrap();
+        raw_rx
+            .bind(&std::net::SocketAddr::new(IpAddr::V4(interface), sd::MULTICAST_PORT).into())
+            .unwrap();
+        raw_rx.set_nonblocking(true).unwrap();
+        let rx: UdpSocket = UdpSocket::from_std(raw_rx.into()).unwrap();
+        rx.join_multicast_v4(sd::MULTICAST_IP, interface).unwrap();
+
+        let server = TestServer::new_with_loopback(config, true)
+            .await
+            .expect("server must bind with loopback enabled");
+        let announce_fut = server
+            .announcement_loop()
+            .expect("announcement_loop should build on a non-passive server");
+        let announce_handle = tokio::spawn(announce_fut);
+
+        // Scan the multicast group for our OfferService. The first tick
+        // happens immediately; 2s is ample headroom for scheduler jitter.
+        let recv_loop = async {
+            let mut buf = [0u8; 2048];
+            loop {
+                let (len, _from) = rx.recv_from(&mut buf).await.expect("recv_from");
+                let Ok(view) = MessageView::parse(&buf[..len]) else {
+                    continue;
+                };
+                if view.header().message_id().service_id() != 0xFFFF {
+                    continue;
+                }
+                let Ok(sd_view) = view.sd_header() else {
+                    continue;
+                };
+                let Some(entry) = sd_view.entries().next() else {
+                    continue;
+                };
+                if !matches!(entry.entry_type(), Ok(EntryType::OfferService)) {
+                    continue;
+                }
+                if entry.service_id() == service_id {
+                    return;
+                }
+            }
+        };
+        tokio::time::timeout(std::time::Duration::from_secs(2), recv_loop)
+            .await
+            .expect("announcement_loop should emit at least one OfferService within 2s");
+        announce_handle.abort();
+        let _ = announce_handle.await;
+    }
 }
diff --git a/src/server/sd_state.rs b/src/server/sd_state.rs
new file mode 100644
index 0000000..2deec16
--- /dev/null
+++ b/src/server/sd_state.rs
@@ -0,0 +1,681 @@
+//! Service Discovery session-state tracking, decoupled from socket ownership.
+//!
+//! [`SdStateManager`] owns the session-ID counter used by every outgoing
+//! SOME/IP-SD message this server emits (`OfferService` announcements,
+//! unicast Offer replies, `SubscribeAck`, `SubscribeNack`). It also builds
+//! and sends `OfferService` announcements when given a socket.
+//!
+//! Keeping this state in its own type prepares the server for upcoming
+//! transport abstraction: once `TransportSocket` lands, the `&UdpSocket`
+//! parameter on [`SdStateManager::send_offer_service`] becomes the single
+//! migration point for the announcement path.
+
+use core::sync::atomic::{AtomicU32, Ordering};
+use std::net::SocketAddrV4;
+
+use crate::protocol::sd::{
+    self, Entry, Flags, OptionsCount, RebootFlag, ServiceEntry, TransportProtocol,
+};
+use crate::transport::TransportSocket;
+
+use super::{Error, ServerConfig};
+
+/// Tracks the SD session-ID counter and emits `OfferService` announcements.
+///
+/// Session IDs increment with each SD message and wrap from `0xFFFF` back
+/// to `0x0001` (skipping `0`, which is reserved). Per AUTOSAR SOME/IP-SD,
+/// the reboot flag on emitted SD messages is
+/// [`RebootFlag::RecentlyRebooted`] from startup until the counter wraps
+/// once, then [`RebootFlag::Continuous`] permanently — `SdStateManager`
+/// tracks that transition and exposes it via [`Self::reboot_flag`] so every
+/// server-side SD emission path reads from a single source of truth.
+#[derive(Debug)]
+pub(super) struct SdStateManager {
+    /// Packed `(has_wrapped, session_id)` state.
+    ///
+    /// - bits 0..16: current session id (1..=0xFFFF, never 0).
+    /// - bit 16: `has_wrapped` flag — once set, never cleared.
+    /// - bits 17..32: reserved, must remain 0.
+    ///
+    /// Packed into a single `AtomicU32` so a single `fetch_update`
+    /// produces a consistent `(session_id, reboot_flag)` pair across
+    /// concurrent emitters around the `0xFFFF → 0x0001` wrap boundary.
+    /// Two separate atomics could be interleaved by another emitter
+    /// between the increment and the wrap-flag latch; with one atomic,
+    /// the pair is computed in one CAS step.
+    session_state: AtomicU32,
+}
+
+const SID_MASK: u32 = 0xFFFF;
+const WRAPPED_BIT: u32 = 1 << 16;
+
+impl SdStateManager {
+    pub(super) const fn new() -> Self {
+        Self::with_initial(1)
+    }
+
+    /// Construct with a specific starting session counter. Primarily used by
+    /// tests to validate wrap behavior; callers in production should use
+    /// [`Self::new`].
+    pub(super) const fn with_initial(initial: u16) -> Self {
+        Self {
+            // has_wrapped starts false; session_id starts at `initial`.
+            session_state: AtomicU32::new(initial as u32),
+        }
+    }
+
+    /// Advance the counter and return the next SOME/IP-SD session ID
+    /// (`client_id = 0`, session ID in the low 16 bits) together with the
+    /// reboot flag that *belongs to this same emission*. Skips 0 on wrap,
+    /// and latches the `has_wrapped` bit the first time the counter
+    /// crosses the `0xFFFF → 0x0001` boundary so the reboot flag flips
+    /// to [`RebootFlag::Continuous`] permanently.
+    ///
+    /// `(session_id, reboot_flag)` is computed atomically inside one
+    /// `fetch_update` so concurrent emitters always agree on the pair.
+    /// A previous implementation used two separate atomics and could
+    /// race around the wrap boundary, advertising
+    /// `(0xFFFF, Continuous)` or `(0x0001, RecentlyRebooted)` — both
+    /// violations of AUTOSAR SOME/IP-SD's stated semantics that the
+    /// wrap message itself carries `Continuous`.
+    pub(super) fn next_session_id_with_reboot_flag(&self) -> (u32, RebootFlag) {
+        let prev_state = self
+            .session_state
+            .fetch_update(Ordering::AcqRel, Ordering::Acquire, |state| {
+                let prev_sid = (state & SID_MASK) as u16;
+                let prev_wrapped = (state & WRAPPED_BIT) != 0;
+                let next_sid = match prev_sid.wrapping_add(1) {
+                    0 => 1u16,
+                    n => n,
+                };
+                // Latch wrap on the 0xFFFF → 0x0001 transition.
+                let next_wrapped = prev_wrapped || prev_sid == u16::MAX;
+                let next_state =
+                    (u32::from(next_sid)) | (if next_wrapped { WRAPPED_BIT } else { 0 });
+                Some(next_state)
+            })
+            .unwrap();
+        // Re-derive the new state from the prev we observed; this is
+        // the *same* computation the closure performed and produces
+        // exactly the new state we just stored.
+        let prev_sid = (prev_state & SID_MASK) as u16;
+        let prev_wrapped = (prev_state & WRAPPED_BIT) != 0;
+        let next_sid = match prev_sid.wrapping_add(1) {
+            0 => 1u16,
+            n => n,
+        };
+        let next_wrapped = prev_wrapped || prev_sid == u16::MAX;
+        let session_id = u32::from(next_sid);
+        let reboot_flag = if next_wrapped {
+            RebootFlag::Continuous
+        } else {
+            RebootFlag::RecentlyRebooted
+        };
+        (session_id, reboot_flag)
+    }
+
+    /// Convenience: advance the counter and return only the session id.
+    /// Use [`Self::next_session_id_with_reboot_flag`] when the same
+    /// emission also needs the reboot flag — calling these two methods
+    /// separately races around the wrap boundary. Only used by unit
+    /// tests; production paths take the atomic pair.
+    #[cfg(test)]
+    pub(super) fn next_session_id(&self) -> u32 {
+        self.next_session_id_with_reboot_flag().0
+    }
+
+    /// Current SD reboot flag for this server.
+    ///
+    /// Returns [`RebootFlag::RecentlyRebooted`] until the session counter
+    /// has wrapped past `0xFFFF` at least once, then
+    /// [`RebootFlag::Continuous`] permanently. Production emission paths
+    /// must use [`Self::next_session_id_with_reboot_flag`] instead to
+    /// avoid a TOCTOU race around the wrap boundary; this accessor is
+    /// `#[cfg(test)]`-only so future code cannot accidentally reach for
+    /// the racy pair.
+    #[cfg(test)]
+    pub(super) fn reboot_flag(&self) -> RebootFlag {
+        if (self.session_state.load(Ordering::Acquire) & WRAPPED_BIT) != 0 {
+            RebootFlag::Continuous
+        } else {
+            RebootFlag::RecentlyRebooted
+        }
+    }
+
+    /// Send a multicast `OfferService` announcement for the given config.
+    pub(super) async fn send_offer_service<T: TransportSocket>(
+        &self,
+        config: &ServerConfig,
+        socket: &T,
+    ) -> Result<(), Error> {
+        use crate::protocol::Header as SomeIpHeader;
+        use crate::traits::WireFormat;
+
+        let entry = Entry::OfferService(ServiceEntry {
+            index_first_options_run: 0,
+            index_second_options_run: 0,
+            options_count: OptionsCount::new(1, 0),
+            service_id: config.service_id,
+            instance_id: config.instance_id,
+            major_version: config.major_version,
+            ttl: config.ttl,
+            minor_version: config.minor_version,
+        });
+
+        let option = sd::Options::IpV4Endpoint {
+            ip: config.interface,
+            port: config.local_port,
+            protocol: TransportProtocol::Udp,
+        };
+
+        let entries = [entry];
+        let options = [option];
+        // Atomic (sid, reboot_flag) pair so that concurrent emissions
+        // around the wrap boundary cannot disagree about whether this
+        // very message advertises `RecentlyRebooted` or `Continuous`.
+        // See `next_session_id_with_reboot_flag` docs for the race.
+        let (sid, reboot_flag) = self.next_session_id_with_reboot_flag();
+        let sd_payload = sd::Header::new(Flags::new_sd(reboot_flag), &entries, &options);
+
+        // Stack-allocated send buffer — alloc-free per-tick path.
+        // 16-byte SOME/IP header + the SD payload, capped at the UDP
+        // datagram limit.
+        let mut buffer = [0u8; crate::UDP_BUFFER_SIZE];
+        let sd_data_len = sd_payload.encode_to_slice(&mut buffer[16..])?;
+        let someip_header = SomeIpHeader::new_sd(sid, sd_data_len);
+        someip_header.encode_to_slice(&mut buffer[..16])?;
+        let total_len = 16 + sd_data_len;
+
+        let multicast_addr = SocketAddrV4::new(sd::MULTICAST_IP, sd::MULTICAST_PORT);
+
+        tracing::trace!(
+            "Sending OfferService: service=0x{:04X}, instance={}, port={}, size={} bytes",
+            config.service_id,
+            config.instance_id,
+            config.local_port,
+            total_len
+        );
+        tracing::trace!("OfferService data: {:02X?}", &buffer[..total_len.min(64)]);
+
+        socket.send_to(&buffer[..total_len], multicast_addr).await?;
+        tracing::trace!("Sent to {}", multicast_addr);
+
+        Ok(())
+    }
+}
+
+#[cfg(all(test, feature = "server-tokio"))]
+mod tests {
+    use super::{SdStateManager, ServerConfig};
+    use crate::protocol::sd::{self, EntryType, Flags, RebootFlag, TransportProtocol};
+    use crate::protocol::{MessageType, MessageView, ReturnCode};
+    use crate::tokio_transport::TokioSocket;
+    use crate::transport::{SocketOptions, TransportFactory};
+    use std::net::{IpAddr, Ipv4Addr, SocketAddr, SocketAddrV4};
+    use std::time::Duration;
+    use tokio::net::UdpSocket;
+
+    /// Test-only `service_id` for `send_offer_service` tests. Distinct from
+    /// the 0x5B / 0x5C values used elsewhere in this crate so that parallel
+    /// tests joined to the same SD multicast group do not produce false
+    /// matches. If you add a new test that emits a multicast `OfferService`,
+    /// give it its own dedicated `service_id` too.
+    const TEST_SERVICE_ID: u16 = 0xFE01;
+    const TEST_INSTANCE_ID: u16 = 0x42;
+    /// Port value placed in the emitted `IpV4Endpoint` option so the
+    /// round-trip assertion has something non-zero to check. The test does
+    /// not bind this port — it only appears in the announcement payload.
+    const TEST_ADVERTISED_PORT: u16 = 40210;
+
+    #[test]
+    fn next_session_id_wraps_past_ffff_skipping_zero() {
+        let sd = SdStateManager::with_initial(0xFFFE);
+
+        // 0xFFFE -> 0xFFFF
+        assert_eq!(sd.next_session_id(), 0xFFFF);
+
+        // 0xFFFF -> wraps to 0x0001 (0 is skipped)
+        assert_eq!(sd.next_session_id(), 0x0001);
+    }
+
+    #[test]
+    fn next_session_id_starts_at_two_from_default_new() {
+        let sd = SdStateManager::new();
+        // new() seeds at 1; first next_session_id increments to 2
+        assert_eq!(sd.next_session_id(), 2);
+    }
+
+    /// Concurrent emitters around the wrap boundary must never produce
+    /// a `(session_id, reboot_flag)` pair where one is pre-wrap and the
+    /// other is post-wrap. Regression for the two-atomic TOCTOU race.
+    ///
+    /// We seed near the wrap and have many threads call
+    /// `next_session_id_with_reboot_flag` concurrently. Every
+    /// `(0xFFFF, _)` must carry `RecentlyRebooted`, every `(0x0001, _)`
+    /// (the wrap message) and beyond must carry `Continuous`.
+    #[test]
+    fn next_session_id_with_reboot_flag_never_mismatches_around_wrap() {
+        use std::sync::Arc;
+        for _trial in 0..20 {
+            let sd = Arc::new(SdStateManager::with_initial(0xFFF0));
+            let mut handles = std::vec::Vec::new();
+            for _ in 0..32 {
+                let s = Arc::clone(&sd);
+                handles.push(std::thread::spawn(move || {
+                    let (sid, flag) = s.next_session_id_with_reboot_flag();
+                    (sid, flag)
+                }));
+            }
+            for h in handles {
+                let (sid, flag) = h.join().unwrap();
+                // sid is u32 in 1..=0xFFFF (never 0).
+                assert!((1..=0xFFFF).contains(&sid), "sid out of range: {sid:#x}");
+                if sid == 0xFFFF {
+                    // The 0xFFFF emission is the LAST pre-wrap.
+                    assert_eq!(
+                        flag,
+                        RebootFlag::RecentlyRebooted,
+                        "sid=0xFFFF must carry RecentlyRebooted"
+                    );
+                } else if sid <= 0xFFEF {
+                    // We seeded at 0xFFF0, so any sid in 1..=0xFFEF
+                    // means the counter wrapped past 0xFFFF. Must be
+                    // Continuous.
+                    assert_eq!(
+                        flag,
+                        RebootFlag::Continuous,
+                        "post-wrap sid={sid:#x} must carry Continuous"
+                    );
+                }
+                // sids in 0xFFF0..=0xFFFE are the pre-wrap window —
+                // both flags are valid depending on whether this trial
+                // wrapped before/after the emission. Don't assert.
+            }
+        }
+    }
+
+    // ── Reboot-flag tracking ────────────────────────────────────────────
+    //
+    // AUTOSAR SOME/IP-SD: the reboot bit on emitted SD messages must be
+    // set until the session counter wraps past `0xFFFF` for the first
+    // time, then cleared permanently. These tests drive `SdStateManager`
+    // directly (no socket) and verify the state machine that every
+    // server-side SD emission path (`send_offer_service`, plus unicast
+    // offer / `SubscribeAck` / `SubscribeNack` in `server::Server`) now
+    // reads from via [`SdStateManager::reboot_flag`].
+
+    #[test]
+    fn reboot_flag_is_recently_rebooted_on_fresh_manager() {
+        // Default constructor: counter hasn't wrapped, flag must indicate
+        // a recent reboot so peers can re-synchronize SD state.
+        let sd = SdStateManager::new();
+        assert_eq!(sd.reboot_flag(), RebootFlag::RecentlyRebooted);
+    }
+
+    #[test]
+    fn reboot_flag_stays_recently_rebooted_below_wrap() {
+        // Advancing the counter short of a wrap must not flip the flag —
+        // it's specifically the 0xFFFF → 0x0001 transition that matters,
+        // not "has next_session_id been called more than once".
+        let sd = SdStateManager::with_initial(0x1233);
+        for _ in 0..10 {
+            sd.next_session_id();
+        }
+        assert_eq!(sd.reboot_flag(), RebootFlag::RecentlyRebooted);
+    }
+
+    #[test]
+    fn reboot_flag_flips_to_continuous_exactly_on_wrap() {
+        // Step the counter across the wrap boundary and assert the flag
+        // transitions on the precise call that crosses 0xFFFF → 0x0001.
+        let sd = SdStateManager::with_initial(0xFFFE);
+        assert_eq!(sd.reboot_flag(), RebootFlag::RecentlyRebooted);
+
+        // 0xFFFE -> 0xFFFF: prev=0xFFFE, no wrap.
+        assert_eq!(sd.next_session_id(), 0xFFFF);
+        assert_eq!(
+            sd.reboot_flag(),
+            RebootFlag::RecentlyRebooted,
+            "counter reached 0xFFFF but has not yet wrapped — flag must still be RecentlyRebooted",
+        );
+
+        // 0xFFFF -> 0x0001 (skip 0): prev=0xFFFF, wrap latches.
+        assert_eq!(sd.next_session_id(), 0x0001);
+        assert_eq!(
+            sd.reboot_flag(),
+            RebootFlag::Continuous,
+            "wrap just occurred — flag must now be Continuous",
+        );
+    }
+
+    #[test]
+    fn reboot_flag_is_monotonic_after_wrap() {
+        // Once the flag latches to Continuous it never goes back, even
+        // after the counter wraps a second time or is advanced
+        // indefinitely. Guard against a regression that would re-derive
+        // the flag from the current counter value (which would wrongly
+        // flip back to RecentlyRebooted at 0x0001).
+        let sd = SdStateManager::with_initial(0xFFFE);
+        sd.next_session_id(); // -> 0xFFFF
+        sd.next_session_id(); // wrap -> 0x0001
+        assert_eq!(sd.reboot_flag(), RebootFlag::Continuous);
+
+        // Many further advances, including crossing 0xFFFF again.
+        for _ in 0..(u32::from(u16::MAX) + 5) {
+            sd.next_session_id();
+        }
+        assert_eq!(sd.reboot_flag(), RebootFlag::Continuous);
+    }
+
+    // ── Multicast-loopback harness ──────────────────────────────────────
+    //
+    // All tests below drive `send_offer_service` against a real UDP socket
+    // and read the emitted packet off a second socket joined to the SD
+    // multicast group. These are `#[ignore]`d on environments whose
+    // loopback interface does not carry the `MULTICAST` flag (check with
+    // `ip link show lo`); on such hosts the kernel drops multicast on
+    // `lo` before loopback reflection, so the receiver times out. Runs
+    // in any environment where loopback multicast is available.
+
+    /// Bind a receiver socket on the SD multicast port, ready to
+    /// `join_multicast_v4`.
+    fn build_mcast_receiver(interface: Ipv4Addr) -> std::io::Result<UdpSocket> {
+        let raw = socket2::Socket::new(
+            socket2::Domain::IPV4,
+            socket2::Type::DGRAM,
+            Some(socket2::Protocol::UDP),
+        )?;
+        raw.set_reuse_address(true)?;
+        #[cfg(unix)]
+        raw.set_reuse_port(true)?;
+        raw.set_multicast_loop_v4(true)?;
+        raw.bind(&SocketAddr::new(IpAddr::V4(interface), sd::MULTICAST_PORT).into())?;
+        raw.set_nonblocking(true)?;
+        UdpSocket::from_std(raw.into())
+    }
+
+    /// Bind a sender [`TokioSocket`] on an ephemeral port with
+    /// `multicast_if` pinned to the loopback interface so emitted
+    /// packets loop back to any receiver joined to the same group on
+    /// that interface. Uses the [`TransportFactory`] surface so the
+    /// resulting socket implements [`crate::transport::TransportSocket`]
+    /// — which is what the now-generic
+    /// [`SdStateManager::send_offer_service`] requires.
+    async fn build_mcast_sender(
+        interface: Ipv4Addr,
+    ) -> Result<TokioSocket, crate::transport::TransportError> {
+        let mut opts = SocketOptions::new();
+        opts.reuse_address = true;
+        opts.reuse_port = true;
+        opts.multicast_if_v4 = Some(interface);
+        opts.multicast_loop_v4 = Some(true);
+        crate::tokio_transport::TokioTransport
+            .bind(SocketAddrV4::new(interface, 0), &opts)
+            .await
+    }
+
+    /// Fields extracted from a received SOME/IP-SD `OfferService` packet.
+    /// Keeping these together makes per-test assertions a straight list of
+    /// `assert_eq!`s against expected values.
+    struct ReceivedOffer {
+        request_id: u32,
+        someip_service_id: u16,
+        someip_method_id: u16,
+        message_type: MessageType,
+        return_code: ReturnCode,
+        protocol_version: u8,
+        interface_version: u8,
+        flags: Flags,
+        entry_service_id: u16,
+        entry_instance_id: u16,
+        entry_major_version: u8,
+        entry_minor_version: u32,
+        entry_ttl: u32,
+        endpoint_ip: Ipv4Addr,
+        endpoint_port: u16,
+        endpoint_protocol: TransportProtocol,
+    }
+
+    /// Wait for a multicast `OfferService` matching `expected_service_id`,
+    /// returning its decoded fields. Other packets on the group (from
+    /// concurrent tests) are ignored; a single outer timeout bounds the
+    /// whole filter loop.
+    async fn recv_our_offer(
+        rx: &UdpSocket,
+        expected_service_id: u16,
+        within: Duration,
+    ) -> ReceivedOffer {
+        let recv_loop = async {
+            let mut buf = [0u8; 2048];
+            loop {
+                let (len, _from) = rx
+                    .recv_from(&mut buf)
+                    .await
+                    .expect("recv_from should succeed");
+                let Ok(view) = MessageView::parse(&buf[..len]) else {
+                    continue;
+                };
+                if view.header().message_id().service_id() != 0xFFFF {
+                    continue;
+                }
+                let Ok(sd_view) = view.sd_header() else {
+                    continue;
+                };
+                let Some(entry) = sd_view.entries().next() else {
+                    continue;
+                };
+                if !matches!(entry.entry_type(), Ok(EntryType::OfferService)) {
+                    continue;
+                }
+                if entry.service_id() != expected_service_id {
+                    continue;
+                }
+                let first_option = sd_view
+                    .options()
+                    .next()
+                    .expect("OfferService should carry an endpoint option");
+                let (endpoint_ip, endpoint_protocol, endpoint_port) = first_option
+                    .as_ipv4()
+                    .expect("endpoint option should decode as IPv4");
+                return ReceivedOffer {
+                    request_id: view.header().request_id(),
+                    someip_service_id: view.header().message_id().service_id(),
+                    someip_method_id: view.header().message_id().method_id(),
+                    message_type: view.header().message_type().message_type(),
+                    return_code: view.header().return_code(),
+                    protocol_version: view.header().protocol_version(),
+                    interface_version: view.header().interface_version(),
+                    flags: sd_view.flags(),
+                    entry_service_id: entry.service_id(),
+                    entry_instance_id: entry.instance_id(),
+                    entry_major_version: entry.major_version(),
+                    entry_minor_version: entry.minor_version(),
+                    entry_ttl: entry.ttl(),
+                    endpoint_ip,
+                    endpoint_port,
+                    endpoint_protocol,
+                };
+            }
+        };
+        tokio::time::timeout(within, recv_loop)
+            .await
+            .expect("timed out waiting for our OfferService")
+    }
+
+    /// Assert every field of the SOME/IP + SD envelope that
+    /// `send_offer_service` is responsible for — not just the entry body.
+    /// A future regression that garbles the endpoint option, flips a flag,
+    /// or changes the SOME/IP message type should fail here.
+    ///
+    /// `expected_reboot` lets pre-wrap callers assert `RecentlyRebooted`
+    /// and post-wrap callers assert `Continuous`; the flag is tracked by
+    /// `SdStateManager::has_wrapped` and read via `reboot_flag()` at each
+    /// send.
+    fn assert_offer_matches(
+        offer: &ReceivedOffer,
+        config: &ServerConfig,
+        expected_request_id: u32,
+        expected_reboot: RebootFlag,
+    ) {
+        // SOME/IP envelope
+        assert_eq!(offer.someip_service_id, 0xFFFF, "SD uses service_id 0xFFFF");
+        assert_eq!(offer.someip_method_id, 0x8100, "SD uses method_id 0x8100");
+        assert_eq!(offer.message_type, MessageType::Notification);
+        assert_eq!(offer.return_code, ReturnCode::Ok);
+        assert_eq!(offer.protocol_version, 0x01);
+        assert_eq!(offer.interface_version, 0x01);
+        assert_eq!(
+            offer.request_id, expected_request_id,
+            "request_id is session_id in low 16 bits, client_id zero in high 16",
+        );
+        // SD flags — reboot comes from SdStateManager::reboot_flag (latches
+        // to Continuous after the session counter wraps past 0xFFFF);
+        // unicast is always true for SD.
+        assert_eq!(offer.flags.reboot(), expected_reboot);
+        assert!(offer.flags.unicast());
+        // OfferService entry
+        assert_eq!(offer.entry_service_id, config.service_id);
+        assert_eq!(offer.entry_instance_id, config.instance_id);
+        assert_eq!(offer.entry_major_version, config.major_version);
+        assert_eq!(offer.entry_minor_version, config.minor_version);
+        assert_eq!(offer.entry_ttl, config.ttl);
+        // Endpoint option
+        assert_eq!(offer.endpoint_ip, config.interface);
+        assert_eq!(offer.endpoint_port, config.local_port);
+        assert_eq!(offer.endpoint_protocol, TransportProtocol::Udp);
+    }
+
+    /// Standard loopback receiver/sender pair used by the send-path tests.
+    async fn mcast_rx_tx() -> (UdpSocket, TokioSocket) {
+        let interface = Ipv4Addr::LOCALHOST;
+        let rx = build_mcast_receiver(interface).expect("bind receiver");
+        rx.join_multicast_v4(sd::MULTICAST_IP, interface)
+            .expect("join SD multicast group");
+        let tx = build_mcast_sender(interface).await.expect("bind sender");
+        (rx, tx)
+    }
+
+    #[ignore = "requires MULTICAST on loopback; skipped on hosts whose `lo` \
+                lacks the MULTICAST flag. Runs in any environment where \
+                loopback multicast is available."]
+    #[tokio::test]
+    async fn send_offer_service_emits_parseable_offer_to_multicast() {
+        let config = ServerConfig::new(
+            Ipv4Addr::LOCALHOST,
+            TEST_ADVERTISED_PORT,
+            TEST_SERVICE_ID,
+            TEST_INSTANCE_ID,
+        );
+        let (rx, tx) = mcast_rx_tx().await;
+
+        // Seed with a recognisable value so on-wire session_id is exact.
+        let sd_state = SdStateManager::with_initial(0x1233);
+        sd_state
+            .send_offer_service(&config, &tx)
+            .await
+            .expect("send_offer_service should succeed on a configured socket");
+
+        let offer = recv_our_offer(&rx, config.service_id, Duration::from_secs(2)).await;
+        // next_session_id advances 0x1233 -> 0x1234; client_id is zero.
+        // Fresh SdStateManager: counter has not wrapped, reboot flag is
+        // RecentlyRebooted.
+        assert_offer_matches(&offer, &config, 0x0000_1234, RebootFlag::RecentlyRebooted);
+    }
+
+    #[ignore = "requires MULTICAST on loopback; skipped on hosts whose `lo` \
+                lacks the MULTICAST flag. Runs in any environment where \
+                loopback multicast is available."]
+    #[tokio::test]
+    async fn send_offer_service_advances_session_id_across_calls() {
+        // Back-to-back sends must consume distinct, incrementing session
+        // IDs — catches a regression where `send_offer_service` reads the
+        // counter without advancing it, or reuses a cached value.
+        let config = ServerConfig::new(
+            Ipv4Addr::LOCALHOST,
+            TEST_ADVERTISED_PORT,
+            TEST_SERVICE_ID,
+            TEST_INSTANCE_ID,
+        );
+        let (rx, tx) = mcast_rx_tx().await;
+
+        let sd_state = SdStateManager::with_initial(0x1233);
+        sd_state.send_offer_service(&config, &tx).await.unwrap();
+        sd_state.send_offer_service(&config, &tx).await.unwrap();
+
+        let first = recv_our_offer(&rx, config.service_id, Duration::from_secs(2)).await;
+        let second = recv_our_offer(&rx, config.service_id, Duration::from_secs(2)).await;
+        assert_eq!(first.request_id, 0x0000_1234);
+        assert_eq!(second.request_id, 0x0000_1235);
+    }
+
+    #[ignore = "requires MULTICAST on loopback; skipped on hosts whose `lo` \
+                lacks the MULTICAST flag. Runs in any environment where \
+                loopback multicast is available."]
+    #[tokio::test]
+    async fn send_offer_service_wraps_session_id_through_zero_on_send() {
+        // Session counter wrap must be visible on the wire: 0xFFFE -> 0xFFFF
+        // -> 0x0001 (skipping the reserved 0). Exercises the wrap branch
+        // *through* the send path, not only the unit test of next_session_id.
+        let config = ServerConfig::new(
+            Ipv4Addr::LOCALHOST,
+            TEST_ADVERTISED_PORT,
+            TEST_SERVICE_ID,
+            TEST_INSTANCE_ID,
+        );
+        let (rx, tx) = mcast_rx_tx().await;
+
+        let sd_state = SdStateManager::with_initial(0xFFFE);
+        sd_state.send_offer_service(&config, &tx).await.unwrap();
+        sd_state.send_offer_service(&config, &tx).await.unwrap();
+
+        let first = recv_our_offer(&rx, config.service_id, Duration::from_secs(2)).await;
+        let second = recv_our_offer(&rx, config.service_id, Duration::from_secs(2)).await;
+        assert_eq!(first.request_id, 0x0000_FFFF);
+        assert_eq!(
+            second.request_id, 0x0000_0001,
+            "must skip reserved 0 on wrap"
+        );
+        // Reboot flag latches: the first emission goes out before the
+        // wrap happens (prev=0xFFFE), so it still advertises
+        // RecentlyRebooted; the second emission is the one whose
+        // next_session_id call crossed 0xFFFF -> 0x0001, so the flag
+        // Flips to Continuous permanently from there on.
+        assert_eq!(
+            first.flags.reboot(),
+            RebootFlag::RecentlyRebooted,
+            "first emit is pre-wrap and must still advertise RecentlyRebooted",
+        );
+        assert_eq!(
+            second.flags.reboot(),
+            RebootFlag::Continuous,
+            "post-wrap emit must advertise Continuous",
+        );
+    }
+
+    #[ignore = "requires MULTICAST on loopback; skipped on hosts whose `lo` \
+                lacks the MULTICAST flag. Runs in any environment where \
+                loopback multicast is available."]
+    #[tokio::test]
+    async fn send_offer_service_preserves_zero_ttl() {
+        // TTL=0 is a legitimate SOME/IP-SD value meaning "stop offering";
+        // `send_offer_service` must preserve it end-to-end rather than,
+        // say, defaulting it back to the ServerConfig::new value of 3.
+        let mut config = ServerConfig::new(
+            Ipv4Addr::LOCALHOST,
+            TEST_ADVERTISED_PORT,
+            TEST_SERVICE_ID,
+            TEST_INSTANCE_ID,
+        );
+        config.ttl = 0;
+        let (rx, tx) = mcast_rx_tx().await;
+
+        let sd_state = SdStateManager::with_initial(0x1233);
+        sd_state.send_offer_service(&config, &tx).await.unwrap();
+
+        let offer = recv_our_offer(&rx, config.service_id, Duration::from_secs(2)).await;
+        assert_offer_matches(&offer, &config, 0x0000_1234, RebootFlag::RecentlyRebooted);
+        // Belt-and-suspenders: assert_offer_matches already checks this,
+        // but the purpose of this test is specifically the zero case.
+        assert_eq!(offer.entry_ttl, 0);
+    }
+}
diff --git a/src/server/service_info.rs b/src/server/service_info.rs
index 59bf38a..a702278 100644
--- a/src/server/service_info.rs
+++ b/src/server/service_info.rs
@@ -52,6 +52,7 @@ pub struct Subscriber {
 
 impl Subscriber {
     /// Create a new subscriber
+    #[must_use]
     pub fn new(
         address: SocketAddrV4,
         service_id: u16,
diff --git a/src/server/subscription_manager.rs b/src/server/subscription_manager.rs
index 28667bc..57d180c 100644
--- a/src/server/subscription_manager.rs
+++ b/src/server/subscription_manager.rs
@@ -1,13 +1,74 @@
 //! Manages event group subscriptions
 
 use super::service_info::Subscriber;
-use std::{collections::HashMap, net::SocketAddrV4, vec::Vec};
+use core::future::Future;
+use heapless::{Vec as HeaplessVec, index_map::FnvIndexMap};
+#[cfg(feature = "server-tokio")]
+use std::sync::Arc;
+use std::{net::SocketAddrV4, vec::Vec};
+#[cfg(feature = "server-tokio")]
+use tokio::sync::RwLock;
 
-/// Manages subscriptions to event groups
+/// Max number of distinct `(service_id, instance_id, event_group_id)` event
+/// groups with active subscribers. Must be a power of two.
+const EVENT_GROUPS_CAP: usize = 32;
+
+/// Max number of subscribers per event group. Excess subscribers are dropped
+/// with a `warn!` log rather than silently.
+pub(crate) const SUBSCRIBERS_PER_GROUP: usize = 16;
+
+// Compile-time invariants. Trip these at `cargo build` so that retuning
+// the constants above can't quietly produce a `subscribe` impl that
+// panics on first push (zero `SUBSCRIBERS_PER_GROUP`) or that fails the
+// `heapless::FnvIndexMap` build (non-power-of-two `EVENT_GROUPS_CAP`).
+const _: () = assert!(
+    SUBSCRIBERS_PER_GROUP >= 1,
+    "SUBSCRIBERS_PER_GROUP must be >= 1: a value of 0 would crash subscribe() on first push"
+);
+const _: () = assert!(
+    EVENT_GROUPS_CAP.is_power_of_two(),
+    "EVENT_GROUPS_CAP must be a power of two for heapless::FnvIndexMap"
+);
+
+/// Why a call to [`SubscriptionManager::subscribe`] failed to record a new
+/// subscriber. Callers (typically the server's `Subscribe` handler) should
+/// use this to emit a `SubscribeNack` instead of a misleading `SubscribeAck`.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum SubscribeError {
+    /// The per-event-group subscriber list is already full
+    /// (`SUBSCRIBERS_PER_GROUP` entries). The caller's request was not
+    /// recorded.
+    SubscribersPerGroupFull,
+    /// The outer event-group map is already full (`EVENT_GROUPS_CAP`
+    /// distinct `(service_id, instance_id, event_group_id)` keys). The
+    /// caller's request was not recorded.
+    EventGroupsFull,
+}
+
+impl core::fmt::Display for SubscribeError {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        match self {
+            Self::SubscribersPerGroupFull => write!(
+                f,
+                "subscribers-per-group at capacity ({SUBSCRIBERS_PER_GROUP})"
+            ),
+            Self::EventGroupsFull => {
+                write!(f, "event-group map at capacity ({EVENT_GROUPS_CAP})")
+            }
+        }
+    }
+}
+
+type SubscribersList = HeaplessVec<Subscriber, SUBSCRIBERS_PER_GROUP>;
+
+/// Manages subscriptions to event groups.
+///
+/// Capacity is bounded at compile time: up to `EVENT_GROUPS_CAP` distinct
+/// event groups, each with up to `SUBSCRIBERS_PER_GROUP` subscribers.
 #[derive(Debug)]
 pub struct SubscriptionManager {
     /// Map of (`service_id`, `instance_id`, `event_group_id`) -> list of subscribers
-    subscriptions: HashMap<(u16, u16, u16), Vec<Subscriber>>,
+    subscriptions: FnvIndexMap<(u16, u16, u16), SubscribersList, EVENT_GROUPS_CAP>,
 }
 
 impl SubscriptionManager {
@@ -15,35 +76,123 @@ impl SubscriptionManager {
     #[must_use]
     pub fn new() -> Self {
         Self {
-            subscriptions: HashMap::new(),
+            subscriptions: FnvIndexMap::new(),
         }
     }
 
-    /// Add a subscriber to an event group
+    /// Add a subscriber to an event group.
+    ///
+    /// Returns `Ok(())` both when a new subscriber is added and when the
+    /// given `(service_id, instance_id, event_group_id, subscriber_addr)`
+    /// is already subscribed — the call is idempotent / deduplicated, and
+    /// no stored subscriber state is modified on a duplicate. There is no
+    /// TTL bump or other refresh side-effect today; if TTL-refresh
+    /// semantics are added later, this docstring and the duplicate-log
+    /// wording will be updated together.
+    ///
+    /// Returns `Err(SubscribeError)` when the request could not be
+    /// recorded because a bounded capacity was hit — the caller
+    /// (typically the server's `Subscribe` handler) should send a
+    /// `SubscribeNack` on `Err`, not a `SubscribeAck`.
+    ///
+    /// # Errors
+    ///
+    /// Returns:
+    /// - `SubscribeError::SubscribersPerGroupFull` when an existing event
+    ///   group already has `SUBSCRIBERS_PER_GROUP` subscribers and this
+    ///   call would push a new one.
+    /// - `SubscribeError::EventGroupsFull` when this is the first
+    ///   subscriber for a previously-unseen `(service_id, instance_id,
+    ///   event_group_id)` triple but the outer event-group map is full
+    ///   (`EVENT_GROUPS_CAP` distinct groups).
+    ///
+    /// # Panics
+    ///
+    /// Panics if `SUBSCRIBERS_PER_GROUP == 0`, a compile-time constant that
+    /// must be at least one for a newly-allocated subscriber list to accept
+    /// its first entry.
     pub fn subscribe(
         &mut self,
         service_id: u16,
         instance_id: u16,
         event_group_id: u16,
         subscriber_addr: SocketAddrV4,
-    ) {
+    ) -> Result<(), SubscribeError> {
         let key = (service_id, instance_id, event_group_id);
-        let subscribers = self.subscriptions.entry(key).or_default();
 
-        // Deduplicate: if this address is already subscribed, just refresh (don't add again)
-        if subscribers.iter().any(|s| s.address == subscriber_addr) {
-            tracing::debug!(
-                "Refreshed existing subscriber {} for service 0x{:04X}, instance {}, event group 0x{:04X}",
+        if let Some(subscribers) = self.subscriptions.get_mut(&key) {
+            // Deduplicate: if this address is already subscribed, skip adding
+            // it again. No stored subscriber state is modified — the log
+            // message reflects that. If real refresh semantics (e.g. TTL
+            // bump on re-subscribe) are wanted later, update the per-
+            // subscriber record here and rename the log accordingly.
+            if subscribers.iter().any(|s| s.address == subscriber_addr) {
+                tracing::debug!(
+                    "Subscriber {} already subscribed for service 0x{:04X}, instance {}, \
+                     event group 0x{:04X}; skipping duplicate",
+                    subscriber_addr,
+                    service_id,
+                    instance_id,
+                    event_group_id
+                );
+                return Ok(());
+            }
+
+            let subscriber =
+                Subscriber::new(subscriber_addr, service_id, instance_id, event_group_id);
+            if subscribers.push(subscriber).is_err() {
+                tracing::warn!(
+                    "Subscribers-per-group at capacity ({}); dropping new subscriber {} \
+                     for service 0x{:04X}, instance {}, event group 0x{:04X}",
+                    SUBSCRIBERS_PER_GROUP,
+                    subscriber_addr,
+                    service_id,
+                    instance_id,
+                    event_group_id
+                );
+                return Err(SubscribeError::SubscribersPerGroupFull);
+            }
+
+            tracing::info!(
+                "Subscriber {} added for service 0x{:04X}, instance {}, event group 0x{:04X}",
                 subscriber_addr,
                 service_id,
                 instance_id,
                 event_group_id
             );
-            return;
+            return Ok(());
         }
 
-        let subscriber = Subscriber::new(subscriber_addr, service_id, instance_id, event_group_id);
-        subscribers.push(subscriber);
+        // New event group — allocate the list and insert.
+        let mut list = SubscribersList::new();
+        // The first push into an empty heapless::Vec cannot fail as long
+        // as SUBSCRIBERS_PER_GROUP >= 1 (enforced by the constant's
+        // definition). Use `expect` here — a future refactor setting the
+        // cap to 0 would trip this at test time instead of silently
+        // dropping the only subscriber for a new event group.
+        list.push(Subscriber::new(
+            subscriber_addr,
+            service_id,
+            instance_id,
+            event_group_id,
+        ))
+        .expect(
+            "new SubscribersList must accept the first subscriber; \
+             SUBSCRIBERS_PER_GROUP must be >= 1",
+        );
+
+        if self.subscriptions.insert(key, list).is_err() {
+            tracing::warn!(
+                "Event-group map at capacity ({}); dropping subscriber {} for new group \
+                 service 0x{:04X}, instance {}, event group 0x{:04X}",
+                EVENT_GROUPS_CAP,
+                subscriber_addr,
+                service_id,
+                instance_id,
+                event_group_id
+            );
+            return Err(SubscribeError::EventGroupsFull);
+        }
 
         tracing::info!(
             "Subscriber {} added for service 0x{:04X}, instance {}, event group 0x{:04X}",
@@ -52,6 +201,7 @@ impl SubscriptionManager {
             instance_id,
             event_group_id
         );
+        Ok(())
     }
 
     /// Remove a subscriber from an event group
@@ -90,13 +240,16 @@ impl SubscriptionManager {
         event_group_id: u16,
     ) -> Vec<Subscriber> {
         let key = (service_id, instance_id, event_group_id);
-        self.subscriptions.get(&key).cloned().unwrap_or_default()
+        self.subscriptions
+            .get(&key)
+            .map(|list| list.iter().cloned().collect())
+            .unwrap_or_default()
     }
 
     /// Get total number of active subscriptions
     #[must_use]
     pub fn subscription_count(&self) -> usize {
-        self.subscriptions.values().map(std::vec::Vec::len).sum()
+        self.subscriptions.values().map(|v| v.len()).sum()
     }
 }
 
@@ -106,6 +259,124 @@ impl Default for SubscriptionManager {
     }
 }
 
+/// Shared handle to the server's subscription table.
+///
+/// Abstracts over `Arc<RwLock<SubscriptionManager>>` on `std` and over
+/// critical-section-backed equivalents on bare metal. The futures
+/// returned by the methods are not required to be `Send`, allowing
+/// single-threaded executors (embassy-style) to satisfy the trait
+/// without an `Arc<RwLock>`-style shared state.
+///
+/// Both `Server` and `EventPublisher` clone the same handle at construction
+/// time; the underlying subscription state is shared between them.
+pub trait SubscriptionHandle: Clone + 'static {
+    /// Add a subscriber to an event group.
+    ///
+    /// Idempotent: if the subscriber is already present, this is a no-op
+    /// returning `Ok(())`. Returns `Err(SubscribeError)` if a capacity
+    /// limit would be exceeded.
+    fn subscribe(
+        &self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        subscriber_addr: SocketAddrV4,
+    ) -> impl Future<Output = Result<(), SubscribeError>> + '_;
+
+    /// Remove a subscriber from an event group.
+    fn unsubscribe(
+        &self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        subscriber_addr: SocketAddrV4,
+    ) -> impl Future<Output = ()> + '_;
+
+    /// Visit each subscriber for the given event group with `f`.
+    ///
+    /// The implementation typically holds an internal read lock for the
+    /// duration of the visit; `f` is a synchronous `FnMut` callback —
+    /// the caller MUST NOT yield inside it. A common pattern is to copy
+    /// the subscriber addresses into a stack-allocated buffer here, then
+    /// release the lock and dispatch sends in a second phase.
+    ///
+    /// Returns the total number of subscribers visited. Replaces the
+    /// previous `get_subscribers -> Vec<Subscriber>` API; the visitor
+    /// pattern lets `EventPublisher::publish_event` avoid a per-event
+    /// heap allocation.
+    fn for_each_subscriber<'a, F>(
+        &'a self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        f: F,
+    ) -> impl Future<Output = usize> + 'a
+    where
+        F: FnMut(&Subscriber) + 'a;
+}
+
+#[cfg(feature = "server-tokio")]
+impl SubscriptionHandle for Arc<RwLock<SubscriptionManager>> {
+    fn subscribe(
+        &self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        subscriber_addr: SocketAddrV4,
+    ) -> impl Future<Output = Result<(), SubscribeError>> + '_ {
+        let this = self.clone();
+        async move {
+            this.write()
+                .await
+                .subscribe(service_id, instance_id, event_group_id, subscriber_addr)
+        }
+    }
+
+    fn unsubscribe(
+        &self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        subscriber_addr: SocketAddrV4,
+    ) -> impl Future<Output = ()> + '_ {
+        let this = self.clone();
+        async move {
+            this.write().await.unsubscribe(
+                service_id,
+                instance_id,
+                event_group_id,
+                subscriber_addr,
+            );
+        }
+    }
+
+    fn for_each_subscriber<'a, F>(
+        &'a self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        mut f: F,
+    ) -> impl Future<Output = usize> + 'a
+    where
+        F: FnMut(&Subscriber) + 'a,
+    {
+        let this = self.clone();
+        async move {
+            let guard = this.read().await;
+            let key = (service_id, instance_id, event_group_id);
+            match guard.subscriptions.get(&key) {
+                Some(list) => {
+                    for sub in list {
+                        f(sub);
+                    }
+                    list.len()
+                }
+                None => 0,
+            }
+        }
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -117,7 +388,7 @@ mod tests {
         let addr = SocketAddrV4::new(Ipv4Addr::new(192, 168, 1, 1), 8080);
 
         // Subscribe
-        manager.subscribe(0x5B, 1, 0x01, addr);
+        manager.subscribe(0x5B, 1, 0x01, addr).unwrap();
         assert_eq!(manager.subscription_count(), 1);
 
         // Get subscribers
@@ -135,11 +406,11 @@ mod tests {
         let mut manager = SubscriptionManager::new();
         let addr = SocketAddrV4::new(Ipv4Addr::new(192, 168, 1, 1), 8080);
 
-        manager.subscribe(0x5B, 1, 0x01, addr);
+        manager.subscribe(0x5B, 1, 0x01, addr).unwrap();
         assert_eq!(manager.subscription_count(), 1);
 
         // Subscribe same address again — should deduplicate
-        manager.subscribe(0x5B, 1, 0x01, addr);
+        manager.subscribe(0x5B, 1, 0x01, addr).unwrap();
         assert_eq!(manager.subscription_count(), 1);
     }
 
@@ -164,4 +435,176 @@ mod tests {
         let manager = SubscriptionManager::default();
         assert_eq!(manager.subscription_count(), 0);
     }
+
+    #[test]
+    fn subscribers_per_group_capacity_overflow() {
+        let mut manager = SubscriptionManager::new();
+        // Fill one event group to capacity.
+        for i in 0..SUBSCRIBERS_PER_GROUP {
+            let addr =
+                SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 8000 + u16::try_from(i).unwrap());
+            manager.subscribe(0x5B, 1, 0x01, addr).unwrap();
+        }
+        assert_eq!(manager.subscription_count(), SUBSCRIBERS_PER_GROUP);
+
+        // One more is dropped, and the call reports SubscribersPerGroupFull
+        // so the server can NACK.
+        let extra = SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 9999);
+        assert_eq!(
+            manager.subscribe(0x5B, 1, 0x01, extra),
+            Err(SubscribeError::SubscribersPerGroupFull),
+        );
+        assert_eq!(manager.subscription_count(), SUBSCRIBERS_PER_GROUP);
+        // Extra subscriber should not appear in the list.
+        let subs = manager.get_subscribers(0x5B, 1, 0x01);
+        assert!(subs.iter().all(|s| s.address != extra));
+    }
+
+    #[test]
+    fn event_groups_capacity_overflow() {
+        let mut manager = SubscriptionManager::new();
+        let addr = SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 8000);
+        // Fill the outer map to capacity with distinct event groups.
+        for i in 0..EVENT_GROUPS_CAP {
+            let eg = u16::try_from(i).unwrap();
+            manager.subscribe(0x5B, 1, eg, addr).unwrap();
+        }
+        assert_eq!(manager.subscription_count(), EVENT_GROUPS_CAP);
+
+        // A new event group beyond capacity is dropped, and the call reports
+        // EventGroupsFull so the server can NACK.
+        let overflow_eg = u16::try_from(EVENT_GROUPS_CAP).unwrap();
+        assert_eq!(
+            manager.subscribe(0x5B, 1, overflow_eg, addr),
+            Err(SubscribeError::EventGroupsFull),
+        );
+        assert_eq!(manager.subscription_count(), EVENT_GROUPS_CAP);
+        assert!(manager.get_subscribers(0x5B, 1, overflow_eg).is_empty());
+    }
+
+    #[test]
+    fn unsubscribe_one_of_multiple_leaves_group_intact() {
+        let mut manager = SubscriptionManager::new();
+        let a1 = SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 8001);
+        let a2 = SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 2), 8002);
+
+        manager.subscribe(0x5B, 1, 0x01, a1).unwrap();
+        manager.subscribe(0x5B, 1, 0x01, a2).unwrap();
+        assert_eq!(manager.subscription_count(), 2);
+
+        // Remove just a1 — group must stay with a2 only.
+        manager.unsubscribe(0x5B, 1, 0x01, a1);
+        assert_eq!(manager.subscription_count(), 1);
+        let subs = manager.get_subscribers(0x5B, 1, 0x01);
+        assert_eq!(subs.len(), 1);
+        assert_eq!(subs[0].address, a2);
+    }
+
+    #[test]
+    fn unsubscribe_address_not_in_existing_group_is_noop() {
+        let mut manager = SubscriptionManager::new();
+        let a1 = SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 8001);
+        let a2 = SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 2), 8002);
+
+        manager.subscribe(0x5B, 1, 0x01, a1).unwrap();
+        // a2 was never subscribed — unsubscribe must not panic or affect a1.
+        manager.unsubscribe(0x5B, 1, 0x01, a2);
+        assert_eq!(manager.subscription_count(), 1);
+        assert_eq!(manager.get_subscribers(0x5B, 1, 0x01)[0].address, a1);
+    }
+
+    #[test]
+    fn get_subscribers_returns_all_in_group() {
+        let mut manager = SubscriptionManager::new();
+        let addrs: Vec<SocketAddrV4> = (0..4)
+            .map(|i| SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, i + 1), 8000 + u16::from(i)))
+            .collect();
+        for &a in &addrs {
+            manager.subscribe(0x5B, 1, 0x01, a).unwrap();
+        }
+        let subs = manager.get_subscribers(0x5B, 1, 0x01);
+        assert_eq!(subs.len(), 4);
+        for &a in &addrs {
+            assert!(subs.iter().any(|s| s.address == a));
+        }
+    }
+
+    #[test]
+    fn subscription_count_spans_multiple_event_groups() {
+        let mut manager = SubscriptionManager::new();
+        let a = SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 8000);
+        manager.subscribe(0x5B, 1, 0x01, a).unwrap();
+        manager.subscribe(0x5B, 1, 0x02, a).unwrap();
+        manager.subscribe(0x5C, 1, 0x01, a).unwrap();
+        assert_eq!(manager.subscription_count(), 3);
+    }
+
+    #[test]
+    fn subscribe_error_display() {
+        use std::string::ToString;
+        assert!(
+            SubscribeError::SubscribersPerGroupFull
+                .to_string()
+                .contains("subscribers-per-group"),
+        );
+        assert!(
+            SubscribeError::EventGroupsFull
+                .to_string()
+                .contains("event-group"),
+        );
+    }
+
+    #[cfg(feature = "server-tokio")]
+    mod tokio_handle {
+        use super::*;
+        use std::sync::Arc;
+        use tokio::sync::RwLock;
+
+        #[tokio::test]
+        async fn for_each_subscriber_visits_all() {
+            let handle: Arc<RwLock<SubscriptionManager>> =
+                Arc::new(RwLock::new(SubscriptionManager::new()));
+            let a1 = SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 8001);
+            let a2 = SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 2), 8002);
+
+            handle.subscribe(0x5B, 1, 0x01, a1).await.unwrap();
+            handle.subscribe(0x5B, 1, 0x01, a2).await.unwrap();
+
+            let mut visited = Vec::new();
+            let count = handle
+                .for_each_subscriber(0x5B, 1, 0x01, |s| visited.push(s.address))
+                .await;
+
+            assert_eq!(count, 2);
+            assert!(visited.contains(&a1));
+            assert!(visited.contains(&a2));
+        }
+
+        #[tokio::test]
+        async fn for_each_subscriber_empty_group_returns_zero() {
+            let handle: Arc<RwLock<SubscriptionManager>> =
+                Arc::new(RwLock::new(SubscriptionManager::new()));
+            let count = handle.for_each_subscriber(0x5B, 1, 0x01, |_| {}).await;
+            assert_eq!(count, 0);
+        }
+
+        #[tokio::test]
+        async fn for_each_subscriber_reflects_unsubscribe() {
+            let handle: Arc<RwLock<SubscriptionManager>> =
+                Arc::new(RwLock::new(SubscriptionManager::new()));
+            let a1 = SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 1), 8001);
+            let a2 = SocketAddrV4::new(Ipv4Addr::new(10, 0, 0, 2), 8002);
+
+            handle.subscribe(0x5B, 1, 0x01, a1).await.unwrap();
+            handle.subscribe(0x5B, 1, 0x01, a2).await.unwrap();
+            handle.unsubscribe(0x5B, 1, 0x01, a1).await;
+
+            let mut visited = Vec::new();
+            let count = handle
+                .for_each_subscriber(0x5B, 1, 0x01, |s| visited.push(s.address))
+                .await;
+            assert_eq!(count, 1);
+            assert_eq!(visited, [a2]);
+        }
+    }
 }
diff --git a/src/static_channels/mod.rs b/src/static_channels/mod.rs
new file mode 100644
index 0000000..d945da6
--- /dev/null
+++ b/src/static_channels/mod.rs
@@ -0,0 +1,1412 @@
+//! Static-pool no-alloc backend for [`ChannelFactory`].
+//!
+//! `crate::embassy_channels::EmbassySyncChannels` (under
+//! `feature = "embassy_channels"`) heap-allocates one
+//! `Arc<Channel<...>>` per `oneshot()` / `bounded()` / `unbounded()`
+//! call. On a real bare-metal target that violates the strategic
+//! "zero heap after `Client::new` returns" goal, because
+//! `Client`'s run-loop awaits a oneshot for every request-response
+//! pair.
+//!
+//! This module hands out `&'static` references into pre-allocated
+//! `static` pools instead. The user declares pools (typically via
+//! the [`define_static_channels!`](crate::define_static_channels) macro)
+//! sized to their workload's high-water mark; once seeded, no further
+//! allocation occurs.
+//!
+//! # Per-`T` `*Pooled<MyChannels>` impls
+//!
+//! [`ChannelFactory`] requires each constructor method to have
+//! `T: *Pooled<Self>`. Static-pool consumers publish per-`T`
+//! impls that route to the appropriate pool. The
+//! [`define_static_channels!`](crate::define_static_channels) macro
+//! generates them; the primitives in this module are the runtime they
+//! call into.
+//!
+//! # Pool exhaustion
+//!
+//! If an `OneshotPool::claim()` / `MpscPool::claim_bounded()` call finds the
+//! pool empty it returns `None`. The trait method
+//! `*Pooled::*_pair() -> (Sender, Receiver)` cannot return `None` —
+//! it has no error channel — so generated impls **panic** on
+//! exhaustion. Sizing the pool to the workload's high-water mark is
+//! the user's responsibility; an exhaustion panic is a config error,
+//! not a runtime error.
+//!
+//! # Cancellation semantics
+//!
+//! - **Sender drop without `send`**: the slot's cancellation flag is
+//!   set; the receiver's pending `recv()` resolves to
+//!   `Err(OneshotCancelled)` (oneshot) or `None` (bounded /
+//!   unbounded mpsc, after the last sender drops).
+//! - **Receiver drop**: any pending value in the slot is dropped when
+//!   the slot is reclaimed. Bounded senders blocked on a full channel
+//!   are all woken via the slot's `MultiWakerRegistration` so each
+//!   resolves to `Err(())` on its next poll — including cloned senders
+//!   beyond the registration's static cap, which fall back to the
+//!   "wake-on-next-register" path.
+
+#![allow(clippy::module_name_repetitions)]
+
+use core::cell::{Cell, RefCell};
+use core::future::{Future, poll_fn};
+use core::pin::Pin;
+use core::sync::atomic::{AtomicBool, AtomicU8, AtomicUsize, Ordering};
+use core::task::Poll;
+
+use embassy_sync::blocking_mutex::Mutex as BlockingMutex;
+use embassy_sync::blocking_mutex::raw::CriticalSectionRawMutex;
+use embassy_sync::channel::Channel;
+use embassy_sync::waitqueue::{AtomicWaker, MultiWakerRegistration};
+
+/// Maximum number of distinct waiting senders we wake on receiver drop.
+/// More than this and the multi-waker auto-wakes-and-clears on the next
+/// register, so the close path remains correct under any sender count —
+/// it just degrades to "wake on next register" for the overflow case.
+const SEND_WAKER_CAP: usize = 8;
+
+use crate::transport::{
+    MpscRecv, MpscSend, OneshotCancelled, OneshotRecv, OneshotSend, UnboundedRecv, UnboundedSend,
+};
+
+// ── Oneshot ───────────────────────────────────────────────────────────
+
+const O_SENDER_ALIVE: u8 = 0b001;
+const O_RECEIVER_ALIVE: u8 = 0b010;
+const O_CANCELLED: u8 = 0b100;
+
+/// One slot of a [`OneshotPool`]. Const-constructible so a `static`
+/// array of slots can be initialized in const context.
+pub struct OneshotSlot<T: Send + 'static> {
+    chan: Channel<CriticalSectionRawMutex, T, 1>,
+    /// Woken by the sender's drop when it cancels without sending.
+    /// (The chan's internal waker handles the value-arrival path.)
+    cancel_waker: AtomicWaker,
+    /// `O_SENDER_ALIVE | O_RECEIVER_ALIVE | O_CANCELLED` bitmask.
+    state: AtomicU8,
+    /// Free-list link (1-based pool index; 0 = none).
+    next_free: AtomicUsize,
+}
+
+impl<T: Send + 'static> OneshotSlot<T> {
+    /// Const-constructible empty slot.
+    #[must_use]
+    pub const fn new() -> Self {
+        Self {
+            chan: Channel::new(),
+            cancel_waker: AtomicWaker::new(),
+            state: AtomicU8::new(0),
+            next_free: AtomicUsize::new(0),
+        }
+    }
+}
+
+impl<T: Send + 'static> Default for OneshotSlot<T> {
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+/// Reclaim hook used by [`StaticOneshotSender`] / [`StaticOneshotReceiver`]
+/// in their `Drop` impls. Erases the pool's `POOL_SIZE` so handles do
+/// not carry it.
+trait OneshotReclaim<T: Send + 'static>: Send + Sync + 'static {
+    fn release(&self, slot: &'static OneshotSlot<T>);
+}
+
+/// A pool of [`OneshotSlot`]s. Place in a `static` and call
+/// [`Self::claim`] to obtain a sender/receiver pair.
+pub struct OneshotPool<T: Send + 'static, const POOL_SIZE: usize> {
+    slots: [OneshotSlot<T>; POOL_SIZE],
+    free_head: BlockingMutex<CriticalSectionRawMutex, Cell<usize>>,
+    seeded: AtomicBool,
+}
+
+impl<T: Send + 'static, const POOL_SIZE: usize> OneshotPool<T, POOL_SIZE> {
+    /// Const-constructible empty pool. Free-list is seeded lazily on
+    /// the first [`Self::claim`].
+    #[must_use]
+    pub const fn new() -> Self {
+        Self {
+            slots: [const { OneshotSlot::new() }; POOL_SIZE],
+            free_head: BlockingMutex::new(Cell::new(0)),
+            seeded: AtomicBool::new(false),
+        }
+    }
+
+    /// Try to obtain a fresh sender/receiver pair. Returns `None` if
+    /// the pool is exhausted.
+    pub fn claim(&'static self) -> Option<(StaticOneshotSender<T>, StaticOneshotReceiver<T>)> {
+        self.ensure_seeded();
+        let slot = self.pop_free()?;
+        slot.state
+            .store(O_SENDER_ALIVE | O_RECEIVER_ALIVE, Ordering::Release);
+        // No stale value should be in the channel (we drained on
+        // release), but be defensive.
+        let _ = slot.chan.try_receive();
+        Some((
+            StaticOneshotSender {
+                slot,
+                pool: self,
+                sent: false,
+            },
+            StaticOneshotReceiver { slot, pool: self },
+        ))
+    }
+
+    fn ensure_seeded(&self) {
+        // Seed the free list under the same mutex `pop_free` takes, so a
+        // racing claimer cannot win the mutex between our (won) CAS and
+        // our `free_head.lock(|h| h.set(1))` and observe `head == 0`.
+        // The `seeded` atomic is only an optimisation — once true, we
+        // skip the mutex acquire entirely.
+        if self.seeded.load(Ordering::Acquire) {
+            return;
+        }
+        self.free_head.lock(|h| {
+            // Re-check under the mutex; another claimer may have seeded
+            // while we were contending for it.
+            if self.seeded.load(Ordering::Acquire) {
+                return;
+            }
+            // Link slots[0] -> slots[1] -> ... -> slots[N-1] -> 0.
+            for i in 0..POOL_SIZE {
+                let next = if i + 1 < POOL_SIZE { i + 2 } else { 0 };
+                self.slots[i].next_free.store(next, Ordering::Release);
+            }
+            h.set(1);
+            self.seeded.store(true, Ordering::Release);
+        });
+    }
+
+    fn pop_free(&self) -> Option<&OneshotSlot<T>> {
+        self.free_head.lock(|h| {
+            let head = h.get();
+            if head == 0 {
+                return None;
+            }
+            let slot = &self.slots[head - 1];
+            let next = slot.next_free.load(Ordering::Acquire);
+            h.set(next);
+            slot.next_free.store(0, Ordering::Release);
+            Some(slot)
+        })
+    }
+}
+
+impl<T: Send + 'static, const POOL_SIZE: usize> Default for OneshotPool<T, POOL_SIZE> {
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+impl<T: Send + 'static, const POOL_SIZE: usize> OneshotReclaim<T> for OneshotPool<T, POOL_SIZE> {
+    fn release(&self, slot: &'static OneshotSlot<T>) {
+        let base = self.slots.as_ptr() as usize;
+        let here = core::ptr::from_ref::<OneshotSlot<T>>(slot) as usize;
+        let stride = core::mem::size_of::<OneshotSlot<T>>();
+        debug_assert!(stride > 0, "OneshotSlot must be sized");
+        debug_assert!(here >= base);
+        let idx = (here - base) / stride;
+        debug_assert!(idx < POOL_SIZE, "slot does not belong to this pool");
+        // Drop any stale value still in the channel.
+        let _ = slot.chan.try_receive();
+        // Overwrite any stale waker still registered by the previous
+        // tenant so the next claim's first registration does not wake
+        // (and potentially poke) a defunct task. `register` overwrites
+        // the previous slot if the new waker would-wake a different
+        // task, so registering the noop waker effectively clears it.
+        slot.cancel_waker.register(core::task::Waker::noop());
+        slot.state.store(0, Ordering::Release);
+        self.free_head.lock(|h| {
+            slot.next_free.store(h.get(), Ordering::Release);
+            h.set(idx + 1);
+        });
+    }
+}
+
+/// Send half of a static-pool oneshot.
+pub struct StaticOneshotSender<T: Send + 'static> {
+    slot: &'static OneshotSlot<T>,
+    pool: &'static dyn OneshotReclaim<T>,
+    sent: bool,
+}
+
+impl<T: Send + 'static> OneshotSend<T> for StaticOneshotSender<T> {
+    fn send(mut self, value: T) -> Result<(), T> {
+        // Refuse to send if the receiver has already dropped.
+        // (A subsequent receiver drop between this check and try_send
+        // is harmless — the value lands in the slot and is drained on
+        // slot release.)
+        if self.slot.state.load(Ordering::Acquire) & O_RECEIVER_ALIVE == 0 {
+            return Err(value);
+        }
+        match self.slot.chan.try_send(value) {
+            Ok(()) => {
+                self.sent = true;
+                Ok(())
+            }
+            Err(embassy_sync::channel::TrySendError::Full(v)) => Err(v),
+        }
+    }
+}
+
+impl<T: Send + 'static> Drop for StaticOneshotSender<T> {
+    fn drop(&mut self) {
+        if !self.sent {
+            self.slot.state.fetch_or(O_CANCELLED, Ordering::AcqRel);
+            self.slot.cancel_waker.wake();
+        }
+        let prev = self.slot.state.fetch_and(!O_SENDER_ALIVE, Ordering::AcqRel);
+        let after = prev & !O_SENDER_ALIVE;
+        if (after & O_RECEIVER_ALIVE) == 0 {
+            self.pool.release(self.slot);
+        }
+    }
+}
+
+/// Receive half of a static-pool oneshot.
+pub struct StaticOneshotReceiver<T: Send + 'static> {
+    slot: &'static OneshotSlot<T>,
+    pool: &'static dyn OneshotReclaim<T>,
+}
+
+impl<T: Send + 'static> OneshotRecv<T> for StaticOneshotReceiver<T> {
+    async fn recv(self) -> Result<T, OneshotCancelled> {
+        let slot = self.slot;
+        let result = poll_fn(move |cx| {
+            // 1. Try the channel first.
+            if let Ok(v) = slot.chan.try_receive() {
+                return Poll::Ready(Ok(v));
+            }
+            // 2. Check cancellation.
+            if slot.state.load(Ordering::Acquire) & O_CANCELLED != 0 {
+                return Poll::Ready(Err(OneshotCancelled));
+            }
+            // 3. Register on the cancel waker.
+            slot.cancel_waker.register(cx.waker());
+            // 4. Register on the channel's internal waker by polling
+            //    a transient receive future. embassy-sync registers
+            //    the waker on poll and does not unregister on drop.
+            {
+                let mut fut = slot.chan.receive();
+                // SAFETY: `fut` is stack-pinned, polled exactly
+                // once, then dropped before this scope ends. No
+                // reference to `fut` escapes.
+                let pinned = unsafe { Pin::new_unchecked(&mut fut) };
+                if let Poll::Ready(v) = pinned.poll(cx) {
+                    return Poll::Ready(Ok(v));
+                }
+            }
+            // 5. Final re-check to close the lost-wakeup window
+            //    between the early try_receive and the waker
+            //    registrations.
+            if let Ok(v) = slot.chan.try_receive() {
+                return Poll::Ready(Ok(v));
+            }
+            if slot.state.load(Ordering::Acquire) & O_CANCELLED != 0 {
+                return Poll::Ready(Err(OneshotCancelled));
+            }
+            Poll::Pending
+        })
+        .await;
+        // `self` drops here on return, running receiver-side bookkeeping.
+        drop(self);
+        result
+    }
+}
+
+impl<T: Send + 'static> Drop for StaticOneshotReceiver<T> {
+    fn drop(&mut self) {
+        let prev = self
+            .slot
+            .state
+            .fetch_and(!O_RECEIVER_ALIVE, Ordering::AcqRel);
+        let after = prev & !O_RECEIVER_ALIVE;
+        if (after & O_SENDER_ALIVE) == 0 {
+            self.pool.release(self.slot);
+        }
+    }
+}
+
+// ── Mpsc (bounded + unbounded share the slot/pool machinery) ──────────
+
+/// One slot of an [`MpscPool`]. Const-constructible.
+///
+/// Used by both bounded ([`StaticBoundedSender`] /
+/// [`StaticBoundedReceiver`]) and unbounded ([`StaticUnboundedSender`]
+/// / [`StaticUnboundedReceiver`]) pools — the public sender/receiver
+/// types differ, but the slot machinery is shared.
+pub struct MpscSlot<T: Send + 'static, const SLOT_CAP: usize> {
+    chan: Channel<CriticalSectionRawMutex, T, SLOT_CAP>,
+    /// Wakes the receiver on close.
+    close_waker: AtomicWaker,
+    /// Wakes senders that are `await`ing on a full channel when the
+    /// receiver drops. Multi-slot so all cloned senders blocked on a
+    /// full channel are unblocked on close — a single `AtomicWaker`
+    /// would deadlock the non-most-recent senders permanently.
+    send_wakers:
+        BlockingMutex<CriticalSectionRawMutex, RefCell<MultiWakerRegistration<SEND_WAKER_CAP>>>,
+    /// Number of live senders (clones) + 1 if receiver is alive.
+    /// 0 → slot returns to free list.
+    refcount: AtomicUsize,
+    /// Set when the last sender drops while receiver is still alive,
+    /// so the receiver's `recv()` resolves to `None`. Also set when the
+    /// receiver drops, so subsequent sender ops return `Err`.
+    closed: AtomicBool,
+    next_free: AtomicUsize,
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> MpscSlot<T, SLOT_CAP> {
+    /// Const-constructible empty slot.
+    #[must_use]
+    pub const fn new() -> Self {
+        Self {
+            chan: Channel::new(),
+            close_waker: AtomicWaker::new(),
+            send_wakers: BlockingMutex::new(RefCell::new(MultiWakerRegistration::new())),
+            refcount: AtomicUsize::new(0),
+            closed: AtomicBool::new(false),
+            next_free: AtomicUsize::new(0),
+        }
+    }
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> Default for MpscSlot<T, SLOT_CAP> {
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+trait MpscReclaim<T: Send + 'static, const SLOT_CAP: usize>: Send + Sync + 'static {
+    fn release(&self, slot: &'static MpscSlot<T, SLOT_CAP>);
+}
+
+/// A pool of [`MpscSlot`]s. Place in a `static` and call
+/// [`Self::claim_bounded`] or [`Self::claim_unbounded`].
+pub struct MpscPool<T: Send + 'static, const POOL_SIZE: usize, const SLOT_CAP: usize> {
+    slots: [MpscSlot<T, SLOT_CAP>; POOL_SIZE],
+    free_head: BlockingMutex<CriticalSectionRawMutex, Cell<usize>>,
+    seeded: AtomicBool,
+}
+
+impl<T: Send + 'static, const POOL_SIZE: usize, const SLOT_CAP: usize>
+    MpscPool<T, POOL_SIZE, SLOT_CAP>
+{
+    /// Const-constructible empty pool.
+    #[must_use]
+    pub const fn new() -> Self {
+        Self {
+            slots: [const { MpscSlot::new() }; POOL_SIZE],
+            free_head: BlockingMutex::new(Cell::new(0)),
+            seeded: AtomicBool::new(false),
+        }
+    }
+
+    /// Claim a slot for use as a bounded MPSC channel.
+    pub fn claim_bounded(
+        &'static self,
+    ) -> Option<(
+        StaticBoundedSender<T, SLOT_CAP>,
+        StaticBoundedReceiver<T, SLOT_CAP>,
+    )> {
+        let slot = self.claim_inner()?;
+        Some((
+            StaticBoundedSender { slot, pool: self },
+            StaticBoundedReceiver { slot, pool: self },
+        ))
+    }
+
+    /// Claim a slot for use as an unbounded MPSC channel. (Embassy-sync
+    /// has no truly unbounded channel; this uses `SLOT_CAP` as the
+    /// effective capacity.)
+    pub fn claim_unbounded(
+        &'static self,
+    ) -> Option<(
+        StaticUnboundedSender<T, SLOT_CAP>,
+        StaticUnboundedReceiver<T, SLOT_CAP>,
+    )> {
+        let slot = self.claim_inner()?;
+        Some((
+            StaticUnboundedSender { slot, pool: self },
+            StaticUnboundedReceiver { slot, pool: self },
+        ))
+    }
+
+    fn claim_inner(&'static self) -> Option<&'static MpscSlot<T, SLOT_CAP>> {
+        self.ensure_seeded();
+        let slot = self.pop_free()?;
+        slot.refcount.store(2, Ordering::Release); // 1 sender + 1 receiver.
+        slot.closed.store(false, Ordering::Release);
+        // Defensive: drain any stale value.
+        while slot.chan.try_receive().is_ok() {}
+        Some(slot)
+    }
+
+    fn ensure_seeded(&self) {
+        // See `OneshotPool::ensure_seeded` for the rationale: seeding
+        // must happen under the same mutex `pop_free` takes, otherwise a
+        // racing claimer can win the mutex first and observe an empty
+        // free list.
+        if self.seeded.load(Ordering::Acquire) {
+            return;
+        }
+        self.free_head.lock(|h| {
+            if self.seeded.load(Ordering::Acquire) {
+                return;
+            }
+            for i in 0..POOL_SIZE {
+                let next = if i + 1 < POOL_SIZE { i + 2 } else { 0 };
+                self.slots[i].next_free.store(next, Ordering::Release);
+            }
+            h.set(1);
+            self.seeded.store(true, Ordering::Release);
+        });
+    }
+
+    fn pop_free(&self) -> Option<&MpscSlot<T, SLOT_CAP>> {
+        self.free_head.lock(|h| {
+            let head = h.get();
+            if head == 0 {
+                return None;
+            }
+            let slot = &self.slots[head - 1];
+            let next = slot.next_free.load(Ordering::Acquire);
+            h.set(next);
+            slot.next_free.store(0, Ordering::Release);
+            Some(slot)
+        })
+    }
+}
+
+impl<T: Send + 'static, const POOL_SIZE: usize, const SLOT_CAP: usize> Default
+    for MpscPool<T, POOL_SIZE, SLOT_CAP>
+{
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+impl<T: Send + 'static, const POOL_SIZE: usize, const SLOT_CAP: usize> MpscReclaim<T, SLOT_CAP>
+    for MpscPool<T, POOL_SIZE, SLOT_CAP>
+{
+    fn release(&self, slot: &'static MpscSlot<T, SLOT_CAP>) {
+        let base = self.slots.as_ptr() as usize;
+        let here = core::ptr::from_ref::<MpscSlot<T, SLOT_CAP>>(slot) as usize;
+        let stride = core::mem::size_of::<MpscSlot<T, SLOT_CAP>>();
+        debug_assert!(stride > 0);
+        debug_assert!(here >= base);
+        let idx = (here - base) / stride;
+        debug_assert!(idx < POOL_SIZE);
+        while slot.chan.try_receive().is_ok() {}
+        // Overwrite any stale wakers still registered by the previous
+        // tenant so the next claim's first registration does not poke
+        // a defunct task.
+        slot.close_waker.register(core::task::Waker::noop());
+        slot.send_wakers.lock(|w| w.borrow_mut().wake());
+        slot.refcount.store(0, Ordering::Release);
+        slot.closed.store(false, Ordering::Release);
+        self.free_head.lock(|h| {
+            slot.next_free.store(h.get(), Ordering::Release);
+            h.set(idx + 1);
+        });
+    }
+}
+
+// ── Bounded MPSC handles ──────────────────────────────────────────────
+
+/// Bounded sender backed by a [`MpscPool`]. `Clone` increments the
+/// slot's sender refcount; the receiver's `recv()` resolves to `None`
+/// only after every clone (and the original) has been dropped.
+pub struct StaticBoundedSender<T: Send + 'static, const SLOT_CAP: usize> {
+    slot: &'static MpscSlot<T, SLOT_CAP>,
+    pool: &'static dyn MpscReclaim<T, SLOT_CAP>,
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> Clone for StaticBoundedSender<T, SLOT_CAP> {
+    fn clone(&self) -> Self {
+        self.slot.refcount.fetch_add(1, Ordering::AcqRel);
+        Self {
+            slot: self.slot,
+            pool: self.pool,
+        }
+    }
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> Drop for StaticBoundedSender<T, SLOT_CAP> {
+    fn drop(&mut self) {
+        // If we are the last sender (and receiver is alive — i.e.
+        // refcount goes from 2→1 with the receiver-bit being the
+        // remaining one), set closed + wake.
+        let prev = self.slot.refcount.fetch_sub(1, Ordering::AcqRel);
+        if prev == 2 {
+            // Could be either "last sender, receiver alive" (we want
+            // to close+wake) or "last receiver, sender alive" (no
+            // close/wake — that's the receiver's drop). To
+            // distinguish, set closed before decrementing? Simpler:
+            // set closed unconditionally here. If the receiver was
+            // the one that just dropped, `closed` is meaningless —
+            // the slot will be reclaimed when refcount hits 0.
+            self.slot.closed.store(true, Ordering::Release);
+            self.slot.close_waker.wake();
+        } else if prev == 1 {
+            self.pool.release(self.slot);
+        }
+    }
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> MpscSend<T> for StaticBoundedSender<T, SLOT_CAP> {
+    async fn send(&self, value: T) -> Result<(), ()> {
+        let slot = self.slot;
+        // Fast path: receiver already gone.
+        if slot.closed.load(Ordering::Acquire) {
+            return Err(());
+        }
+        // Pin the embassy SendFuture on the stack so it survives
+        // across yields without losing the captured value. Race it
+        // against the closed flag via send_wakers.
+        let mut send_fut = core::pin::pin!(slot.chan.send(value));
+        poll_fn(|cx| {
+            // If the receiver is already closed, report Err(()). A
+            // send that polls Ready before the closed check returns
+            // Ok(()), even if close happened concurrently after the
+            // pre-poll check.
+            if slot.closed.load(Ordering::Acquire) {
+                return Poll::Ready(Err(()));
+            }
+            match send_fut.as_mut().poll(cx) {
+                Poll::Ready(()) => Poll::Ready(Ok(())),
+                Poll::Pending => {
+                    // Register on send_wakers so a receiver drop wakes
+                    // *all* awaiting senders, not just the most-recent.
+                    // The embassy SendFuture has separately registered
+                    // on the channel's internal waker.
+                    slot.send_wakers
+                        .lock(|w| w.borrow_mut().register(cx.waker()));
+                    // Re-check closed after registering, to close the
+                    // lost-wakeup window.
+                    if slot.closed.load(Ordering::Acquire) {
+                        return Poll::Ready(Err(()));
+                    }
+                    Poll::Pending
+                }
+            }
+        })
+        .await
+    }
+}
+
+/// Bounded receiver backed by a [`MpscPool`].
+pub struct StaticBoundedReceiver<T: Send + 'static, const SLOT_CAP: usize> {
+    slot: &'static MpscSlot<T, SLOT_CAP>,
+    pool: &'static dyn MpscReclaim<T, SLOT_CAP>,
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> Drop for StaticBoundedReceiver<T, SLOT_CAP> {
+    fn drop(&mut self) {
+        // Receiver gone — mark closed and wake every pending sender
+        // that's awaiting on a full channel. The send-side poll_fn
+        // races the wake against the closed flag and observes Err.
+        // Multi-waker so cloned senders are all woken, not just the
+        // most-recently-registered one.
+        self.slot.closed.store(true, Ordering::Release);
+        self.slot.send_wakers.lock(|w| w.borrow_mut().wake());
+        let prev = self.slot.refcount.fetch_sub(1, Ordering::AcqRel);
+        if prev == 1 {
+            self.pool.release(self.slot);
+        }
+    }
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> MpscRecv<T> for StaticBoundedReceiver<T, SLOT_CAP> {
+    fn recv(&mut self) -> impl Future<Output = Option<T>> + Send + '_ {
+        let slot = self.slot;
+        async move { mpsc_recv_inner(slot).await }
+    }
+
+    fn poll_recv(&mut self, cx: &mut core::task::Context<'_>) -> core::task::Poll<Option<T>> {
+        mpsc_poll_recv(self.slot, cx)
+    }
+}
+
+// ── Unbounded MPSC handles ────────────────────────────────────────────
+
+/// Unbounded sender — `send_now` returns `Err(value)` on a full slot
+/// rather than blocking. Pool sizing must be generous enough that the
+/// fixed-capacity slot is effectively unbounded for the workload; the
+/// crate's existing Tokio path uses 128 as the default.
+pub struct StaticUnboundedSender<T: Send + 'static, const SLOT_CAP: usize> {
+    slot: &'static MpscSlot<T, SLOT_CAP>,
+    pool: &'static dyn MpscReclaim<T, SLOT_CAP>,
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> Clone for StaticUnboundedSender<T, SLOT_CAP> {
+    fn clone(&self) -> Self {
+        self.slot.refcount.fetch_add(1, Ordering::AcqRel);
+        Self {
+            slot: self.slot,
+            pool: self.pool,
+        }
+    }
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> Drop for StaticUnboundedSender<T, SLOT_CAP> {
+    fn drop(&mut self) {
+        let prev = self.slot.refcount.fetch_sub(1, Ordering::AcqRel);
+        if prev == 2 {
+            self.slot.closed.store(true, Ordering::Release);
+            self.slot.close_waker.wake();
+        } else if prev == 1 {
+            self.pool.release(self.slot);
+        }
+    }
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> UnboundedSend<T>
+    for StaticUnboundedSender<T, SLOT_CAP>
+{
+    fn send_now(&self, value: T) -> Result<(), T> {
+        // Refuse to push into a slot whose receiver has dropped, AND
+        // reject `Full` from the underlying channel. The trait's
+        // unified `Result<(), T>` does not distinguish "closed" from
+        // "full" — callers that need to retry on transient fullness
+        // should size `SLOT_CAP` so they do not happen, since the
+        // unbounded sender only differs from the bounded one in its
+        // non-await contract; both can fail with `Err(value)` here.
+        if self.slot.closed.load(Ordering::Acquire) {
+            return Err(value);
+        }
+        self.slot.chan.try_send(value).map_err(|e| match e {
+            embassy_sync::channel::TrySendError::Full(v) => v,
+        })
+    }
+}
+
+/// Unbounded receiver.
+pub struct StaticUnboundedReceiver<T: Send + 'static, const SLOT_CAP: usize> {
+    slot: &'static MpscSlot<T, SLOT_CAP>,
+    pool: &'static dyn MpscReclaim<T, SLOT_CAP>,
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> Drop for StaticUnboundedReceiver<T, SLOT_CAP> {
+    fn drop(&mut self) {
+        self.slot.closed.store(true, Ordering::Release);
+        // Unbounded send_now never awaits, but we still wake
+        // send_wakers so any bounded sender on a slot that was reused
+        // for unbounded duty observes the close. Cheap and safe.
+        self.slot.send_wakers.lock(|w| w.borrow_mut().wake());
+        let prev = self.slot.refcount.fetch_sub(1, Ordering::AcqRel);
+        if prev == 1 {
+            self.pool.release(self.slot);
+        }
+    }
+}
+
+impl<T: Send + 'static, const SLOT_CAP: usize> UnboundedRecv<T>
+    for StaticUnboundedReceiver<T, SLOT_CAP>
+{
+    fn recv(&mut self) -> impl Future<Output = Option<T>> + Send + '_ {
+        let slot = self.slot;
+        async move { mpsc_recv_inner(slot).await }
+    }
+}
+
+// ── Shared MPSC recv plumbing ─────────────────────────────────────────
+
+async fn mpsc_recv_inner<T: Send + 'static, const SLOT_CAP: usize>(
+    slot: &'static MpscSlot<T, SLOT_CAP>,
+) -> Option<T> {
+    poll_fn(|cx| mpsc_poll_recv(slot, cx)).await
+}
+
+fn mpsc_poll_recv<T: Send + 'static, const SLOT_CAP: usize>(
+    slot: &'static MpscSlot<T, SLOT_CAP>,
+    cx: &mut core::task::Context<'_>,
+) -> core::task::Poll<Option<T>> {
+    if let Ok(v) = slot.chan.try_receive() {
+        return Poll::Ready(Some(v));
+    }
+    if slot.closed.load(Ordering::Acquire) {
+        // Drain race: a sender may have pushed a final value
+        // concurrently with closing.
+        if let Ok(v) = slot.chan.try_receive() {
+            return Poll::Ready(Some(v));
+        }
+        return Poll::Ready(None);
+    }
+    slot.close_waker.register(cx.waker());
+    {
+        let mut fut = slot.chan.receive();
+        // SAFETY: `fut` is stack-pinned, polled once, then dropped.
+        let pinned = unsafe { Pin::new_unchecked(&mut fut) };
+        if let Poll::Ready(v) = pinned.poll(cx) {
+            return Poll::Ready(Some(v));
+        }
+    }
+    if let Ok(v) = slot.chan.try_receive() {
+        return Poll::Ready(Some(v));
+    }
+    if slot.closed.load(Ordering::Acquire) {
+        if let Ok(v) = slot.chan.try_receive() {
+            return Poll::Ready(Some(v));
+        }
+        return Poll::Ready(None);
+    }
+    Poll::Pending
+}
+
+// ── Debug impls ───────────────────────────────────────────────────────
+
+impl<T: Send + 'static> core::fmt::Debug for OneshotSlot<T> {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        f.debug_struct("OneshotSlot")
+            .field("state", &self.state)
+            .finish_non_exhaustive()
+    }
+}
+
+impl<T: Send + 'static, const N: usize> core::fmt::Debug for OneshotPool<T, N> {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        f.debug_struct("OneshotPool").finish_non_exhaustive()
+    }
+}
+
+impl<T: Send + 'static> core::fmt::Debug for StaticOneshotSender<T> {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        f.debug_struct("StaticOneshotSender")
+            .field("sent", &self.sent)
+            .finish_non_exhaustive()
+    }
+}
+
+impl<T: Send + 'static> core::fmt::Debug for StaticOneshotReceiver<T> {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        f.debug_struct("StaticOneshotReceiver")
+            .finish_non_exhaustive()
+    }
+}
+
+impl<T: Send + 'static, const N: usize> core::fmt::Debug for MpscSlot<T, N> {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        f.debug_struct("MpscSlot")
+            .field("refcount", &self.refcount)
+            .field("closed", &self.closed)
+            .finish_non_exhaustive()
+    }
+}
+
+impl<T: Send + 'static, const P: usize, const N: usize> core::fmt::Debug for MpscPool<T, P, N> {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        f.debug_struct("MpscPool").finish_non_exhaustive()
+    }
+}
+
+impl<T: Send + 'static, const N: usize> core::fmt::Debug for StaticBoundedSender<T, N> {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        f.debug_struct("StaticBoundedSender")
+            .finish_non_exhaustive()
+    }
+}
+
+impl<T: Send + 'static, const N: usize> core::fmt::Debug for StaticBoundedReceiver<T, N> {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        f.debug_struct("StaticBoundedReceiver")
+            .finish_non_exhaustive()
+    }
+}
+
+impl<T: Send + 'static, const N: usize> core::fmt::Debug for StaticUnboundedSender<T, N> {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        f.debug_struct("StaticUnboundedSender")
+            .finish_non_exhaustive()
+    }
+}
+
+impl<T: Send + 'static, const N: usize> core::fmt::Debug for StaticUnboundedReceiver<T, N> {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        f.debug_struct("StaticUnboundedReceiver")
+            .finish_non_exhaustive()
+    }
+}
+
+// ── `define_static_channels!` macro ───────────────────────────────────
+
+/// Default slot capacity for unbounded channels declared via
+/// [`define_static_channels!`](crate::define_static_channels). Matches the value used by the
+/// embassy-sync-backed `EmbassySyncChannels::unbounded`. Each
+/// unbounded `T` declared in the macro gets its own `MpscPool`
+/// sized at `pool_size × UNBOUNDED_DEFAULT_CAP`.
+pub const UNBOUNDED_DEFAULT_CAP: usize = 128;
+
+/// Generates a no-alloc [`ChannelFactory`] from a user-authored pool
+/// layout.
+///
+/// [`ChannelFactory`]: crate::transport::ChannelFactory
+///
+/// The macro emits:
+/// - A unit struct `pub struct $name;` implementing
+///   [`ChannelFactory`] with associated types pointing at this
+///   module's [`StaticOneshotSender`] / `StaticBoundedSender` /
+///   `StaticUnboundedSender` (and matching receivers).
+/// - One `impl OneshotPooled<$name> for T` per `oneshot` entry,
+///   wrapping a function-local `static OneshotPool<T, POOL_SIZE>`.
+/// - One `impl BoundedPooled<$name, SLOT_CAP> for T` per `bounded`
+///   entry.
+/// - One `impl UnboundedPooled<$name> for T` per `unbounded` entry,
+///   each backed by an `MpscPool<T, POOL_SIZE,
+///   UNBOUNDED_DEFAULT_CAP>`.
+///
+/// Pool exhaustion in the generated `*_pair()` impls is reported
+/// via `expect()` (see module-level docs).
+///
+/// # Example
+///
+/// ```ignore
+/// use simple_someip::define_static_channels;
+///
+/// define_static_channels! {
+///     name: MyChannels,
+///     oneshot: [
+///         (Result<(), MyError>, 80),
+///         (RebootResponse, 4),
+///     ],
+///     bounded: [
+///         ((ControlMessage<P, MyChannels>, 4), 1),
+///         ((SendMessage<P, MyChannels>, 16), 8),
+///     ],
+///     unbounded: [
+///         (ClientUpdate<P>, 1),
+///     ],
+/// }
+/// ```
+///
+/// All three sections are required; pass an empty `[]` if a family
+/// has no entries. The bounded entry shape is
+/// `((Type, slot_cap), pool_size)` to disambiguate the slot cap
+/// from the pool size in the macro grammar.
+#[macro_export]
+macro_rules! define_static_channels {
+    // Entry point: explicit visibility.
+    ( vis: $vis:vis, name: $name:ident, $($rest:tt)* ) => {
+        $crate::define_static_channels! { @body $vis, $name, $($rest)* }
+    };
+    // Entry point: no visibility token — default to `pub`.
+    ( name: $name:ident, $($rest:tt)* ) => {
+        $crate::define_static_channels! { @body pub, $name, $($rest)* }
+    };
+    (
+        @body $vis:vis, $name:ident,
+        oneshot: [ $( ($ot:ty, $opool:literal) ),* $(,)? ],
+        bounded: [ $( (($bt:ty, $bcap:literal), $bpool:literal) ),* $(,)? ],
+        unbounded: [ $( ($ut:ty, $upool:literal) ),* $(,)? ] $(,)?
+    ) => {
+        #[derive(Clone, Copy, Debug)]
+        $vis struct $name;
+
+        impl $crate::transport::ChannelFactory for $name {
+            type OneshotSender<T: ::core::marker::Send + 'static> =
+                $crate::static_channels::StaticOneshotSender<T>;
+            type OneshotReceiver<T: ::core::marker::Send + 'static> =
+                $crate::static_channels::StaticOneshotReceiver<T>;
+            type BoundedSender<T: ::core::marker::Send + 'static, const N: usize> =
+                $crate::static_channels::StaticBoundedSender<T, N>;
+            type BoundedReceiver<T: ::core::marker::Send + 'static, const N: usize> =
+                $crate::static_channels::StaticBoundedReceiver<T, N>;
+            type UnboundedSender<T: ::core::marker::Send + 'static> =
+                $crate::static_channels::StaticUnboundedSender<
+                    T,
+                    { $crate::static_channels::UNBOUNDED_DEFAULT_CAP },
+                >;
+            type UnboundedReceiver<T: ::core::marker::Send + 'static> =
+                $crate::static_channels::StaticUnboundedReceiver<
+                    T,
+                    { $crate::static_channels::UNBOUNDED_DEFAULT_CAP },
+                >;
+        }
+
+        $(
+            impl $crate::transport::OneshotPooled<$name> for $ot {
+                fn oneshot_pair() -> (
+                    <$name as $crate::transport::ChannelFactory>::OneshotSender<Self>,
+                    <$name as $crate::transport::ChannelFactory>::OneshotReceiver<Self>,
+                ) {
+                    static POOL: $crate::static_channels::OneshotPool<$ot, $opool> =
+                        $crate::static_channels::OneshotPool::new();
+                    POOL.claim().expect(::core::concat!(
+                        "OneshotPool<",
+                        ::core::stringify!($ot),
+                        ", ",
+                        ::core::stringify!($opool),
+                        "> exhausted; increase the pool size declared in define_static_channels!"
+                    ))
+                }
+            }
+        )*
+
+        $(
+            impl $crate::transport::BoundedPooled<$name, $bcap> for $bt {
+                fn bounded_pair() -> (
+                    <$name as $crate::transport::ChannelFactory>::BoundedSender<Self, $bcap>,
+                    <$name as $crate::transport::ChannelFactory>::BoundedReceiver<Self, $bcap>,
+                ) {
+                    static POOL: $crate::static_channels::MpscPool<$bt, $bpool, $bcap> =
+                        $crate::static_channels::MpscPool::new();
+                    POOL.claim_bounded().expect(::core::concat!(
+                        "MpscPool<",
+                        ::core::stringify!($bt),
+                        ", pool=",
+                        ::core::stringify!($bpool),
+                        ", slot_cap=",
+                        ::core::stringify!($bcap),
+                        "> exhausted; increase the pool size declared in define_static_channels!"
+                    ))
+                }
+            }
+        )*
+
+        $(
+            impl $crate::transport::UnboundedPooled<$name> for $ut {
+                fn unbounded_pair() -> (
+                    <$name as $crate::transport::ChannelFactory>::UnboundedSender<Self>,
+                    <$name as $crate::transport::ChannelFactory>::UnboundedReceiver<Self>,
+                ) {
+                    static POOL: $crate::static_channels::MpscPool<
+                        $ut,
+                        $upool,
+                        { $crate::static_channels::UNBOUNDED_DEFAULT_CAP },
+                    > = $crate::static_channels::MpscPool::new();
+                    POOL.claim_unbounded().expect(::core::concat!(
+                        "MpscPool<",
+                        ::core::stringify!($ut),
+                        ", pool=",
+                        ::core::stringify!($upool),
+                        ", unbounded> exhausted; increase the pool size declared in define_static_channels!"
+                    ))
+                }
+            }
+        )*
+    };
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use core::future::Future;
+    use core::pin::pin;
+    use core::task::{Context, Poll, Waker};
+    use std::boxed::Box;
+
+    fn poll_once<F: Future>(f: &mut core::pin::Pin<&mut F>) -> Poll<F::Output> {
+        let waker = Waker::noop();
+        let mut cx = Context::from_waker(waker);
+        f.as_mut().poll(&mut cx)
+    }
+
+    // ── Oneshot tests ─────────────────────────────────────────────────
+
+    static ONESHOT_POOL_4: OneshotPool<u32, 4> = OneshotPool::new();
+
+    #[test]
+    fn oneshot_send_recv_happy_path() {
+        let (tx, rx) = ONESHOT_POOL_4.claim().expect("pool not empty");
+        tx.send(42).unwrap();
+        let mut fut = pin!(rx.recv());
+        match poll_once(&mut fut) {
+            Poll::Ready(Ok(v)) => assert_eq!(v, 42),
+            other => panic!("expected ready ok, got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn oneshot_sender_drop_cancels_receiver() {
+        let (tx, rx) = ONESHOT_POOL_4.claim().expect("pool not empty");
+        drop(tx);
+        let mut fut = pin!(rx.recv());
+        match poll_once(&mut fut) {
+            Poll::Ready(Err(OneshotCancelled)) => {}
+            other => panic!("expected cancelled, got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn oneshot_claim_release_cycles() {
+        static POOL: OneshotPool<u32, 4> = OneshotPool::new();
+        // Claim all 4, verify pool is exhausted, drop, re-claim.
+        let p1 = POOL.claim().unwrap();
+        let p2 = POOL.claim().unwrap();
+        let p3 = POOL.claim().unwrap();
+        let p4 = POOL.claim().unwrap();
+        assert!(POOL.claim().is_none(), "5th claim must exhaust");
+        drop((p1, p2, p3, p4));
+        let p5 = POOL.claim();
+        assert!(p5.is_some(), "post-drop claim must succeed");
+    }
+
+    #[test]
+    fn oneshot_pool_exhaustion_returns_none() {
+        static POOL_2: OneshotPool<u32, 2> = OneshotPool::new();
+        let _a = POOL_2.claim().unwrap();
+        let _b = POOL_2.claim().unwrap();
+        assert!(POOL_2.claim().is_none(), "third claim must exhaust");
+    }
+
+    /// Concurrent first-claim: two threads call `claim()` on the same
+    /// freshly-`new()`'d pool simultaneously. Both must succeed (the
+    /// pool has 8 slots). Regression for the seeding race where one
+    /// thread won the CAS and started looping while the other took
+    /// `free_head` first and observed `head == 0`.
+    #[test]
+    fn oneshot_concurrent_first_claim_does_not_panic() {
+        use std::sync::Arc;
+        use std::sync::atomic::{AtomicUsize, Ordering as O};
+        static POOL: OneshotPool<u32, 8> = OneshotPool::new();
+        let success_count = Arc::new(AtomicUsize::new(0));
+        let mut handles = std::vec::Vec::new();
+        for _ in 0..4 {
+            let s = Arc::clone(&success_count);
+            handles.push(std::thread::spawn(move || {
+                if POOL.claim().is_some() {
+                    s.fetch_add(1, O::SeqCst);
+                }
+            }));
+        }
+        for h in handles {
+            h.join().unwrap();
+        }
+        assert_eq!(
+            success_count.load(O::SeqCst),
+            4,
+            "all 4 concurrent claims should have succeeded against an 8-slot pool",
+        );
+    }
+
+    /// Multi-sender close broadcast: when the receiver drops, every
+    /// cloned sender that is awaiting a full-channel `send` must
+    /// resolve to `Err(())`. Regression for the old single-slot
+    /// `AtomicWaker` which only woke the most-recently-registered
+    /// sender.
+    #[test]
+    fn mpsc_bounded_receiver_drop_wakes_all_cloned_senders() {
+        static POOL: MpscPool<u32, 4, 1> = MpscPool::new();
+        let (tx, rx) = POOL.claim_bounded().expect("claim");
+        // Fill the channel so any further send awaits.
+        let mut filler_fut = pin!(tx.send(0));
+        match poll_once(&mut filler_fut) {
+            Poll::Ready(Ok(())) => {}
+            other => panic!("filler send should resolve immediately: {other:?}"),
+        }
+        // Three cloned senders, all awaiting on the full channel.
+        let clones: std::vec::Vec<_> = (0..3).map(|_| tx.clone()).collect();
+        let mut futs: std::vec::Vec<_> = clones
+            .iter()
+            .enumerate()
+            .map(|(i, c)| Box::pin(c.send(u32::try_from(i).unwrap() + 1)))
+            .collect();
+        for f in &mut futs {
+            // Each should park (channel is full).
+            match f.as_mut().poll(&mut Context::from_waker(Waker::noop())) {
+                Poll::Pending => {}
+                Poll::Ready(other) => panic!("expected Pending, got Ready({other:?})"),
+            }
+        }
+        drop(rx);
+        // Each cloned sender's pending future must now resolve to Err.
+        for f in &mut futs {
+            match f.as_mut().poll(&mut Context::from_waker(Waker::noop())) {
+                Poll::Ready(Err(())) => {}
+                Poll::Ready(Ok(())) => {
+                    panic!("expected Err after receiver drop on cloned sender, got Ok")
+                }
+                Poll::Pending => panic!("expected Err after receiver drop, got Pending"),
+            }
+        }
+    }
+
+    #[test]
+    fn mpsc_concurrent_first_claim_does_not_panic() {
+        use std::sync::Arc;
+        use std::sync::atomic::{AtomicUsize, Ordering as O};
+        static POOL: MpscPool<u32, 8, 4> = MpscPool::new();
+        let success_count = Arc::new(AtomicUsize::new(0));
+        let mut handles = std::vec::Vec::new();
+        for _ in 0..4 {
+            let s = Arc::clone(&success_count);
+            handles.push(std::thread::spawn(move || {
+                if POOL.claim_bounded().is_some() {
+                    s.fetch_add(1, O::SeqCst);
+                }
+            }));
+        }
+        for h in handles {
+            h.join().unwrap();
+        }
+        assert_eq!(
+            success_count.load(O::SeqCst),
+            4,
+            "all 4 concurrent claims should have succeeded against an 8-slot pool",
+        );
+    }
+
+    // ── Bounded MPSC tests ────────────────────────────────────────────
+
+    static MPSC_POOL: MpscPool<u32, 2, 4> = MpscPool::new();
+
+    #[test]
+    fn mpsc_bounded_send_recv() {
+        let (tx, mut rx) = MPSC_POOL.claim_bounded().expect("pool not empty");
+        let mut send_fut = pin!(tx.send(7));
+        assert!(matches!(poll_once(&mut send_fut), Poll::Ready(Ok(()))));
+        let mut recv_fut = pin!(rx.recv());
+        match poll_once(&mut recv_fut) {
+            Poll::Ready(Some(7)) => {}
+            other => panic!("expected ready Some(7), got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn mpsc_bounded_clone_then_drop_all_closes_receiver() {
+        static POOL: MpscPool<u32, 1, 2> = MpscPool::new();
+        let (tx, mut rx) = POOL.claim_bounded().expect("pool not empty");
+        let tx2 = tx.clone();
+        drop(tx);
+        // One clone still alive — receiver should not be closed yet.
+        {
+            let mut recv_fut = pin!(rx.recv());
+            assert!(matches!(poll_once(&mut recv_fut), Poll::Pending));
+        }
+        drop(tx2);
+        // All senders gone → receiver resolves to None.
+        let mut recv_fut = pin!(rx.recv());
+        match poll_once(&mut recv_fut) {
+            Poll::Ready(None) => {}
+            other => panic!("expected ready None, got {other:?}"),
+        }
+    }
+
+    // ── Unbounded MPSC tests ──────────────────────────────────────────
+
+    #[test]
+    fn unbounded_send_now_returns_full_when_capacity_exhausted() {
+        static POOL: MpscPool<u32, 1, 2> = MpscPool::new();
+        let (tx, _rx) = POOL.claim_unbounded().expect("pool not empty");
+        assert!(tx.send_now(1).is_ok());
+        assert!(tx.send_now(2).is_ok());
+        match tx.send_now(3) {
+            Err(3) => {}
+            other => panic!("expected Err(3), got {other:?}"),
+        }
+    }
+
+    // ── define_static_channels! macro ─────────────────────────────────
+
+    // Witness that the macro expands to a `ChannelFactory` with all
+    // three families wired and that the per-`T` `*Pooled` impls
+    // dispatch correctly.
+    crate::define_static_channels! {
+        name: MacroTestChannels,
+        oneshot: [
+            (u32, 4),
+            (Result<i32, ()>, 2),
+        ],
+        bounded: [
+            ((u8, 4), 2),
+        ],
+        unbounded: [
+            (u16, 1),
+        ],
+    }
+
+    #[test]
+    fn macro_oneshot_dispatches_through_factory() {
+        use crate::transport::{ChannelFactory, OneshotSend};
+        let (tx, rx) = MacroTestChannels::oneshot::<u32>();
+        tx.send(99).unwrap();
+        let mut fut = pin!(<_ as crate::transport::OneshotRecv<u32>>::recv(rx));
+        match poll_once(&mut fut) {
+            Poll::Ready(Ok(99)) => {}
+            other => panic!("expected ready Ok(99), got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn macro_bounded_dispatches_through_factory() {
+        use crate::transport::{ChannelFactory, MpscRecv, MpscSend};
+        let (tx, mut rx) = MacroTestChannels::bounded::<u8, 4>();
+        {
+            let mut send_fut = pin!(tx.send(7));
+            assert!(matches!(poll_once(&mut send_fut), Poll::Ready(Ok(()))));
+        }
+        let mut recv_fut = pin!(rx.recv());
+        match poll_once(&mut recv_fut) {
+            Poll::Ready(Some(7)) => {}
+            other => panic!("expected ready Some(7), got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn macro_unbounded_dispatches_through_factory() {
+        use crate::transport::{ChannelFactory, UnboundedSend};
+        let (tx, _rx) = MacroTestChannels::unbounded::<u16>();
+        assert!(tx.send_now(1234).is_ok());
+    }
+
+    // ── Waker-tracking helper ─────────────────────────────────────────
+
+    use std::sync::Arc;
+    use std::sync::atomic::{AtomicBool, Ordering as SAtomic};
+
+    struct WakeFlag(AtomicBool);
+    impl std::task::Wake for WakeFlag {
+        fn wake(self: Arc<Self>) {
+            self.0.store(true, SAtomic::Release);
+        }
+        fn wake_by_ref(self: &Arc<Self>) {
+            self.0.store(true, SAtomic::Release);
+        }
+    }
+    fn tracking_waker() -> (Arc<WakeFlag>, Waker) {
+        let flag = Arc::new(WakeFlag(AtomicBool::new(false)));
+        let waker = Waker::from(flag.clone());
+        (flag, waker)
+    }
+
+    // ── Waker firing tests ────────────────────────────────────────────
+
+    #[test]
+    fn oneshot_waker_fires_on_send() {
+        static POOL: OneshotPool<u32, 2> = OneshotPool::new();
+        let (tx, rx) = POOL.claim().expect("pool not empty");
+        let (flag, waker) = tracking_waker();
+        let mut cx = Context::from_waker(&waker);
+        let mut fut = pin!(rx.recv());
+        assert!(matches!(fut.as_mut().poll(&mut cx), Poll::Pending));
+        tx.send(42u32).unwrap();
+        assert!(
+            flag.0.load(SAtomic::Acquire),
+            "waker must fire when value is sent"
+        );
+        let noop = Waker::noop();
+        let mut cx2 = Context::from_waker(noop);
+        assert!(matches!(fut.as_mut().poll(&mut cx2), Poll::Ready(Ok(42))));
+    }
+
+    #[test]
+    fn oneshot_cancel_waker_fires_on_sender_drop() {
+        static POOL: OneshotPool<u32, 2> = OneshotPool::new();
+        let (tx, rx) = POOL.claim().expect("pool not empty");
+        let (flag, waker) = tracking_waker();
+        let mut cx = Context::from_waker(&waker);
+        let mut fut = pin!(rx.recv());
+        assert!(matches!(fut.as_mut().poll(&mut cx), Poll::Pending));
+        drop(tx);
+        assert!(
+            flag.0.load(SAtomic::Acquire),
+            "waker must fire when sender is dropped (cancel)"
+        );
+        let noop = Waker::noop();
+        let mut cx2 = Context::from_waker(noop);
+        assert!(matches!(
+            fut.as_mut().poll(&mut cx2),
+            Poll::Ready(Err(OneshotCancelled))
+        ));
+    }
+
+    #[test]
+    fn mpsc_close_waker_fires_on_all_senders_drop() {
+        static POOL: MpscPool<u32, 1, 4> = MpscPool::new();
+        let (tx, mut rx) = POOL.claim_bounded().expect("pool not empty");
+        let tx2 = tx.clone();
+        let (flag, waker) = tracking_waker();
+        let mut cx = Context::from_waker(&waker);
+        let mut fut = pin!(rx.recv());
+        assert!(matches!(fut.as_mut().poll(&mut cx), Poll::Pending));
+        drop(tx);
+        assert!(
+            !flag.0.load(SAtomic::Acquire),
+            "waker must not fire until last sender drops"
+        );
+        drop(tx2);
+        assert!(
+            flag.0.load(SAtomic::Acquire),
+            "waker must fire when last sender drops"
+        );
+        let noop = Waker::noop();
+        let mut cx2 = Context::from_waker(noop);
+        assert!(matches!(fut.as_mut().poll(&mut cx2), Poll::Ready(None)));
+    }
+
+    #[test]
+    fn mpsc_bounded_pool_exhaustion_returns_none() {
+        static POOL: MpscPool<u32, 1, 4> = MpscPool::new();
+        let _a = POOL.claim_bounded().expect("pool not empty");
+        assert!(
+            POOL.claim_bounded().is_none(),
+            "second claim must exhaust pool of size 1"
+        );
+    }
+
+    // ── Sender-side close-semantic tests ──────────────────────────────
+
+    #[test]
+    fn oneshot_send_after_receiver_drop_returns_err() {
+        static POOL: OneshotPool<u32, 2> = OneshotPool::new();
+        let (tx, rx) = POOL.claim().expect("pool not empty");
+        drop(rx);
+        match tx.send(42) {
+            Err(42) => {}
+            other => panic!("expected Err(42) after receiver drop, got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn unbounded_send_now_after_receiver_drop_returns_err() {
+        static POOL: MpscPool<u32, 1, 4> = MpscPool::new();
+        let (tx, rx) = POOL.claim_unbounded().expect("pool not empty");
+        drop(rx);
+        match tx.send_now(7) {
+            Err(7) => {}
+            other => panic!("expected Err(7) after receiver drop, got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn bounded_send_unblocks_with_err_on_receiver_drop() {
+        static POOL: MpscPool<u32, 1, 1> = MpscPool::new();
+        let (tx, rx) = POOL.claim_bounded().expect("pool not empty");
+        // Capacity is 1; fill it.
+        {
+            let mut send_fut = pin!(tx.send(1));
+            assert!(matches!(poll_once(&mut send_fut), Poll::Ready(Ok(()))));
+        }
+        // Next send must wait — channel is full.
+        let mut send_fut = pin!(tx.send(2));
+        let (flag, waker) = tracking_waker();
+        let mut cx = Context::from_waker(&waker);
+        assert!(matches!(send_fut.as_mut().poll(&mut cx), Poll::Pending));
+        // Drop the receiver — sender's send_waker must fire and the
+        // next poll must return Err(()).
+        drop(rx);
+        assert!(
+            flag.0.load(SAtomic::Acquire),
+            "send_waker must fire when receiver drops while sender is awaiting"
+        );
+        let noop = Waker::noop();
+        let mut cx2 = Context::from_waker(noop);
+        match send_fut.as_mut().poll(&mut cx2) {
+            Poll::Ready(Err(())) => {}
+            other => panic!("expected Err(()) after receiver drop, got {other:?}"),
+        }
+    }
+
+    #[test]
+    fn bounded_send_after_receiver_drop_returns_err_fast_path() {
+        static POOL: MpscPool<u32, 1, 4> = MpscPool::new();
+        let (tx, rx) = POOL.claim_bounded().expect("pool not empty");
+        drop(rx);
+        let mut send_fut = pin!(tx.send(99));
+        match poll_once(&mut send_fut) {
+            Poll::Ready(Err(())) => {}
+            other => panic!("expected Err(()) on closed slot, got {other:?}"),
+        }
+    }
+}
diff --git a/src/tokio_transport.rs b/src/tokio_transport.rs
new file mode 100644
index 0000000..e720a86
--- /dev/null
+++ b/src/tokio_transport.rs
@@ -0,0 +1,691 @@
+//! Tokio + socket2 implementation of the [`crate::transport`] traits.
+//!
+//! This is the default `std` backend. [`TokioTransport`] constructs
+//! configured [`TokioSocket`]s via `socket2` for bind-time options (reuse,
+//! multicast interface, multicast loop) and converts them to
+//! [`tokio::net::UdpSocket`] for the async I/O loop. [`TokioTimer`] is a
+//! thin wrapper over `tokio::time::sleep`.
+//!
+//! Gated behind `#[cfg(any(feature = "client-tokio", feature = "server-tokio"))]` —
+//! the `client-tokio` and `server-tokio` features are exactly the ones
+//! that pull in `tokio` and `socket2`, so no new dependency edge is
+//! introduced.
+//!
+//! # Example
+//!
+//! ```no_run
+//! # #[cfg(any(feature = "client-tokio", feature = "server-tokio"))]
+//! # async fn demo() -> Result<(), simple_someip::TransportError> {
+//! use core::net::{Ipv4Addr, SocketAddrV4};
+//! use simple_someip::{SocketOptions, TransportFactory, TransportSocket};
+//! use simple_someip::tokio_transport::TokioTransport;
+//!
+//! let factory = TokioTransport::default();
+//! let mut options = SocketOptions::new();
+//! options.reuse_address = true;
+//!
+//! let mut sock = factory
+//!     .bind(SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0), &options)
+//!     .await?;
+//! let bound = sock.local_addr()?;
+//! println!("bound to {bound}");
+//! # Ok(())
+//! # }
+//! ```
+
+use core::future::Future;
+use core::net::{Ipv4Addr, SocketAddrV4};
+use core::pin::Pin;
+use core::task::{Context, Poll};
+use core::time::Duration;
+use std::net::{IpAddr, SocketAddr};
+use tokio::io::ReadBuf;
+use tokio::net::UdpSocket;
+
+use crate::transport::{
+    ChannelFactory, IoErrorKind, MpscRecv, MpscSend, OneshotCancelled, OneshotRecv, OneshotSend,
+    ReceivedDatagram, SocketOptions, Timer, TransportError, TransportFactory, TransportSocket,
+    UnboundedRecv, UnboundedSend,
+};
+
+/// Factory that binds [`TokioSocket`]s configured via `socket2`.
+///
+/// Unit struct — all required state (the tokio runtime) is implicit in the
+/// ambient task context at call time.
+#[derive(Debug, Default, Clone, Copy)]
+pub struct TokioTransport;
+
+/// A bound UDP socket backed by [`tokio::net::UdpSocket`].
+#[derive(Debug)]
+pub struct TokioSocket {
+    inner: UdpSocket,
+}
+
+impl TokioSocket {
+    /// Read back the current value of the `IP_MULTICAST_LOOP` flag. Thin
+    /// wrapper over [`tokio::net::UdpSocket::multicast_loop_v4`], exposed
+    /// for tests that verify [`SocketOptions::multicast_loop_v4`] is
+    /// applied and for field debugging.
+    ///
+    /// # Errors
+    ///
+    /// Returns [`TransportError`] if the backend cannot read the flag.
+    #[allow(dead_code)] // used in tests; kept available for field debugging.
+    pub(crate) fn multicast_loop_v4(&self) -> Result<bool, TransportError> {
+        self.inner.multicast_loop_v4().map_err(|e| map_io_error(&e))
+    }
+}
+
+/// Sleep backed by [`tokio::time::sleep`].
+///
+/// Used internally at every periodic-tick site in the crate: the 125ms
+/// idle tick in `Inner::run_future`, the 1s announcement tick in
+/// `Server::announcement_loop`, and the user-supplied interval in
+/// `Client::sd_announcements_loop`. A bare-metal consumer swapping this
+/// out for `embassy_time` (or similar) needs to replace three references
+/// to `TokioTimer` with their own `Timer` impl — no trait rewrite
+/// required.
+#[derive(Debug, Default, Clone, Copy)]
+pub struct TokioTimer;
+
+/// [`crate::transport::Spawner`] impl that routes submitted futures
+/// to `tokio::spawn`.
+///
+/// Zero-size unit struct; every `Inner<P, TokioSpawner>` / `Client<P>`
+/// pays nothing for the abstraction (the `Inner` carries the spawner
+/// generic; `Client<P>` is a thin handle that forwards to it).
+/// Bare-metal consumers substitute their own `Spawner` via the
+/// `crate::Client::new_with_spawner_and_loopback` constructor.
+#[derive(Debug, Default, Clone, Copy)]
+pub struct TokioSpawner;
+
+/// Named future returned by [`TokioTransport::bind`].
+///
+/// `socket2::Socket::bind` is synchronous, so the body runs to
+/// completion on the first poll; the named struct exists only to
+/// satisfy the [`TransportFactory::BindFuture`] GAT on stable Rust
+/// without TAIT. Auto-derives `Send`.
+pub struct TokioBindFuture {
+    addr: SocketAddrV4,
+    options: SocketOptions,
+}
+
+impl Future for TokioBindFuture {
+    type Output = Result<TokioSocket, TransportError>;
+
+    fn poll(self: Pin<&mut Self>, _cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let addr = self.addr;
+        let options = self.options;
+        Poll::Ready(bind_with_options(addr, options).map_err(|e| map_io_error(&e)))
+    }
+}
+
+impl TransportFactory for TokioTransport {
+    type Socket = TokioSocket;
+    type BindFuture<'a> = TokioBindFuture;
+
+    fn bind<'a>(&'a self, addr: SocketAddrV4, options: &'a SocketOptions) -> Self::BindFuture<'a> {
+        TokioBindFuture {
+            addr,
+            options: *options,
+        }
+    }
+}
+
+/// Named future returned by [`TokioSocket::send_to`].
+///
+/// Drives [`tokio::net::UdpSocket::poll_send_to`] directly so the GAT
+/// associated type ([`TransportSocket::SendFuture`]) can be named on
+/// stable Rust without heap-allocating a [`futures::future::BoxFuture`]
+/// per datagram. Auto-derives `Send`.
+pub struct SendTo<'a> {
+    socket: &'a UdpSocket,
+    buf: &'a [u8],
+    target: SocketAddr,
+}
+
+impl Future for SendTo<'_> {
+    type Output = Result<(), TransportError>;
+
+    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
+        match self.socket.poll_send_to(cx, self.buf, self.target) {
+            Poll::Pending => Poll::Pending,
+            Poll::Ready(Ok(_n)) => Poll::Ready(Ok(())),
+            Poll::Ready(Err(e)) => Poll::Ready(Err(map_io_error(&e))),
+        }
+    }
+}
+
+/// Named future returned by [`TokioSocket::recv_from`].
+///
+/// Drives [`tokio::net::UdpSocket::poll_recv_from`] directly so the GAT
+/// associated type ([`TransportSocket::RecvFuture`]) can be named on
+/// stable Rust without heap-allocating a [`futures::future::BoxFuture`]
+/// per datagram. Auto-derives `Send`.
+pub struct RecvFrom<'a> {
+    socket: &'a UdpSocket,
+    buf: &'a mut [u8],
+}
+
+impl Future for RecvFrom<'_> {
+    type Output = Result<ReceivedDatagram, TransportError>;
+
+    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
+        // No self-references; safe to project to &mut Self.
+        let me = self.get_mut();
+        let mut read_buf = ReadBuf::new(me.buf);
+        match me.socket.poll_recv_from(cx, &mut read_buf) {
+            Poll::Pending => Poll::Pending,
+            Poll::Ready(Err(e)) => Poll::Ready(Err(map_io_error(&e))),
+            Poll::Ready(Ok(src)) => {
+                let n = read_buf.filled().len();
+                let source = match src {
+                    SocketAddr::V4(v4) => v4,
+                    // SOME/IP is IPv4-only; an IPv6 source on our socket is
+                    // either impossible (v4 bind) or a misconfiguration.
+                    SocketAddr::V6(_) => return Poll::Ready(Err(TransportError::Unsupported)),
+                };
+                // Caveat: `tokio::net::UdpSocket::poll_recv_from` silently
+                // truncates when the caller's `buf` is smaller than the
+                // datagram and returns only the bytes that fit — it does
+                // NOT expose a truncation flag. Surfacing a reliable
+                // `truncated: bool` here would require a platform-specific
+                // `recvmsg`/MSG_TRUNC path (libc + unsafe), which is
+                // deferred for now. Until then, this field is always
+                // `false` for the Tokio backend; callers must not rely on
+                // it for truncation detection. This is documented on
+                // `ReceivedDatagram::truncated`'s field doc.
+                Poll::Ready(Ok(ReceivedDatagram {
+                    bytes_received: n,
+                    source,
+                    truncated: false,
+                }))
+            }
+        }
+    }
+}
+
+impl TransportSocket for TokioSocket {
+    type SendFuture<'a> = SendTo<'a>;
+    type RecvFuture<'a> = RecvFrom<'a>;
+
+    fn send_to<'a>(&'a self, buf: &'a [u8], target: SocketAddrV4) -> Self::SendFuture<'a> {
+        SendTo {
+            socket: &self.inner,
+            buf,
+            target: SocketAddr::V4(target),
+        }
+    }
+
+    fn recv_from<'a>(&'a self, buf: &'a mut [u8]) -> Self::RecvFuture<'a> {
+        RecvFrom {
+            socket: &self.inner,
+            buf,
+        }
+    }
+
+    fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+        match self.inner.local_addr().map_err(|e| map_io_error(&e))? {
+            SocketAddr::V4(v4) => Ok(v4),
+            SocketAddr::V6(_) => Err(TransportError::Unsupported),
+        }
+    }
+
+    fn join_multicast_v4(&self, group: Ipv4Addr, iface: Ipv4Addr) -> Result<(), TransportError> {
+        self.inner
+            .join_multicast_v4(group, iface)
+            .map_err(|e| map_io_error(&e))
+    }
+
+    fn leave_multicast_v4(&self, group: Ipv4Addr, iface: Ipv4Addr) -> Result<(), TransportError> {
+        self.inner
+            .leave_multicast_v4(group, iface)
+            .map_err(|e| map_io_error(&e))
+    }
+}
+
+/// Named future returned by [`TokioTimer::sleep`].
+///
+/// Wraps `tokio::time::Sleep` so the [`Timer::SleepFuture`] GAT can be
+/// named on stable Rust. Auto-derives `Send`.
+pub struct TokioSleep {
+    inner: tokio::time::Sleep,
+}
+
+impl Future for TokioSleep {
+    type Output = ();
+
+    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
+        // SAFETY: structural pinning of the `inner` Sleep field. We never
+        // move out of `inner` and we project pin through it consistently.
+        let inner = unsafe { self.map_unchecked_mut(|s| &mut s.inner) };
+        inner.poll(cx).map(|()| ())
+    }
+}
+
+impl Timer for TokioTimer {
+    type SleepFuture<'a> = TokioSleep;
+
+    fn sleep(&self, duration: Duration) -> Self::SleepFuture<'_> {
+        TokioSleep {
+            inner: tokio::time::sleep(duration),
+        }
+    }
+}
+
+impl crate::transport::Spawner for TokioSpawner {
+    fn spawn(&self, future: impl Future<Output = ()> + Send + 'static) {
+        // Drop the returned `JoinHandle` — per-socket loops run until
+        // their owning `SocketManager` drops its channel ends, at
+        // which point the future completes naturally.
+        //
+        // Wrap in `catch_unwind` so a panic inside the spawned task is
+        // logged through the `tracing` pipeline that the rest of the
+        // crate uses, instead of being swallowed silently to stderr by
+        // tokio's default panic handler. The caller's
+        // `Error::SocketClosedUnexpectedly` (surfaced when the
+        // panicking task drops its channel ends) then has a
+        // corresponding diagnostic in the operator's logs.
+        use futures::FutureExt;
+        drop(tokio::spawn(async move {
+            let result = std::panic::AssertUnwindSafe(future).catch_unwind().await;
+            if let Err(payload) = result {
+                let msg = panic_payload_str(&payload);
+                tracing::error!(
+                    panic_message = msg,
+                    "spawned task panicked; channels will close",
+                );
+            }
+        }));
+    }
+}
+
+/// Best-effort extraction of a printable message from a panic payload.
+fn panic_payload_str(payload: &std::boxed::Box<dyn std::any::Any + Send>) -> &str {
+    if let Some(s) = payload.downcast_ref::<&'static str>() {
+        s
+    } else if let Some(s) = payload.downcast_ref::<std::string::String>() {
+        s.as_str()
+    } else {
+        "<non-string panic payload>"
+    }
+}
+
+/// Synchronously create and configure a UDP socket via `socket2`, then
+/// hand it to tokio. Mirrors the existing bind paths in
+/// `crate::client::socket_manager` and `crate::server` (rendered as
+/// code literals because both are feature-gated and would break
+/// default-feature rustdoc builds via broken intra-doc links) so
+/// behavior is identical.
+fn bind_with_options(addr: SocketAddrV4, options: SocketOptions) -> std::io::Result<TokioSocket> {
+    let raw = socket2::Socket::new(
+        socket2::Domain::IPV4,
+        socket2::Type::DGRAM,
+        Some(socket2::Protocol::UDP),
+    )?;
+    if options.reuse_address {
+        raw.set_reuse_address(true)?;
+    }
+    #[cfg(unix)]
+    if options.reuse_port {
+        raw.set_reuse_port(true)?;
+    }
+    if let Some(iface) = options.multicast_if_v4 {
+        raw.set_multicast_if_v4(&iface)?;
+    }
+    // Apply the multicast-loop flag whenever the caller is doing
+    // multicast (interface configured) OR explicitly asked for
+    // loop=true. Skipping the syscall only when both are unset avoids
+    // a no-op call on plain-unicast sockets while still honoring an
+    // explicit caller request.
+    if let Some(loop_v4) = options.multicast_loop_v4 {
+        raw.set_multicast_loop_v4(loop_v4)?;
+    }
+    let bind_addr = SocketAddr::new(IpAddr::V4(*addr.ip()), addr.port());
+    raw.bind(&bind_addr.into())?;
+    raw.set_nonblocking(true)?;
+    let std_sock: std::net::UdpSocket = raw.into();
+    let inner = UdpSocket::from_std(std_sock)?;
+    Ok(TokioSocket { inner })
+}
+
+/// Map a `std::io::Error` into [`TransportError`]. The mapping is
+/// conservative — anything that is not a clear match becomes
+/// [`TransportError::Io`] with [`IoErrorKind::Other`] — and is not
+/// considered stable (adding finer mappings is not a breaking change).
+///
+/// The full `std::io::Error` (raw errno, OS message, chained source) is
+/// discarded by design to keep the public [`TransportError`] enum
+/// portable and `no_std`-safe. To keep field debugging possible anyway,
+/// the original error is emitted to the tracing subscriber before
+/// mapping — at `debug!` for common steady-state conditions
+/// (`TimedOut`, `Interrupted`, `ConnectionRefused`) so they don't
+/// drown out actionable warnings under load, and at `warn!` for
+/// everything else (misconfiguration-indicating kinds like
+/// `AddrInUse` / `PermissionDenied` / `NetworkUnreachable` and the
+/// fallback `Other`). Operators should look at `warn!` lines; the
+/// `debug!` lines are there for deep-dive debugging only.
+fn map_io_error(e: &std::io::Error) -> TransportError {
+    use std::io::ErrorKind as K;
+    let kind = e.kind();
+    let mapped = match kind {
+        K::AddrInUse => TransportError::AddressInUse,
+        K::Unsupported => TransportError::Unsupported,
+        K::TimedOut => TransportError::Io(IoErrorKind::TimedOut),
+        K::Interrupted => TransportError::Io(IoErrorKind::Interrupted),
+        K::PermissionDenied => TransportError::Io(IoErrorKind::PermissionDenied),
+        K::ConnectionRefused => TransportError::Io(IoErrorKind::ConnectionRefused),
+        K::NetworkUnreachable | K::HostUnreachable => {
+            TransportError::Io(IoErrorKind::NetworkUnreachable)
+        }
+        K::WouldBlock => TransportError::Io(IoErrorKind::WouldBlock),
+        _ => TransportError::Io(IoErrorKind::Other),
+    };
+    // Log at `warn!` for unexpected / misconfiguration-indicating
+    // kinds (permission denied, address-in-use, network unreachable,
+    // fallback Other) where ops should probably look. Common
+    // steady-state conditions (timeouts, interrupted syscalls,
+    // connection refused during transient outages) drop to `debug!`
+    // so we don't drown out actionable warnings under load.
+    match kind {
+        K::TimedOut | K::Interrupted | K::ConnectionRefused => {
+            tracing::debug!(
+                "tokio transport io error: {e} (raw_os={:?}, kind={:?}) mapped to {mapped}",
+                e.raw_os_error(),
+                kind,
+            );
+        }
+        _ => {
+            tracing::warn!(
+                "tokio transport io error: {e} (raw_os={:?}, kind={:?}) mapped to {mapped}",
+                e.raw_os_error(),
+                kind,
+            );
+        }
+    }
+    mapped
+}
+
+// ── TokioChannels ─────────────────────────────────────────────────────────
+
+/// [`ChannelFactory`] implementation backed by `tokio::sync::mpsc` and
+/// `tokio::sync::oneshot`. This is the default channel backend for `std +
+/// tokio` builds (active when the `client-tokio` or `server-tokio` feature
+/// is enabled — the bare `client` / `server` features supply the
+/// trait-surface only and require a caller-provided `ChannelFactory`).
+#[derive(Clone, Copy)]
+pub struct TokioChannels;
+
+// Newtype wrappers are needed because Rust does not allow implementing a
+// foreign trait on a foreign type (orphan rule). Wrapping the tokio receiver
+// types lets us impl OneshotRecv / UnboundedRecv on them.
+
+/// Newtype wrapping `tokio::sync::oneshot::Receiver<T>` to implement
+/// [`OneshotRecv`].
+pub struct TokioOneshotReceiver<T>(pub(crate) tokio::sync::oneshot::Receiver<T>);
+
+/// Newtype wrapping `tokio::sync::mpsc::UnboundedReceiver<T>` to implement
+/// [`UnboundedRecv`].
+pub struct TokioUnboundedReceiver<T>(pub(crate) tokio::sync::mpsc::UnboundedReceiver<T>);
+
+impl<T: Send + 'static> OneshotSend<T> for tokio::sync::oneshot::Sender<T> {
+    fn send(self, value: T) -> Result<(), T> {
+        tokio::sync::oneshot::Sender::send(self, value)
+    }
+}
+
+impl<T: Send + 'static> OneshotRecv<T> for TokioOneshotReceiver<T> {
+    async fn recv(self) -> Result<T, OneshotCancelled> {
+        self.0.await.map_err(|_| OneshotCancelled)
+    }
+}
+
+impl<T: Send + 'static> MpscSend<T> for tokio::sync::mpsc::Sender<T> {
+    async fn send(&self, value: T) -> Result<(), ()> {
+        tokio::sync::mpsc::Sender::send(self, value)
+            .await
+            .map_err(|_| ())
+    }
+}
+
+impl<T: Send + 'static> MpscRecv<T> for tokio::sync::mpsc::Receiver<T> {
+    fn recv(&mut self) -> impl Future<Output = Option<T>> + Send + '_ {
+        self.recv()
+    }
+
+    fn poll_recv(&mut self, cx: &mut core::task::Context<'_>) -> core::task::Poll<Option<T>> {
+        self.poll_recv(cx)
+    }
+}
+
+impl<T: Send + 'static> UnboundedSend<T> for tokio::sync::mpsc::UnboundedSender<T> {
+    fn send_now(&self, value: T) -> Result<(), T> {
+        self.send(value).map_err(|e| e.0)
+    }
+}
+
+impl<T: Send + 'static> UnboundedRecv<T> for TokioUnboundedReceiver<T> {
+    fn recv(&mut self) -> impl Future<Output = Option<T>> + Send + '_ {
+        self.0.recv()
+    }
+}
+
+impl ChannelFactory for TokioChannels {
+    type OneshotSender<T: Send + 'static> = tokio::sync::oneshot::Sender<T>;
+    type OneshotReceiver<T: Send + 'static> = TokioOneshotReceiver<T>;
+
+    // Tokio's `mpsc` channels store capacity at runtime, so the
+    // const-generic `N` is informational only — it does not affect
+    // the stored type. Embassy-sync's impl uses `N` differently (see
+    // `embassy_channels`).
+    type BoundedSender<T: Send + 'static, const N: usize> = tokio::sync::mpsc::Sender<T>;
+    type BoundedReceiver<T: Send + 'static, const N: usize> = tokio::sync::mpsc::Receiver<T>;
+
+    type UnboundedSender<T: Send + 'static> = tokio::sync::mpsc::UnboundedSender<T>;
+    type UnboundedReceiver<T: Send + 'static> = TokioUnboundedReceiver<T>;
+
+    // The three constructor methods (`oneshot`, `bounded`, `unbounded`)
+    // use the trait's default bodies, which delegate to the per-`T`
+    // `*Pooled<TokioChannels>` blanket impls below. Tokio has a single
+    // shared allocator, so every `T: Send + 'static` is poolable; the
+    // blanket impls capture that.
+}
+
+// Blanket `*Pooled` impls for every `T: Send + 'static` against
+// `TokioChannels`. Tokio has a single shared allocator and so does not
+// need per-`T` storage — each call constructs a fresh channel.
+impl<T: Send + 'static> crate::transport::OneshotPooled<TokioChannels> for T {
+    fn oneshot_pair() -> (
+        <TokioChannels as ChannelFactory>::OneshotSender<T>,
+        <TokioChannels as ChannelFactory>::OneshotReceiver<T>,
+    ) {
+        let (tx, rx) = tokio::sync::oneshot::channel();
+        (tx, TokioOneshotReceiver(rx))
+    }
+}
+
+impl<T: Send + 'static, const N: usize> crate::transport::BoundedPooled<TokioChannels, N> for T {
+    fn bounded_pair() -> (
+        <TokioChannels as ChannelFactory>::BoundedSender<T, N>,
+        <TokioChannels as ChannelFactory>::BoundedReceiver<T, N>,
+    ) {
+        tokio::sync::mpsc::channel(N)
+    }
+}
+
+impl<T: Send + 'static> crate::transport::UnboundedPooled<TokioChannels> for T {
+    fn unbounded_pair() -> (
+        <TokioChannels as ChannelFactory>::UnboundedSender<T>,
+        <TokioChannels as ChannelFactory>::UnboundedReceiver<T>,
+    ) {
+        let (tx, rx) = tokio::sync::mpsc::unbounded_channel();
+        (tx, TokioUnboundedReceiver(rx))
+    }
+}
+
+// ── EmbassySyncChannels (extracted) ──────────────────────────────────────
+//
+// The bare-metal `ChannelFactory` impl previously lived here as a sub-
+// module. The `tokio_transport` module is now gated to `client-tokio` /
+// `server-tokio`, so a `--features client,bare_metal` build without tokio
+// could no longer reach `EmbassySyncChannels`. The impl has been moved to
+// `crate::embassy_channels` (gated by `feature = "embassy_channels"`) so
+// it is reachable from any client build.
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[tokio::test]
+    async fn bind_ephemeral_and_report_local_addr() {
+        let factory = TokioTransport;
+        let sock = factory
+            .bind(
+                SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0),
+                &SocketOptions::default(),
+            )
+            .await
+            .expect("bind");
+        let addr = sock.local_addr().expect("local_addr");
+        assert_eq!(*addr.ip(), Ipv4Addr::LOCALHOST);
+        assert_ne!(addr.port(), 0, "kernel must assign a non-zero port");
+    }
+
+    #[tokio::test]
+    async fn round_trip_send_recv_between_two_sockets() {
+        let factory = TokioTransport;
+        let opts = SocketOptions::default();
+
+        let recv = factory
+            .bind(SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0), &opts)
+            .await
+            .unwrap();
+        let recv_addr = recv.local_addr().unwrap();
+
+        let send = factory
+            .bind(SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0), &opts)
+            .await
+            .unwrap();
+
+        let payload = b"hello tokio transport";
+        send.send_to(payload, recv_addr).await.unwrap();
+
+        let mut buf = [0u8; 64];
+        let datagram = tokio::time::timeout(Duration::from_secs(2), recv.recv_from(&mut buf))
+            .await
+            .expect("recv timed out")
+            .expect("recv failed");
+
+        assert_eq!(datagram.bytes_received, payload.len());
+        assert_eq!(&buf[..datagram.bytes_received], payload);
+        assert!(!datagram.truncated);
+    }
+
+    #[tokio::test]
+    async fn reuse_address_option_allows_rebind_pattern() {
+        // Two sockets with reuse_address=true should be able to bind the
+        // same port on platforms where SO_REUSEADDR permits it (windows
+        // and linux both do for DGRAM).
+        let opts = SocketOptions {
+            reuse_address: true,
+            ..SocketOptions::default()
+        };
+
+        let factory = TokioTransport;
+        let a = factory
+            .bind(SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0), &opts)
+            .await
+            .unwrap();
+        let port = a.local_addr().unwrap().port();
+
+        // Bind a second socket with the same options; with reuse_address
+        // on, the OS allows this for UDP DGRAM on the platforms we support.
+        // If the OS refuses, fall back to a plain bind — we're not testing
+        // OS semantics here, only that the option is applied without error.
+        let b = factory
+            .bind(SocketAddrV4::new(Ipv4Addr::LOCALHOST, port), &opts)
+            .await;
+        // Either success or AddrInUse is acceptable; the assertion is
+        // that bind_with_options does not produce a different surprise
+        // (like Unsupported or a raw Io panic).
+        match b {
+            Ok(_) | Err(TransportError::AddressInUse) => {}
+            Err(other) => panic!("unexpected rebind error: {other:?}"),
+        }
+        drop(a);
+    }
+
+    #[tokio::test]
+    async fn multicast_loop_v4_option_propagates_in_both_directions() {
+        // Guards against a regression where `multicast_loop_v4` was
+        // silently ignored on a multicast bind and the socket kept the
+        // OS default, diverging from the explicit request.
+        // `bind_with_options` only applies `set_multicast_loop_v4` when
+        // `multicast_if_v4` is `Some` (a plain-unicast bind has no
+        // meaningful multicast-loop setting), so this test always pairs
+        // the loop flag with a multicast interface.
+        let factory = TokioTransport;
+
+        let opts_off = SocketOptions {
+            multicast_loop_v4: Some(false),
+            multicast_if_v4: Some(Ipv4Addr::LOCALHOST),
+            ..SocketOptions::default()
+        };
+        let sock_off = factory
+            .bind(SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0), &opts_off)
+            .await
+            .expect("bind off");
+        assert!(
+            !sock_off.multicast_loop_v4().expect("read off flag"),
+            "multicast_loop_v4=false must disable IP_MULTICAST_LOOP"
+        );
+
+        let opts_on = SocketOptions {
+            multicast_loop_v4: Some(true),
+            multicast_if_v4: Some(Ipv4Addr::LOCALHOST),
+            ..SocketOptions::default()
+        };
+        let sock_on = factory
+            .bind(SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0), &opts_on)
+            .await
+            .expect("bind on");
+        assert!(
+            sock_on.multicast_loop_v4().expect("read on flag"),
+            "multicast_loop_v4=true must enable IP_MULTICAST_LOOP"
+        );
+    }
+
+    #[tokio::test]
+    async fn timer_sleep_elapses_at_least_requested() {
+        let timer = TokioTimer;
+        let started = tokio::time::Instant::now();
+        timer.sleep(Duration::from_millis(25)).await;
+        assert!(started.elapsed() >= Duration::from_millis(25));
+    }
+
+    #[test]
+    fn map_io_error_covers_common_kinds() {
+        use std::io::{Error, ErrorKind};
+        assert!(matches!(
+            map_io_error(&Error::from(ErrorKind::AddrInUse)),
+            TransportError::AddressInUse
+        ));
+        assert!(matches!(
+            map_io_error(&Error::from(ErrorKind::TimedOut)),
+            TransportError::Io(IoErrorKind::TimedOut)
+        ));
+        assert!(matches!(
+            map_io_error(&Error::from(ErrorKind::ConnectionRefused)),
+            TransportError::Io(IoErrorKind::ConnectionRefused)
+        ));
+        assert!(matches!(
+            map_io_error(&Error::from(ErrorKind::Unsupported)),
+            TransportError::Unsupported
+        ));
+        // Fallback path
+        assert!(matches!(
+            map_io_error(&Error::from(ErrorKind::Other)),
+            TransportError::Io(IoErrorKind::Other)
+        ));
+    }
+}
diff --git a/src/traits.rs b/src/traits.rs
index abd3134..6cd8c2f 100644
--- a/src/traits.rs
+++ b/src/traits.rs
@@ -103,11 +103,14 @@ pub trait PayloadWireFormat: core::fmt::Debug + Send + Sized + Sync {
 
     /// Override the reboot flag on an SD header in-place.
     ///
-    /// Used by `Client::start_sd_announcements` (when the `client` feature is
-    /// enabled) to refresh the reboot flag per-tick from the client's tracked
-    /// state.
+    /// Used by `Client::sd_announcements_loop` (when the `client` feature is
+    /// enabled) to refresh the reboot flag per-tick from the client's
+    /// tracked state. Defaults to a no-op so that `std`-but-not-`client`
+    /// consumers (e.g. host-side tooling that builds SD headers manually
+    /// without ever driving an announcement loop) don't have to provide
+    /// an impl that will never be called.
     #[cfg(feature = "std")]
-    fn set_reboot_flag(header: &mut Self::SdHeader, reboot: sd::RebootFlag);
+    fn set_reboot_flag(_header: &mut Self::SdHeader, _reboot: sd::RebootFlag) {}
 
     /// Extract offered/stopped service endpoints from this SD payload.
     ///
diff --git a/src/transport.rs b/src/transport.rs
new file mode 100644
index 0000000..df98ae8
--- /dev/null
+++ b/src/transport.rs
@@ -0,0 +1,1478 @@
+//! Executor-agnostic transport abstraction.
+//!
+//! [`TransportSocket`] is the minimum UDP surface `simple-someip` needs from
+//! its networking backend: unicast and multicast send/recv plus a few
+//! socket-level knobs. [`TransportFactory`] constructs bound and configured
+//! sockets at startup. [`Timer`] provides async sleep.
+//!
+//! # Why a trait, and why like this
+//!
+//! The crate's `client` and `server` modules today use a tokio-based UDP
+//! backend, with sockets created/configured via `socket2` (for reuse /
+//! multicast-interface / multicast-loop options) and then handed off as
+//! `tokio::net::UdpSocket` for the async I/O loop. That works on
+//! `std + tokio` but makes no-`std` / non-tokio embedded use impossible.
+//! These traits are the integration point for alternative backends (lwIP,
+//! smoltcp, etc.).
+//!
+//! Three explicit design choices:
+//!
+//! 1. **Executor-agnostic for socket / timer I/O.** [`TransportSocket`]
+//!    and [`Timer`] methods return `impl Future`, not `async fn`, and
+//!    those traits make no statement about `Send` or `'static` bounds on
+//!    their returned futures. Callers that need those bounds (e.g. to
+//!    `tokio::spawn`) require them at the consumer site. Bare-metal
+//!    callers driving the future on a single executor task pay no `Send`
+//!    tax for socket I/O. **[`Spawner::spawn`] is the deliberate
+//!    exception:** it is a multi-task abstraction by definition, so it
+//!    requires `Send + 'static` on its argument. Single-core executors
+//!    that need a `!Send` variant (embassy with `task_arena_size = 0`,
+//!    `LocalSet`-style models) need either a future `spawn_local` shim
+//!    or a hand-rolled adapter; the `Send + 'static` bound is documented
+//!    on the trait method itself.
+//! 2. **IPv4-only address type.** This transport abstraction currently
+//!    uses [`core::net::SocketAddrV4`] directly rather than `SocketAddr`,
+//!    matching the crate's present transport-layer reach for unicast and
+//!    the standard SD IPv4 multicast address
+//!    ([`crate::protocol::sd::MULTICAST_IP`], `239.255.0.255`). This
+//!    saves every backend from writing a `SocketAddr::V6(_) =>
+//!    Unsupported` arm, and documents the crate's actual reach at this
+//!    layer. (The protocol layer parses IPv6 SD option endpoints too;
+//!    only the transport bind / send is IPv4-today.)
+//! 3. **No object safety.** Because `impl Future` is used in method return
+//!    positions, the traits cannot be made into trait objects
+//!    (`Box<dyn TransportSocket>` will not compile). This is intentional:
+//!    there is exactly one transport implementation per build, selected at
+//!    compile time, and monomorphization eliminates any dispatch overhead.
+//!    Consumers carry a generic `<T: TransportSocket>`.
+//!
+//! # `Send` and multithreaded executors
+//!
+//! Neither [`TransportSocket`] nor [`Timer`] method signatures require
+//! their returned futures to be `Send`. This is on purpose: single-threaded
+//! executors (embassy, smol's `LocalSet`, and any bare-metal task loop)
+//! benefit from the relaxation and can hold `!Send` state across yield
+//! points.
+//!
+//! Implementations targeting multithreaded executors such as `tokio::spawn`
+//! are expected to produce `Send + 'static` futures in practice. Consumers
+//! that require `Send` should enforce it through how they use the
+//! transport, not by naming the hidden future type returned by the trait
+//! methods — with RPITIT that type is anonymous and cannot be named, and
+//! there is no `TransportSocketSendFut`-style associated-type escape
+//! hatch here. Instead, wrap the call in an `async move` block and
+//! require `T: Send + 'static` on the captured state:
+//!
+//! ```ignore
+//! fn spawn_loop<T>(sock: T)
+//! where
+//!     T: TransportSocket + Send + 'static,
+//! {
+//!     tokio::spawn(async move {
+//!         let mut sock = sock;
+//!         /* use sock here */
+//!     });
+//! }
+//! ```
+//!
+//! A tokio-backed implementation where the underlying `UdpSocket` is
+//! already `Send + Sync` will produce `Send` futures automatically via
+//! `async` block capture inference, so the pattern above works without
+//! any extra trait-level future bound. Implementations that hold
+//! `!Send` state internally simply won't satisfy the `T: Send` bound
+//! — the compiler catches the mismatch at the `tokio::spawn` call
+//! site rather than inside the trait definition.
+//!
+//! # Status
+//!
+//! A default `std + tokio` implementation
+//! (`crate::tokio_transport::TokioTransport`,
+//! `crate::tokio_transport::TokioSocket`, `crate::tokio_transport::TokioTimer`)
+//! ships under the `client` and `server` features and is re-exported at the
+//! crate root. The paths are rendered as code literals rather than
+//! intra-doc links because the `tokio_transport` module is feature-gated,
+//! and links would otherwise break default-feature rustdoc builds. Other
+//! backends (for example `smoltcp::UdpSocket` + `embassy-time` on embedded)
+//! are the consumer's responsibility — the traits here are the integration
+//! point.
+//!
+//! # Minimal adapter sketch
+//!
+//! ```
+//! # #[cfg(feature = "client-tokio")]
+//! # fn wrapper() {
+//! use core::future::Future;
+//! use core::net::{Ipv4Addr, SocketAddrV4};
+//! use core::time::Duration;
+//! use futures::future::BoxFuture;
+//! use simple_someip::transport::{
+//!     IoErrorKind, ReceivedDatagram, SocketOptions, Timer, TransportError,
+//!     TransportFactory, TransportSocket,
+//! };
+//!
+//! struct TokioTransport;
+//!
+//! struct TokioSocket {
+//!     inner: tokio::net::UdpSocket,
+//! }
+//!
+//! impl TransportFactory for TokioTransport {
+//!     type Socket = TokioSocket;
+//!     fn bind(
+//!         &self,
+//!         addr: SocketAddrV4,
+//!         _options: &SocketOptions,
+//!     ) -> impl Future<Output = Result<Self::Socket, TransportError>> + Send {
+//!         async move {
+//!             let inner = tokio::net::UdpSocket::bind(addr)
+//!                 .await
+//!                 .map_err(|_| TransportError::Io(IoErrorKind::Other))?;
+//!             Ok(TokioSocket { inner })
+//!         }
+//!     }
+//! }
+//!
+//! impl TransportSocket for TokioSocket {
+//!     // `BoxFuture` keeps this sketch short. The real `TokioSocket`
+//!     // shipped under the `client` / `server` features uses named
+//!     // future structs that wrap `poll_send_to` / `poll_recv_from`
+//!     // for zero-allocation per datagram — see `tokio_transport.rs`.
+//!     type SendFuture<'a> = BoxFuture<'a, Result<(), TransportError>>;
+//!     type RecvFuture<'a> = BoxFuture<'a, Result<ReceivedDatagram, TransportError>>;
+//!
+//!     fn send_to<'a>(
+//!         &'a self,
+//!         buf: &'a [u8],
+//!         target: SocketAddrV4,
+//!     ) -> Self::SendFuture<'a> {
+//!         Box::pin(async move {
+//!             self.inner
+//!                 .send_to(buf, target)
+//!                 .await
+//!                 .map(|_| ())
+//!                 .map_err(|_| TransportError::Io(IoErrorKind::Other))
+//!         })
+//!     }
+//!     fn recv_from<'a>(
+//!         &'a self,
+//!         buf: &'a mut [u8],
+//!     ) -> Self::RecvFuture<'a> {
+//!         Box::pin(async move {
+//!             let (n, src) = self
+//!                 .inner
+//!                 .recv_from(buf)
+//!                 .await
+//!                 .map_err(|_| TransportError::Io(IoErrorKind::Other))?;
+//!             let source = match src {
+//!                 std::net::SocketAddr::V4(v4) => v4,
+//!                 std::net::SocketAddr::V6(_) => return Err(TransportError::Unsupported),
+//!             };
+//!             Ok(ReceivedDatagram {
+//!                 bytes_received: n,
+//!                 source,
+//!                 truncated: false,
+//!             })
+//!         })
+//!     }
+//!     fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+//!         match self.inner.local_addr() {
+//!             Ok(std::net::SocketAddr::V4(v4)) => Ok(v4),
+//!             Ok(_) => Err(TransportError::Unsupported),
+//!             Err(_) => Err(TransportError::Io(IoErrorKind::Other)),
+//!         }
+//!     }
+//!     fn join_multicast_v4(
+//!         &self,
+//!         group: Ipv4Addr,
+//!         iface: Ipv4Addr,
+//!     ) -> Result<(), TransportError> {
+//!         self.inner
+//!             .join_multicast_v4(group, iface)
+//!             .map_err(|_| TransportError::Io(IoErrorKind::Other))
+//!     }
+//!     fn leave_multicast_v4(
+//!         &self,
+//!         group: Ipv4Addr,
+//!         iface: Ipv4Addr,
+//!     ) -> Result<(), TransportError> {
+//!         self.inner
+//!             .leave_multicast_v4(group, iface)
+//!             .map_err(|_| TransportError::Io(IoErrorKind::Other))
+//!     }
+//! }
+//!
+//! struct TokioTimer;
+//! impl Timer for TokioTimer {
+//!     fn sleep(&self, duration: Duration) -> impl Future<Output = ()> + Send {
+//!         tokio::time::sleep(duration)
+//!     }
+//! }
+//! # }
+//! ```
+//!
+//! # Lifecycle
+//!
+//! Sockets are dropped to close. There is no explicit `shutdown` method —
+//! implementations should release kernel / stack resources in `Drop`.
+//! Implementations that need graceful shutdown (flushing an outgoing queue,
+//! for example) should perform it in `Drop` or expose an inherent method
+//! outside this trait.
+
+use core::future::Future;
+use core::net::{Ipv4Addr, SocketAddrV4};
+use core::time::Duration;
+
+use crate::e2e::Error as E2EError;
+use crate::e2e::{E2ECheckStatus, E2EKey, E2EProfile};
+
+/// Portable I/O error kinds surfaced by transport implementations.
+///
+/// This is a deliberately small vocabulary — anything that does not fit
+/// maps to [`IoErrorKind::Other`]. The enum is `#[non_exhaustive]` so new
+/// kinds can be added without a breaking change. Kept local to this crate
+/// (rather than re-exporting `embedded_io::ErrorKind`) so our public API
+/// does not move when `embedded_io` bumps major versions.
+#[derive(Debug, Clone, Copy, PartialEq, Eq, thiserror::Error)]
+#[non_exhaustive]
+pub enum IoErrorKind {
+    /// The operation timed out.
+    #[error("operation timed out")]
+    TimedOut,
+    /// The operation was interrupted and can be retried.
+    #[error("operation interrupted")]
+    Interrupted,
+    /// The caller lacks permission for the operation.
+    #[error("permission denied")]
+    PermissionDenied,
+    /// A remote peer actively refused the connection / destination was
+    /// unreachable.
+    #[error("connection refused")]
+    ConnectionRefused,
+    /// The network layer rejected the operation (routing, MTU, etc.).
+    #[error("network unreachable")]
+    NetworkUnreachable,
+    /// A non-blocking call would have blocked. Transient — caller
+    /// should retry or wait for readiness rather than treating as
+    /// fatal.
+    #[error("would block")]
+    WouldBlock,
+    /// Any error that does not fit a more specific variant.
+    #[error("i/o error")]
+    Other,
+}
+
+impl IoErrorKind {
+    /// Returns `true` if a recv-loop error of this kind is a transient
+    /// condition that should not count toward a "kill the loop after N
+    /// consecutive errors" cap. Includes:
+    /// - [`Self::ConnectionRefused`] — a peer's ICMP port-unreachable
+    ///   reply is normal noise on a SOME/IP host that probes services
+    ///   that are not yet available;
+    /// - [`Self::NetworkUnreachable`] — a routing blip during
+    ///   interface migration is recoverable;
+    /// - [`Self::WouldBlock`] — by definition, retry-on-readiness;
+    /// - [`Self::Interrupted`] — a signal interrupted the syscall;
+    /// - [`Self::TimedOut`] — caller-driven timeout, not a socket
+    ///   failure.
+    ///
+    /// All other kinds (including [`Self::Other`]) are treated as
+    /// potentially-fatal and DO count toward the cap.
+    #[must_use]
+    pub fn is_transient_recv(self) -> bool {
+        matches!(
+            self,
+            Self::ConnectionRefused
+                | Self::NetworkUnreachable
+                | Self::WouldBlock
+                | Self::Interrupted
+                | Self::TimedOut,
+        )
+    }
+}
+
+/// Errors returned by [`TransportSocket`] and [`TransportFactory`]
+/// operations.
+///
+/// `#[non_exhaustive]` so that backend-specific conditions can be added in
+/// future releases without a breaking change. Implementations map their
+/// native error types into one of these variants; anything that does not
+/// fit a specific variant should use [`TransportError::Io`] with an
+/// appropriate [`IoErrorKind`].
+#[derive(Debug, Clone, Copy, PartialEq, Eq, thiserror::Error)]
+#[non_exhaustive]
+pub enum TransportError {
+    /// Bind failed because the address or port is already in use.
+    #[error("address in use")]
+    AddressInUse,
+    /// The operation is not supported by this transport (for example,
+    /// multicast on a backend that has none, or an IPv6 address on an
+    /// IPv4-only stack).
+    #[error("unsupported transport operation")]
+    Unsupported,
+    /// A generic I/O error, classified by a portable [`IoErrorKind`].
+    #[error("transport i/o: {0}")]
+    Io(IoErrorKind),
+}
+
+/// Socket-level options applied by [`TransportFactory::bind`].
+///
+/// The fields mirror the BSD / `socket2` options that `simple-someip`
+/// needs for its Service Discovery socket layout. A default-constructed
+/// [`SocketOptions`] requests a plain unicast socket.
+///
+/// `#[non_exhaustive]` so additional knobs (TTL, buffer sizes) can be
+/// introduced later without breaking downstream construction.
+#[derive(Debug, Clone, Copy)]
+#[non_exhaustive]
+pub struct SocketOptions {
+    /// Enable `SO_REUSEADDR` (required for the SD port 30490 on hosts
+    /// that run more than one SOME/IP endpoint on the same interface).
+    pub reuse_address: bool,
+    /// Enable `SO_REUSEPORT` where supported (Linux, BSD). Ignored on
+    /// platforms that do not expose it.
+    pub reuse_port: bool,
+    /// Outbound multicast interface (`IP_MULTICAST_IF`). `None` lets the
+    /// backend choose.
+    pub multicast_if_v4: Option<Ipv4Addr>,
+    /// Loop multicast traffic back to sockets on the same host
+    /// (`IP_MULTICAST_LOOP`). Tri-state:
+    /// - `None` — the OS default applies (Linux: enabled by default).
+    ///   Use this when you have no opinion on loopback.
+    /// - `Some(true)` — explicitly enable. Required when running a
+    ///   SOME/IP server and client on the same machine for testing.
+    /// - `Some(false)` — explicitly disable.
+    ///
+    /// Backends call `setsockopt(IP_MULTICAST_LOOP)` only for
+    /// `Some(_)`. A previous bool-typed field caused
+    /// `multicast_if_v4: Some(_), multicast_loop_v4: false` to silently
+    /// turn loopback OFF on hosts where the OS default was ON, even
+    /// when the caller had no opinion on loopback.
+    pub multicast_loop_v4: Option<bool>,
+}
+
+impl SocketOptions {
+    /// A plain unicast socket with no multicast configuration.
+    #[must_use]
+    pub const fn new() -> Self {
+        Self {
+            reuse_address: false,
+            reuse_port: false,
+            multicast_if_v4: None,
+            multicast_loop_v4: None,
+        }
+    }
+}
+
+impl Default for SocketOptions {
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+/// The result of a successful [`TransportSocket::recv_from`].
+///
+/// `truncated` is set if the backend delivered only a prefix of the
+/// incoming datagram because it did not fit in the caller's buffer. If
+/// callers use a buffer sized to [`crate::UDP_BUFFER_SIZE`], truncation is
+/// generally not expected on backends whose delivered datagrams are
+/// bounded by that configured application-level cap. Backends that may
+/// deliver larger datagrams should surface this explicitly instead of
+/// silently dropping the fact that data was discarded.
+///
+/// Note: the default Tokio backend currently always reports
+/// `truncated: false` because `tokio::net::UdpSocket::recv_from` does not
+/// expose `MSG_TRUNC` (or equivalent). Reliable truncation detection
+/// requires a backend that does — e.g. a `recvmsg`-based backend, or a
+/// `no_std` stack like smoltcp / embassy-net that surfaces the original
+/// datagram length.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub struct ReceivedDatagram {
+    /// Number of bytes written to the caller's buffer.
+    pub bytes_received: usize,
+    /// Source address of the datagram.
+    pub source: SocketAddrV4,
+    /// `true` if the incoming datagram was larger than the caller's
+    /// buffer and the tail was discarded. See the type-level docs for
+    /// the default Tokio backend's caveat.
+    pub truncated: bool,
+}
+
+/// A bound, configured UDP socket usable for SOME/IP message exchange.
+///
+/// Implementations are obtained via [`TransportFactory::bind`]. The
+/// send/receive methods return associated future types so callers can
+/// require `Send` bounds when spawning socket loops on multithreaded
+/// executors. The smaller socket-level queries ([`Self::local_addr`],
+/// [`Self::join_multicast_v4`], [`Self::leave_multicast_v4`]) are
+/// synchronous because they are typically O(1) lookups on a backend's
+/// internal handle and do not benefit from yielding to the executor.
+///
+/// Multicast group membership is joined *after* bind via
+/// [`TransportSocket::join_multicast_v4`]; the bind-time
+/// [`SocketOptions::multicast_if_v4`] only selects the *outbound*
+/// multicast interface.
+///
+/// # Associated future types
+///
+/// The [`SendFuture`](Self::SendFuture) and [`RecvFuture`](Self::RecvFuture)
+/// associated types let consumers express `Send` bounds on the futures
+/// returned by `send_to` and `recv_from` without requiring nightly-only
+/// Return-Type Notation (RTN, RFC 3654). This enables:
+///
+/// ```ignore
+/// fn spawn_loop<T: TransportSocket>(sock: T, spawner: impl Spawner)
+/// where
+///     T: Send + Sync + 'static,
+///     for<'a> T::SendFuture<'a>: Send,
+///     for<'a> T::RecvFuture<'a>: Send,
+/// {
+///     spawner.spawn(async move { /* use sock */ });
+/// }
+/// ```
+///
+/// `TokioSocket` implements these with `Send` futures; bare-metal
+/// implementations must do the same if they want to be used with
+/// multithreaded spawners.
+pub trait TransportSocket {
+    /// Future returned by [`Self::send_to`].
+    type SendFuture<'a>: Future<Output = Result<(), TransportError>>
+    where
+        Self: 'a;
+
+    /// Future returned by [`Self::recv_from`].
+    type RecvFuture<'a>: Future<Output = Result<ReceivedDatagram, TransportError>>
+    where
+        Self: 'a;
+
+    /// Send `buf` to `target`. UDP is atomic — either the whole datagram
+    /// is transmitted or an error is returned; there is no short-write
+    /// case, which is why this method returns `()` on success rather than
+    /// a byte count.
+    ///
+    /// Takes `&self` so a single-task socket loop can hold a pending
+    /// [`Self::recv_from`] future and still call `send_to` in another
+    /// `select!` branch. Backends that need to mutate their socket
+    /// handle on send — e.g. direct smoltcp — must provide interior
+    /// mutability (typically `RefCell<_>` on single-threaded `no_std`, or
+    /// `critical_section::Mutex<RefCell<_>>` on multi-core HAL). The
+    /// `tokio::net::UdpSocket` and `embassy_net::udp::UdpSocket` APIs
+    /// are already `&self`, so adapters over those backends need no
+    /// extra wrapping.
+    ///
+    /// # Errors
+    ///
+    /// Returns:
+    /// - [`TransportError::Io`] with the appropriate [`IoErrorKind`] for
+    ///   transport-level send failures (e.g. the peer is unreachable,
+    ///   the interface is down, the datagram exceeds the link MTU, or a
+    ///   platform-level send error).
+    /// - [`TransportError::Unsupported`] if `target` is not representable
+    ///   on a backend that only speaks a subset of IPv4 (rare; most
+    ///   backends surface addressing issues as [`TransportError::Io`]).
+    fn send_to<'a>(&'a self, buf: &'a [u8], target: SocketAddrV4) -> Self::SendFuture<'a>;
+
+    /// Receive the next datagram into `buf`, returning a
+    /// [`ReceivedDatagram`] carrying byte count, source, and a truncation
+    /// flag.
+    ///
+    /// Takes `&self` for the same reason as [`Self::send_to`]: the
+    /// pending receive future must not hold an exclusive borrow of the
+    /// socket, or the concurrent send branch of a `select!` cannot
+    /// compile.
+    ///
+    /// # Errors
+    ///
+    /// Returns:
+    /// - [`TransportError::Io`] with the appropriate [`IoErrorKind`] for
+    ///   transport-level receive failures (e.g. the socket was closed,
+    ///   the interface went down, or a platform-level recv error).
+    /// - [`TransportError::Unsupported`] if the backend surfaces a
+    ///   non-IPv4 source address that cannot be represented as
+    ///   [`SocketAddrV4`].
+    ///
+    /// A datagram whose payload exceeds `buf` is **not** an error; it is
+    /// returned with [`ReceivedDatagram::truncated`] set to `true`. The
+    /// caller decides whether to treat truncation as fatal.
+    fn recv_from<'a>(&'a self, buf: &'a mut [u8]) -> Self::RecvFuture<'a>;
+
+    /// Return the local address this socket is bound to. Useful for
+    /// discovering the ephemeral port chosen by `bind(port: 0, ..)`.
+    ///
+    /// # Errors
+    ///
+    /// Returns [`TransportError`] if the backend cannot report the address.
+    fn local_addr(&self) -> Result<SocketAddrV4, TransportError>;
+
+    /// Join IPv4 multicast group `group` on interface `iface`. Required
+    /// before the socket will receive multicast traffic for that group.
+    ///
+    /// Called once per group per socket; joining twice is allowed and a
+    /// no-op on most backends.
+    ///
+    /// # Errors
+    ///
+    /// Returns [`TransportError::Unsupported`] if the backend has no
+    /// multicast support; otherwise [`TransportError::Io`] with an
+    /// appropriate kind.
+    fn join_multicast_v4(&self, group: Ipv4Addr, iface: Ipv4Addr) -> Result<(), TransportError>;
+
+    /// Leave IPv4 multicast group `group` on interface `iface`. Symmetric
+    /// to [`Self::join_multicast_v4`]. Most backends implicitly leave on
+    /// drop, so this is optional for simple lifetimes but required for
+    /// long-lived sockets that rotate group membership.
+    ///
+    /// # Errors
+    ///
+    /// Returns [`TransportError::Unsupported`] if the backend has no
+    /// multicast support; otherwise [`TransportError::Io`] with an
+    /// appropriate kind.
+    fn leave_multicast_v4(&self, group: Ipv4Addr, iface: Ipv4Addr) -> Result<(), TransportError>;
+
+    /// Upper bound, in bytes, on datagrams this socket will successfully
+    /// accept in `send_to` or return via `recv_from`. The default returns
+    /// [`crate::UDP_BUFFER_SIZE`], the crate's default application-level
+    /// UDP payload cap (currently 1500 bytes — note that this is *not*
+    /// MTU-safe; see [`crate::UDP_BUFFER_SIZE`]'s own docs for the
+    /// IPv4/IPv6 header overhead).
+    ///
+    /// Backends with a smaller effective MTU (for example, some
+    /// resource-constrained embedded stacks) should override this to
+    /// advertise the real limit so callers can size buffers accordingly.
+    #[must_use]
+    fn max_datagram_size(&self) -> usize {
+        crate::UDP_BUFFER_SIZE
+    }
+}
+
+/// Constructs [`TransportSocket`] instances from a bind address and
+/// [`SocketOptions`]. The factory carries whatever state the backend needs
+/// (for example, an lwIP network-interface handle) so that `bind` itself
+/// is a pure data operation.
+///
+/// On `std + tokio`, a unit-struct `TokioTransport;` factory is all that's
+/// needed — the runtime is implicit.
+pub trait TransportFactory {
+    /// The socket type produced by this factory.
+    type Socket: TransportSocket;
+
+    /// Future returned by [`Self::bind`].
+    ///
+    /// As an associated GAT (matching [`TransportSocket::SendFuture`] /
+    /// [`TransportSocket::RecvFuture`]), consumers can express a `Send`
+    /// bound at use sites that need it without forcing every backend
+    /// to produce a `Send` bind future. Multi-threaded callers add
+    /// `where for<'a> F::BindFuture<'a>: Send`; single-threaded callers
+    /// (`Client::new_with_deps_local`) drop that bound and accept a
+    /// `!Send` bind future from a backend like embassy-net.
+    type BindFuture<'a>: Future<Output = Result<Self::Socket, TransportError>>
+    where
+        Self: 'a;
+
+    /// Bind a new socket to `addr` with the requested `options`.
+    ///
+    /// `addr.port() == 0` requests an ephemeral port; call
+    /// [`TransportSocket::local_addr`] afterwards to discover what was
+    /// assigned.
+    ///
+    /// # Errors
+    ///
+    /// Returns [`TransportError::AddressInUse`] if the requested address
+    /// and port pair is already bound (and `reuse_*` was not enabled).
+    /// Other backend-level failures surface as [`TransportError::Io`].
+    fn bind<'a>(&'a self, addr: SocketAddrV4, options: &'a SocketOptions) -> Self::BindFuture<'a>;
+}
+
+/// Executor-agnostic sleep primitive.
+///
+/// `simple-someip` needs timed waits in two places: the Service Discovery
+/// announcement tick (1 s) and the client event-loop idle timeout
+/// (125 ms). Consumers provide a `Timer` at startup; on `std + tokio` this
+/// is a one-line wrapper around `tokio::time::sleep`, on embedded it is a
+/// one-line wrapper around `embassy_time::Timer::after` or similar.
+pub trait Timer {
+    /// Future returned by [`Self::sleep`].
+    ///
+    /// As an associated GAT, consumers can require `Send` at use sites
+    /// (`where for<'a> Tm::SleepFuture<'a>: Send`) without forcing every
+    /// backend's sleep future to be `Send`. Multi-threaded callers
+    /// (`Server::announcement_loop`, the tokio Client) add the bound;
+    /// single-threaded callers do not, accepting a `!Send` future from
+    /// a backend like `embassy_time`.
+    type SleepFuture<'a>: Future<Output = ()>
+    where
+        Self: 'a;
+
+    /// Wait for at least `duration` before resolving. Implementations MAY
+    /// overshoot but MUST NOT undershoot.
+    fn sleep(&self, duration: Duration) -> Self::SleepFuture<'_>;
+}
+
+/// Executor-agnostic task-spawning primitive.
+///
+/// `simple-someip`'s per-socket I/O loops need to run concurrently with
+/// the client's main event loop — otherwise `SocketManager::send`'s
+/// internal oneshot wait deadlocks (the send future parks the main
+/// loop, which is the only thing that would drive the socket loop to
+/// produce its response). The `Spawner` trait lets std+tokio callers
+/// pass a one-line `TokioSpawner` and bare-metal callers wrap their own
+/// executor's task-spawning primitive.
+///
+/// # Design rationale
+///
+/// The transport-trait design deliberately avoided wrapping spawn to
+/// prevent "reinventing embassy" and trait-object dispatch in the hot
+/// path. However, without a spawn abstraction, `Inner::bind_*` has to
+/// call `tokio::spawn` directly — making the whole crate tokio-only.
+/// The revised rule: spawn DOES need a trait, but we avoid the
+/// concerns by (1) keeping the trait generic (monomorphized, no
+/// `dyn Spawner`) and (2) scoping it narrowly — just spawn, not
+/// select/sleep which have other solutions.
+///
+/// # Usage
+///
+/// On `std + tokio`, use `crate::tokio_transport::TokioSpawner`
+/// (available when the `client` or `server` feature is enabled) —
+/// a zero-size unit struct whose `spawn` is a thin wrapper around
+/// `tokio::spawn`. The path is rendered as a code literal rather
+/// than an intra-doc link because the target module is feature-gated
+/// and would break default-feature rustdoc builds. On embedded:
+///
+/// ```ignore
+/// struct EmbassySpawner(embassy_executor::Spawner);
+/// impl simple_someip::Spawner for EmbassySpawner {
+///     fn spawn(&self, fut: impl core::future::Future<Output = ()> + Send + 'static) {
+///         // embassy's Spawner has its own task-registration model;
+///         // the adapter layer depends on how the user defined their tasks
+///         todo!("call self.0.spawn(...)");
+///     }
+/// }
+/// ```
+/// Local-executor counterpart to [`Spawner`].
+///
+/// Where [`Spawner::spawn`] requires its future to be `Send + 'static`
+/// (matching multi-threaded executors like tokio), `LocalSpawner::spawn_local`
+/// drops the `Send` bound and is the trait that single-threaded
+/// executors — embassy with `task-arena = 0`, tokio's `LocalSet`, async-std
+/// `LocalExecutor`, etc. — implement directly.
+///
+/// The two traits are independent: an executor MAY implement both
+/// (`current_thread` tokio with `LocalSet`), only [`Spawner`]
+/// (multi-threaded tokio default), or only [`LocalSpawner`]
+/// (single-task embassy).
+///
+/// Use `crate::client::Client::new_with_deps_local` (under `client`) to
+/// construct a Client whose run-loop and per-socket loops are submitted
+/// through a
+/// `LocalSpawner` (and whose `TransportFactory::Socket` is therefore
+/// allowed to be `!Send`).
+pub trait LocalSpawner {
+    /// Submit `future` to the local executor. Must not block; must
+    /// arrange for the future to be polled to completion on some
+    /// single-threaded task.
+    ///
+    /// The future is **not** required to be `Send` — it may capture
+    /// `Rc`, `RefCell`, raw `*mut` pointers, etc.
+    fn spawn_local(&self, future: impl Future<Output = ()> + 'static);
+}
+
+pub trait Spawner {
+    /// Submit `future` to the executor. Must not block; must arrange
+    /// for the future to be polled to completion on some task.
+    ///
+    /// # Correctness requirement
+    ///
+    /// Implementations MUST poll the submitted future. Dropping it
+    /// without polling — or holding it in a queue that never drains —
+    /// will deadlock `crate::client::Client` (available when the
+    /// `client` feature is enabled): `SocketManager::send`
+    /// `await`s an internal mpsc→oneshot round-trip whose only driver
+    /// is the per-socket loop future submitted here. No poll, no
+    /// progress, no oneshot resolution; the caller's `send` hangs
+    /// forever.
+    ///
+    /// The mock spawners in `tests/bare_metal_*.rs` demonstrate
+    /// correct integration patterns; callers that simply drop the
+    /// future will deadlock on any operation that requires a socket
+    /// round-trip.
+    ///
+    /// # Fire-and-forget by design
+    ///
+    /// `spawn` returns `()`, not a join-handle. The rest of the crate
+    /// observes `tokio::JoinHandle`s wherever it spawns work directly
+    /// (commit `d92c5a3`); this trait is the deliberate exception. The
+    /// per-socket loops have no observable result — they run forever and
+    /// only exit when their owning `SocketManager` drops its channel
+    /// ends — so a join-handle would just be storage with no callers.
+    /// A future revision MAY add an associated `Handle` type if a
+    /// concrete shutdown / cancellation use case appears; today there is
+    /// none.
+    ///
+    /// # Bound rationale
+    ///
+    /// The `Send + 'static` bound matches multi-threaded executors like
+    /// tokio, async-std, and smol — the captured per-socket loop is
+    /// already `Send + 'static` because its underlying `TokioSocket` is.
+    /// Embassy and other `no_alloc` / single-core executors typically need
+    /// additional adapter scaffolding (a typed `SpawnToken`, a static
+    /// task arena, hardware-specific waker plumbing) to satisfy
+    /// `Send + 'static`; the example at the top of this docstring has a
+    /// `todo!()` precisely because the adapter is not one-line. A future
+    /// release MAY add a `spawn_local`-style variant gated on a cargo
+    /// feature for those targets.
+    fn spawn(&self, future: impl Future<Output = ()> + Send + 'static);
+}
+
+/// Shared handle to the runtime E2E configuration registry.
+///
+/// Abstracts over `Arc<Mutex<E2ERegistry>>` on `std` and over
+/// critical-section-backed primitives (e.g. `embassy_sync::blocking_mutex`)
+/// on bare metal. All methods take `&self` and provide interior-mutable
+/// access. Implementations are required to be `Clone` so the handle can be
+/// cheaply shared between the `Client` (or `Server`) handle and its inner
+/// event loop.
+pub trait E2ERegistryHandle: Clone + Send + Sync + 'static {
+    /// Register an E2E profile for the given key, replacing any prior entry.
+    fn register(&self, key: E2EKey, profile: E2EProfile);
+
+    /// Remove the E2E configuration for the given key. No-op if absent.
+    fn unregister(&self, key: &E2EKey);
+
+    /// Returns `true` if a profile is registered for `key`.
+    fn contains_key(&self, key: &E2EKey) -> bool;
+
+    /// Run E2E protect for `key` if configured, writing to `output`.
+    ///
+    /// Returns `None` if no profile is registered for `key`.
+    /// Returns `Some(Err(_))` if protection fails (e.g. buffer too small).
+    /// Returns `Some(Ok(len))` on success; `len` is the number of bytes
+    /// written to `output`.
+    fn protect(
+        &self,
+        key: E2EKey,
+        payload: &[u8],
+        upper_header: [u8; 8],
+        output: &mut [u8],
+    ) -> Option<Result<usize, E2EError>>;
+
+    /// Run E2E check for `key` if configured.
+    ///
+    /// Returns `None` if no profile is registered for `key`. Otherwise
+    /// returns the check status and the effective payload slice — the
+    /// E2E header is stripped on success; the original bytes are returned
+    /// on check failure so the caller can decide how to handle it.
+    ///
+    /// The returned slice borrows from `payload`, not from this handle.
+    fn check<'a>(
+        &self,
+        key: E2EKey,
+        payload: &'a [u8],
+        upper_header: [u8; 8],
+    ) -> Option<(E2ECheckStatus, &'a [u8])>;
+}
+
+/// Shared handle to the local interface address.
+///
+/// Abstracts over `Arc<RwLock<Ipv4Addr>>` on `std`. All clones of a
+/// `Client` share the same handle, so writes from one clone (e.g.
+/// `Client::set_interface`) are visible to all others.
+///
+/// On bare metal, where `Client` is not `Clone`, a trivial implementation
+/// wrapping a `core::cell::Cell<Ipv4Addr>` suffices.
+pub trait InterfaceHandle: Clone + Send + Sync + 'static {
+    /// Returns the current interface address.
+    fn get(&self) -> Ipv4Addr;
+
+    /// Updates the stored interface address.
+    fn set(&self, addr: Ipv4Addr);
+}
+
+/// Default `std`-flavoured impls of [`E2ERegistryHandle`] and
+/// [`InterfaceHandle`] backed by `std::sync::{Arc, Mutex, RwLock}`. Pure
+/// std — no tokio dependency — so they live in the executor-agnostic
+/// transport module rather than the tokio backend.
+#[cfg(feature = "std")]
+mod std_handle_impls {
+    use super::{E2ERegistryHandle, InterfaceHandle};
+    use crate::e2e::Error as E2EError;
+    use crate::e2e::{E2ECheckStatus, E2EKey, E2EProfile, E2ERegistry};
+    use core::net::Ipv4Addr;
+    use std::sync::{Arc, Mutex, RwLock};
+
+    impl E2ERegistryHandle for Arc<Mutex<E2ERegistry>> {
+        fn register(&self, key: E2EKey, profile: E2EProfile) {
+            self.lock()
+                .expect("e2e registry lock poisoned")
+                .register(key, profile);
+        }
+
+        fn unregister(&self, key: &E2EKey) {
+            self.lock()
+                .expect("e2e registry lock poisoned")
+                .unregister(key);
+        }
+
+        fn contains_key(&self, key: &E2EKey) -> bool {
+            self.lock()
+                .expect("e2e registry lock poisoned")
+                .contains_key(key)
+        }
+
+        fn protect(
+            &self,
+            key: E2EKey,
+            payload: &[u8],
+            upper_header: [u8; 8],
+            output: &mut [u8],
+        ) -> Option<Result<usize, E2EError>> {
+            self.lock().expect("e2e registry lock poisoned").protect(
+                key,
+                payload,
+                upper_header,
+                output,
+            )
+        }
+
+        fn check<'a>(
+            &self,
+            key: E2EKey,
+            payload: &'a [u8],
+            upper_header: [u8; 8],
+        ) -> Option<(E2ECheckStatus, &'a [u8])> {
+            self.lock()
+                .expect("e2e registry lock poisoned")
+                .check(key, payload, upper_header)
+        }
+    }
+
+    impl InterfaceHandle for Arc<RwLock<Ipv4Addr>> {
+        fn get(&self) -> Ipv4Addr {
+            *self.read().expect("interface lock poisoned")
+        }
+
+        fn set(&self, addr: Ipv4Addr) {
+            *self.write().expect("interface lock poisoned") = addr;
+        }
+    }
+}
+
+/// Bare-metal no-alloc impls of [`E2ERegistryHandle`] and [`InterfaceHandle`].
+///
+/// These types satisfy `Clone + Send + Sync + 'static` without any heap
+/// allocation. The backing storage lives in a caller-owned `static`; the
+/// handles are thin `&'static` pointers that are trivially `Copy`.
+///
+/// # Production pattern
+///
+/// ```ignore
+/// use core::cell::RefCell;
+/// use core::sync::atomic::{AtomicU32, Ordering};
+/// use embassy_sync::blocking_mutex::Mutex;
+/// use embassy_sync::blocking_mutex::raw::CriticalSectionRawMutex;
+/// use simple_someip::e2e::E2ERegistry;
+/// use simple_someip::transport::{StaticE2EHandle, AtomicInterfaceHandle};
+///
+/// // Initialize once in main() before spawning tasks.
+/// fn init() -> (StaticE2EHandle, AtomicInterfaceHandle) {
+///     static IFACE_ADDR: AtomicU32 = AtomicU32::new(0);
+///     // E2ERegistry::new() is not const so the storage is heap-placed once.
+///     let registry_storage: &'static _ = Box::leak(Box::new(
+///         Mutex::<CriticalSectionRawMutex, RefCell<E2ERegistry>>::new(
+///             RefCell::new(E2ERegistry::new()),
+///         ),
+///     ));
+///     (StaticE2EHandle::new(registry_storage), AtomicInterfaceHandle::new(&IFACE_ADDR))
+/// }
+/// ```
+///
+/// # No-allocator targets
+///
+/// The example above uses `Box::leak` because [`crate::e2e::E2ERegistry::new()`] is not
+/// currently `const`. On a target with no allocator, swap that for a
+/// `static`-cell pattern (e.g. `static_cell::StaticCell::init`) once the
+/// registry constructor becomes `const`-friendly. The handle layer itself
+/// never allocates — only the one-time storage materialization does.
+#[cfg(feature = "bare_metal")]
+pub mod bare_metal_handle_impls {
+    use super::InterfaceHandle;
+    use core::net::Ipv4Addr;
+    use core::sync::atomic::{AtomicU32, Ordering};
+
+    // `StaticE2EHandle` wraps `E2ERegistry`, which currently requires
+    // `feature = "std"` because its backing storage is `HashMap`. Ported
+    // separately below so the rest of this module — in particular
+    // `AtomicInterfaceHandle` — is available in pure `no_std` bare-metal
+    // builds.
+
+    /// No-alloc [`InterfaceHandle`] backed by a `&'static AtomicU32`.
+    ///
+    /// IPv4 addresses are encoded as big-endian `u32` (`Ipv4Addr::into::<u32>`).
+    /// All clones are the same thin pointer. Declare the backing storage in a
+    /// `static`:
+    ///
+    /// ```ignore
+    /// static IFACE_ADDR: AtomicU32 = AtomicU32::new(0);
+    /// let handle = AtomicInterfaceHandle::new(&IFACE_ADDR);
+    /// ```
+    ///
+    /// # Memory ordering
+    ///
+    /// `set` uses [`Ordering::Release`] and `get` uses
+    /// [`Ordering::Acquire`] so a reader on a weakly-ordered core sees
+    /// updates promptly. Cheap on x86-TSO (free) and inexpensive on
+    /// aarch64 (one `dmb ish`).
+    #[derive(Clone, Copy)]
+    pub struct AtomicInterfaceHandle(&'static AtomicU32);
+
+    impl AtomicInterfaceHandle {
+        /// Wraps a static reference to the backing atomic.
+        pub const fn new(addr: &'static AtomicU32) -> Self {
+            Self(addr)
+        }
+    }
+
+    // Send + Sync are derived automatically: `&'static AtomicU32` is
+    // `Send + Sync` because `AtomicU32` is `Sync`.
+
+    impl InterfaceHandle for AtomicInterfaceHandle {
+        fn get(&self) -> Ipv4Addr {
+            // `Acquire` ordering pairs with the `Release` store below
+            // so a reader sees the most recent address promptly even
+            // on weakly-ordered hardware. The cost over `Relaxed` is
+            // a `dmb ish` on aarch64; on x86-TSO it is free.
+            Ipv4Addr::from(self.0.load(Ordering::Acquire))
+        }
+
+        fn set(&self, addr: Ipv4Addr) {
+            self.0.store(u32::from(addr), Ordering::Release);
+        }
+    }
+}
+
+/// `StaticE2EHandle` — no-alloc `E2ERegistryHandle` backed by a
+/// `&'static` critical-section mutex. Requires `feature = "std"` because
+/// the underlying [`crate::e2e::E2ERegistry`] currently uses `HashMap`.
+/// On a pure-`no_std` target the registry must be ported (see crate
+/// roadmap); until then, callers wanting bare-metal interface handles
+/// (the more common need) can use [`AtomicInterfaceHandle`] alone.
+#[cfg(all(feature = "bare_metal", feature = "std"))]
+pub mod bare_metal_e2e_impl {
+    use super::E2ERegistryHandle;
+    use crate::e2e::{E2ECheckStatus, E2EKey, E2EProfile, E2ERegistry, Error as E2EError};
+    use core::cell::RefCell;
+    use embassy_sync::blocking_mutex::Mutex;
+    use embassy_sync::blocking_mutex::raw::CriticalSectionRawMutex;
+
+    /// Convenience type alias for the embassy-sync critical-section mutex
+    /// backing [`StaticE2EHandle`].
+    pub type StaticE2EStorage = Mutex<CriticalSectionRawMutex, RefCell<E2ERegistry>>;
+
+    /// No-alloc [`E2ERegistryHandle`] backed by a `&'static` critical-section
+    /// mutex.
+    ///
+    /// All clones are the same thin pointer. Construct via [`StaticE2EHandle::new`]
+    /// and supply a `&'static StaticE2EStorage` (typically obtained via
+    /// `Box::leak` during system init, since [`E2ERegistry::new`] is not const).
+    #[derive(Clone, Copy)]
+    pub struct StaticE2EHandle(&'static StaticE2EStorage);
+
+    impl StaticE2EHandle {
+        /// Wraps a static reference to the backing mutex.
+        pub const fn new(storage: &'static StaticE2EStorage) -> Self {
+            Self(storage)
+        }
+    }
+
+    impl E2ERegistryHandle for StaticE2EHandle {
+        fn register(&self, key: E2EKey, profile: E2EProfile) {
+            self.0.lock(|cell| cell.borrow_mut().register(key, profile));
+        }
+
+        fn unregister(&self, key: &E2EKey) {
+            self.0.lock(|cell| cell.borrow_mut().unregister(key));
+        }
+
+        fn contains_key(&self, key: &E2EKey) -> bool {
+            self.0.lock(|cell| cell.borrow().contains_key(key))
+        }
+
+        fn protect(
+            &self,
+            key: E2EKey,
+            payload: &[u8],
+            upper_header: [u8; 8],
+            output: &mut [u8],
+        ) -> Option<Result<usize, E2EError>> {
+            self.0.lock(|cell| {
+                cell.borrow_mut()
+                    .protect(key, payload, upper_header, output)
+            })
+        }
+
+        fn check<'a>(
+            &self,
+            key: E2EKey,
+            payload: &'a [u8],
+            upper_header: [u8; 8],
+        ) -> Option<(E2ECheckStatus, &'a [u8])> {
+            self.0
+                .lock(|cell| cell.borrow_mut().check(key, payload, upper_header))
+        }
+    }
+}
+
+#[cfg(feature = "bare_metal")]
+pub use bare_metal_handle_impls::AtomicInterfaceHandle;
+
+#[cfg(all(feature = "bare_metal", feature = "std"))]
+pub use bare_metal_e2e_impl::{StaticE2EHandle, StaticE2EStorage};
+
+// ── Channel-handle abstraction ────────────────────────────────────────────
+//
+// `ChannelFactory` and its associated sender / receiver traits abstract over
+// the channel primitive used by the client. `TokioChannels` (in
+// `tokio_transport`) is the default for `std + tokio` builds;
+// `EmbassySyncChannels` (in `crate::embassy_channels`, gated behind
+// `embassy_channels` feature) is a heap-backed alternative for no-tokio builds;
+// `static_channels` (gated behind `bare_metal`) is the no-alloc alternative.
+
+/// Returned by [`OneshotRecv::recv`] when the sender was dropped before
+/// sending a value.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub struct OneshotCancelled;
+
+impl core::fmt::Display for OneshotCancelled {
+    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
+        f.write_str("oneshot sender dropped before sending a value")
+    }
+}
+
+/// The send half of a oneshot channel. Consuming: a value can be sent exactly
+/// once.
+pub trait OneshotSend<T: Send + 'static>: Send + 'static {
+    /// Send `value` through the channel.
+    ///
+    /// # Errors
+    ///
+    /// Returns `Err(value)` if the receiver was already dropped.
+    fn send(self, value: T) -> Result<(), T>;
+}
+
+/// The receive half of a oneshot channel. Resolves once the sender delivers a
+/// value, or returns [`OneshotCancelled`] if the sender is dropped first.
+pub trait OneshotRecv<T: Send + 'static>: Send + 'static {
+    /// Await the value. Consumes self — a oneshot receiver can only be awaited
+    /// once.
+    fn recv(self) -> impl core::future::Future<Output = Result<T, OneshotCancelled>> + Send;
+}
+
+/// The send half of a bounded MPSC channel.
+///
+/// Implementations must be [`Clone`] so that multiple producers can share the
+/// same channel (e.g. the `Client` handle is `Clone` and every clone must be
+/// able to send control messages to `Inner`).
+pub trait MpscSend<T: Send + 'static>: Clone + Send + 'static {
+    /// Send `value`, waiting if the channel is full. Returns `Err(())` if the
+    /// receiver was dropped.
+    fn send(&self, value: T) -> impl core::future::Future<Output = Result<(), ()>> + Send + '_;
+}
+
+/// The receive half of a bounded MPSC channel.
+pub trait MpscRecv<T: Send + 'static>: Send + 'static {
+    /// Receive the next value, waiting if the channel is empty. Returns `None`
+    /// if all senders were dropped and the channel is empty.
+    fn recv(&mut self) -> impl core::future::Future<Output = Option<T>> + Send + '_;
+
+    /// Poll the channel without blocking. Used by `receive_any_unicast` to
+    /// multiplex across several socket channels in a single `poll_fn` pass.
+    fn poll_recv(&mut self, cx: &mut core::task::Context<'_>) -> core::task::Poll<Option<T>>;
+}
+
+/// The send half of an unbounded MPSC channel.
+///
+/// Unlike [`MpscSend`], sending never blocks — the implementation must buffer
+/// arbitrarily many values (or, for embassy-sync, use a large finite capacity
+/// that is treated as effectively unbounded).
+pub trait UnboundedSend<T: Send + 'static>: Clone + Send + 'static {
+    /// Send `value` without blocking.
+    ///
+    /// # Errors
+    ///
+    /// Returns `Err(value)` if the receiver was dropped.
+    fn send_now(&self, value: T) -> Result<(), T>;
+}
+
+/// The receive half of an unbounded MPSC channel.
+pub trait UnboundedRecv<T: Send + 'static>: Send + 'static {
+    /// Receive the next value, waiting if the channel is empty. Returns `None`
+    /// if all senders were dropped and the channel is empty.
+    fn recv(&mut self) -> impl core::future::Future<Output = Option<T>> + Send + '_;
+}
+
+/// A zero-sized factory that creates channel pairs used by the client's
+/// internal transport.
+///
+/// Abstracting over both `tokio::sync::mpsc` / `oneshot` (std path) and
+/// `embassy-sync::channel::Channel` (bare-metal path) behind a single trait
+/// lets `Client` / `Inner` / `SocketManager` compile without a tokio
+/// dependency when `bare_metal` is active and `tokio` is not.
+///
+/// The three channel families:
+/// - **oneshot** — single-shot rendezvous, capacity 1. Used for command
+///   completion callbacks inside `crate::client::ControlMessage`.
+/// - **bounded** — finite-capacity MPSC queue. Used for the control channel
+///   and per-socket send / receive queues.
+/// - **unbounded** — notionally unbounded MPSC queue (embassy-sync
+///   implementations use a large-capacity channel). Used for the
+///   `ClientUpdate` stream from `Inner` to `Client`.
+///
+/// # Per-`T` opt-in via the `*Pooled<Self>` traits
+///
+/// The three constructor methods are generic over the channeled type
+/// `T`, but a heap-free static-pool implementation needs to map each `T`
+/// to a pre-declared `static` storage area. To make that mapping
+/// type-safe — and to surface "you forgot to declare a pool for this
+/// type" as a compile error rather than a runtime panic — each method
+/// requires the channeled type to implement the corresponding
+/// `*Pooled<Self>` trait and delegates the actual construction to it:
+///
+/// ```ignore
+/// fn oneshot<T>() -> (...) where T: OneshotPooled<Self> { T::oneshot_pair() }
+/// ```
+///
+/// Backends that have a single shared allocator (Tokio, embassy-sync)
+/// publish a blanket `impl<T: Send + 'static> OneshotPooled<Self> for T`
+/// (and its bounded / unbounded peers), so existing user code does not
+/// notice the change. A static-pool backend instead publishes per-`T`
+/// impls (typically generated by a `define_static_channels!` macro) that wire
+/// each `T` to its declared pool. Calling `oneshot::<NotDeclared>()`
+/// against such a backend fails at the call site with
+/// `OneshotPooled<MyChannels> is not implemented for NotDeclared`.
+pub trait ChannelFactory: Clone + Send + Sync + 'static {
+    /// Oneshot sender type.
+    type OneshotSender<T: Send + 'static>: OneshotSend<T>;
+    /// Oneshot receiver type.
+    type OneshotReceiver<T: Send + 'static>: OneshotRecv<T>;
+    /// Create a oneshot channel pair.
+    ///
+    /// Default body delegates to [`OneshotPooled::oneshot_pair`]; impls
+    /// rarely need to override this, they just publish the appropriate
+    /// `OneshotPooled<Self>` impls for the types they support.
+    #[must_use]
+    fn oneshot<T>() -> (Self::OneshotSender<T>, Self::OneshotReceiver<T>)
+    where
+        T: OneshotPooled<Self>,
+    {
+        T::oneshot_pair()
+    }
+
+    /// Bounded-channel sender type. The `const N: usize` parameter is
+    /// the channel capacity; it must match the `N` passed to
+    /// [`Self::bounded`]. Backends that store the capacity at
+    /// construction time (`tokio::sync::mpsc`) ignore it for storage
+    /// purposes; backends that bake it into the type (`embassy-sync`)
+    /// use it directly.
+    type BoundedSender<T: Send + 'static, const N: usize>: MpscSend<T>;
+    /// Bounded-channel receiver type. See [`Self::BoundedSender`].
+    type BoundedReceiver<T: Send + 'static, const N: usize>: MpscRecv<T>;
+    /// Create a bounded channel with capacity `N`.
+    ///
+    /// Default body delegates to [`BoundedPooled::bounded_pair`].
+    #[must_use]
+    fn bounded<T, const N: usize>() -> (Self::BoundedSender<T, N>, Self::BoundedReceiver<T, N>)
+    where
+        T: BoundedPooled<Self, N>,
+    {
+        T::bounded_pair()
+    }
+
+    /// Unbounded-channel sender type.
+    type UnboundedSender<T: Send + 'static>: UnboundedSend<T>;
+    /// Unbounded-channel receiver type.
+    type UnboundedReceiver<T: Send + 'static>: UnboundedRecv<T>;
+    /// Create an unbounded channel.
+    ///
+    /// Default body delegates to [`UnboundedPooled::unbounded_pair`].
+    #[must_use]
+    fn unbounded<T>() -> (Self::UnboundedSender<T>, Self::UnboundedReceiver<T>)
+    where
+        T: UnboundedPooled<Self>,
+    {
+        T::unbounded_pair()
+    }
+}
+
+/// Per-`T` opt-in for [`ChannelFactory::oneshot`].
+///
+/// Implementors declare "this `T` may be channeled through `C`'s oneshot
+/// family" and provide the construction. Backends with a single shared
+/// allocator (Tokio, embassy-sync) publish a blanket
+/// `impl<T: Send + 'static> OneshotPooled<Self> for T`. Static-pool
+/// backends publish per-`T` impls — typically via a macro — each
+/// pointing at a declared `static` pool slot.
+///
+/// The trait is parameterized over the channel factory `C` so a single
+/// `T` may participate in multiple backends without conflicting impls.
+pub trait OneshotPooled<C: ChannelFactory>: Send + Sized + 'static {
+    /// Build a `(sender, receiver)` pair through `C`'s oneshot family.
+    fn oneshot_pair() -> (C::OneshotSender<Self>, C::OneshotReceiver<Self>);
+}
+
+/// Per-`(T, N)` opt-in for [`ChannelFactory::bounded`]. See
+/// [`OneshotPooled`] for the design rationale; this is the bounded peer
+/// with capacity baked into the type.
+pub trait BoundedPooled<C: ChannelFactory, const N: usize>: Send + Sized + 'static {
+    /// Build a `(sender, receiver)` pair through `C`'s bounded family
+    /// with capacity `N`.
+    fn bounded_pair() -> (C::BoundedSender<Self, N>, C::BoundedReceiver<Self, N>);
+}
+
+/// Per-`T` opt-in for [`ChannelFactory::unbounded`]. See
+/// [`OneshotPooled`] for the design rationale.
+pub trait UnboundedPooled<C: ChannelFactory>: Send + Sized + 'static {
+    /// Build a `(sender, receiver)` pair through `C`'s unbounded family.
+    fn unbounded_pair() -> (C::UnboundedSender<Self>, C::UnboundedReceiver<Self>);
+}
+
+#[cfg(test)]
+mod tests {
+    //! The traits are pure interfaces — these tests only verify that
+    //! trivial mock implementations compile and that defaults behave as
+    //! documented.
+
+    use super::*;
+
+    /// `IoErrorKind::is_transient_recv` must classify the well-known
+    /// transient kinds as `true` (so they do not count toward
+    /// `MAX_CONSECUTIVE_RECV_ERRORS` in the per-socket loop) and
+    /// everything else — including the catch-all `Other` — as `false`.
+    /// Regression for H10: an inbound ICMP storm
+    /// (`ConnectionRefused`) was wrongly counted as fatal and tore
+    /// down healthy sockets after 16 transient blips.
+    #[test]
+    fn io_error_kind_transient_classification() {
+        // Transient kinds — must NOT count toward fatal-error cap.
+        assert!(IoErrorKind::ConnectionRefused.is_transient_recv());
+        assert!(IoErrorKind::NetworkUnreachable.is_transient_recv());
+        assert!(IoErrorKind::WouldBlock.is_transient_recv());
+        assert!(IoErrorKind::Interrupted.is_transient_recv());
+        assert!(IoErrorKind::TimedOut.is_transient_recv());
+
+        // Fatal-class kinds — DO count toward the cap.
+        assert!(!IoErrorKind::PermissionDenied.is_transient_recv());
+        assert!(!IoErrorKind::Other.is_transient_recv());
+    }
+
+    /// Drive a Future to completion on the test thread, assuming it never
+    /// yields (as with [`core::future::ready`] and its sync-in-disguise
+    /// peers). Panics if the future returns `Poll::Pending`.
+    fn block_on_ready<F: Future>(fut: F) -> F::Output {
+        use core::pin::pin;
+        use core::task::{Context, Poll, Waker};
+        let waker = Waker::noop();
+        let mut cx = Context::from_waker(waker);
+        let mut fut = pin!(fut);
+        match fut.as_mut().poll(&mut cx) {
+            Poll::Ready(v) => v,
+            Poll::Pending => panic!("future yielded Pending; use a real executor"),
+        }
+    }
+
+    #[test]
+    fn socket_options_default_is_plain_unicast() {
+        let opts = SocketOptions::default();
+        assert!(!opts.reuse_address);
+        assert!(!opts.reuse_port);
+        assert!(opts.multicast_if_v4.is_none());
+        assert!(opts.multicast_loop_v4.is_none());
+    }
+
+    #[test]
+    fn socket_options_new_matches_default() {
+        let a = SocketOptions::new();
+        let b = SocketOptions::default();
+        assert_eq!(a.reuse_address, b.reuse_address);
+        assert_eq!(a.reuse_port, b.reuse_port);
+        assert_eq!(a.multicast_if_v4, b.multicast_if_v4);
+        assert_eq!(a.multicast_loop_v4, b.multicast_loop_v4);
+    }
+
+    // A minimal `TransportSocket` + `TransportFactory` + `Timer`
+    // implementation. Exists purely to prove the trait signatures are
+    // implementable with zero `async` machinery — the futures are produced
+    // by `core::future` primitives, no executor involved. If this module
+    // compiles, any tokio / embassy / smoltcp adapter will also compile.
+    struct NullSocket {
+        addr: SocketAddrV4,
+    }
+
+    impl TransportSocket for NullSocket {
+        type SendFuture<'a> = core::future::Ready<Result<(), TransportError>>;
+        type RecvFuture<'a> = core::future::Ready<Result<ReceivedDatagram, TransportError>>;
+
+        fn send_to<'a>(&'a self, _buf: &'a [u8], _target: SocketAddrV4) -> Self::SendFuture<'a> {
+            core::future::ready(Err(TransportError::Unsupported))
+        }
+
+        fn recv_from<'a>(&'a self, _buf: &'a mut [u8]) -> Self::RecvFuture<'a> {
+            core::future::ready(Err(TransportError::Unsupported))
+        }
+
+        fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+            Ok(self.addr)
+        }
+
+        fn join_multicast_v4(
+            &self,
+            _group: Ipv4Addr,
+            _iface: Ipv4Addr,
+        ) -> Result<(), TransportError> {
+            Err(TransportError::Unsupported)
+        }
+
+        fn leave_multicast_v4(
+            &self,
+            _group: Ipv4Addr,
+            _iface: Ipv4Addr,
+        ) -> Result<(), TransportError> {
+            Err(TransportError::Unsupported)
+        }
+    }
+
+    struct NullFactory;
+
+    impl TransportFactory for NullFactory {
+        type Socket = NullSocket;
+        type BindFuture<'a> = core::future::Ready<Result<Self::Socket, TransportError>>;
+
+        fn bind<'a>(
+            &'a self,
+            addr: SocketAddrV4,
+            _options: &'a SocketOptions,
+        ) -> Self::BindFuture<'a> {
+            core::future::ready(Ok(NullSocket { addr }))
+        }
+    }
+
+    struct NullTimer;
+
+    impl Timer for NullTimer {
+        type SleepFuture<'a> = core::future::Ready<()>;
+
+        fn sleep(&self, _duration: Duration) -> Self::SleepFuture<'_> {
+            core::future::ready(())
+        }
+    }
+
+    #[test]
+    fn null_factory_bind_resolves_with_addr() {
+        let factory = NullFactory;
+        let addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0);
+        let options = SocketOptions::default();
+        let sock = block_on_ready(factory.bind(addr, &options)).expect("bind");
+        assert_eq!(sock.local_addr().unwrap(), addr);
+    }
+
+    #[test]
+    fn max_datagram_size_default_is_udp_buffer_size() {
+        let sock = NullSocket {
+            addr: SocketAddrV4::new(Ipv4Addr::LOCALHOST, 0),
+        };
+        assert_eq!(sock.max_datagram_size(), crate::UDP_BUFFER_SIZE);
+    }
+
+    #[test]
+    fn null_timer_sleep_resolves_immediately() {
+        let timer = NullTimer;
+        block_on_ready(timer.sleep(Duration::from_secs(1)));
+    }
+
+    #[test]
+    fn received_datagram_construct_and_field_access() {
+        let d = ReceivedDatagram {
+            bytes_received: 42,
+            source: SocketAddrV4::new(Ipv4Addr::LOCALHOST, 9999),
+            truncated: false,
+        };
+        assert_eq!(d.bytes_received, 42);
+        assert!(!d.truncated);
+    }
+
+    #[test]
+    fn io_error_kind_variants_are_distinct() {
+        // Compile-time check that all variants are constructible and
+        // distinguishable — Eq is derived, so assert some inequalities.
+        assert_ne!(IoErrorKind::TimedOut, IoErrorKind::Interrupted);
+        assert_ne!(IoErrorKind::PermissionDenied, IoErrorKind::Other);
+        assert_ne!(
+            IoErrorKind::ConnectionRefused,
+            IoErrorKind::NetworkUnreachable
+        );
+    }
+
+    #[test]
+    fn transport_error_io_wraps_kind() {
+        let e = TransportError::Io(IoErrorKind::TimedOut);
+        assert_eq!(e, TransportError::Io(IoErrorKind::TimedOut));
+        assert_ne!(e, TransportError::AddressInUse);
+    }
+
+    // Minimal no-op implementations to verify that E2ERegistryHandle and
+    // InterfaceHandle are implementable without any executor machinery.
+    #[derive(Clone)]
+    struct NullE2ERegistry;
+
+    impl E2ERegistryHandle for NullE2ERegistry {
+        fn register(&self, _key: E2EKey, _profile: E2EProfile) {}
+        fn unregister(&self, _key: &E2EKey) {}
+        fn contains_key(&self, _key: &E2EKey) -> bool {
+            false
+        }
+        fn protect(
+            &self,
+            _key: E2EKey,
+            _payload: &[u8],
+            _upper_header: [u8; 8],
+            _output: &mut [u8],
+        ) -> Option<Result<usize, E2EError>> {
+            None
+        }
+        fn check<'a>(
+            &self,
+            _key: E2EKey,
+            _payload: &'a [u8],
+            _upper_header: [u8; 8],
+        ) -> Option<(E2ECheckStatus, &'a [u8])> {
+            None
+        }
+    }
+
+    #[derive(Clone)]
+    struct NullInterface(Ipv4Addr);
+
+    impl InterfaceHandle for NullInterface {
+        fn get(&self) -> Ipv4Addr {
+            self.0
+        }
+        fn set(&self, _addr: Ipv4Addr) {}
+    }
+
+    #[test]
+    fn null_e2e_registry_compiles() {
+        let r = NullE2ERegistry;
+        let key = E2EKey::new(0, 0);
+        r.register(
+            key,
+            crate::e2e::E2EProfile::Profile4(crate::e2e::Profile4Config::new(0, 8)),
+        );
+        assert!(!r.contains_key(&key));
+        assert!(r.check(key, b"hello", [0; 8]).is_none());
+    }
+
+    #[test]
+    fn null_interface_get_set() {
+        let h = NullInterface(Ipv4Addr::LOCALHOST);
+        assert_eq!(h.get(), Ipv4Addr::LOCALHOST);
+        h.set(Ipv4Addr::UNSPECIFIED); // no-op in null impl
+        assert_eq!(h.get(), Ipv4Addr::LOCALHOST); // unchanged
+    }
+}
diff --git a/tests/bare_metal_client.rs b/tests/bare_metal_client.rs
new file mode 100644
index 0000000..3de10d3
--- /dev/null
+++ b/tests/bare_metal_client.rs
@@ -0,0 +1,287 @@
+//! Witness test: prove that `Client` can be constructed and driven
+//! without the `client-tokio` feature, using a static-pool
+//! [`ChannelFactory`] declared via [`define_static_channels!`] — the
+//! production-bound bare-metal path (no per-call heap allocation for
+//! channel storage).
+//!
+//! [`ChannelFactory`]: simple_someip::transport::ChannelFactory
+//! [`define_static_channels!`]: simple_someip::define_static_channels
+//!
+//! Originally a witness using `EmbassySyncChannels` (which still
+//! heap-allocates an `Arc<Channel<...>>` per call). The `static_channels`
+//! module and `define_static_channels!` macro now provide a truly
+//! heap-free path; this test exercises that macro end-to-end against
+//! `Client::new_with_deps`.
+//!
+//! `simple-someip` is compiled with `default-features = false,
+//! features = ["client", "bare_metal"]` per the `required-features`
+//! gate below — NO tokio, NO socket2 pulled in via the crate itself.
+//! The test runtime still uses the host's tokio (a `dev-dependency`)
+//! for `#[tokio::test]` execution, but every type fed to
+//! `Client::new_with_deps` is from the no-tokio side: a hand-rolled
+//! mock `TransportFactory`, a hand-rolled `Timer`, the
+//! macro-declared static-pool channels, and a `Spawner` that wraps
+//! `tokio::spawn` purely as the test executor.
+//!
+//! Compile-witness alone (Cargo `required-features` proving the test
+//! crate compiles without `client-tokio`) is the load-bearing
+//! assertion; the runtime send/recv at the end is a sanity check
+//! that the wired-up generics actually drive a working pipeline.
+//! Per-call heap-allocation absence is verified separately in
+//! `tests/static_channels_alloc_witness.rs`.
+#![cfg(all(feature = "client", feature = "bare_metal"))]
+
+use core::future::Future;
+use core::net::{Ipv4Addr, SocketAddrV4};
+use core::pin::Pin;
+use core::task::{Context, Poll};
+use core::time::Duration;
+use std::collections::VecDeque;
+use std::sync::{Arc, Mutex};
+
+use simple_someip::client::Error as ClientError;
+use simple_someip::client::{ClientUpdate, ControlMessage, ReceivedMessage, SendMessage};
+use simple_someip::define_static_channels;
+use simple_someip::e2e::E2ERegistry;
+use simple_someip::protocol::sd::RebootFlag;
+use simple_someip::transport::{
+    ReceivedDatagram, SocketOptions, Spawner, Timer, TransportError, TransportFactory,
+    TransportSocket,
+};
+use simple_someip::{Client, ClientDeps, RawPayload};
+
+// ── Static-pool channel factory declared via the macro ────────────────
+//
+// One pool per channeled `T`. Pool sizes here are deliberately small
+// for a witness test; production firmware would size pools to the
+// workload's high-water mark.
+define_static_channels! {
+    name: TestStaticChannels,
+    oneshot: [
+        (Result<(), ClientError>, 8),
+        (Result<RawPayload, ClientError>, 4),
+        (Result<RebootFlag, ClientError>, 4),
+    ],
+    bounded: [
+        ((ControlMessage<RawPayload, TestStaticChannels>, 4), 1),
+        ((SendMessage<RawPayload, TestStaticChannels>, 16), 4),
+        ((Result<ReceivedMessage<RawPayload>, ClientError>, 16), 4),
+    ],
+    unbounded: [
+        (ClientUpdate<RawPayload>, 1),
+    ],
+}
+
+// ── Mock transport ─────────────────────────────────────────────────────
+
+#[derive(Default)]
+struct MockPipe {
+    sent: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound_waker: Mutex<Option<core::task::Waker>>,
+}
+
+#[derive(Clone)]
+struct MockFactory {
+    pipe: Arc<MockPipe>,
+    local_port: Arc<Mutex<u16>>,
+}
+
+impl TransportFactory for MockFactory {
+    type Socket = MockSocket;
+    type BindFuture<'a> =
+        core::pin::Pin<Box<dyn Future<Output = Result<Self::Socket, TransportError>> + Send + 'a>>;
+    fn bind<'a>(&'a self, addr: SocketAddrV4, _options: &'a SocketOptions) -> Self::BindFuture<'a> {
+        let pipe = Arc::clone(&self.pipe);
+        let mut p = self.local_port.lock().unwrap();
+        // Mock: assign port deterministically. If caller asked for 0,
+        // hand out an incrementing fake ephemeral port.
+        let port = if addr.port() == 0 {
+            let next = *p + 1;
+            *p = next;
+            30000 + next
+        } else {
+            addr.port()
+        };
+        let local = SocketAddrV4::new(*addr.ip(), port);
+        Box::pin(async move { Ok(MockSocket { pipe, local }) })
+    }
+}
+
+struct MockSocket {
+    pipe: Arc<MockPipe>,
+    local: SocketAddrV4,
+}
+
+struct MockSendFut {
+    pipe: Arc<MockPipe>,
+    bytes: Option<Vec<u8>>,
+    target: SocketAddrV4,
+}
+
+impl Future for MockSendFut {
+    type Output = Result<(), TransportError>;
+    fn poll(self: Pin<&mut Self>, _cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        if let Some(bytes) = me.bytes.take() {
+            me.pipe.sent.lock().unwrap().push_back((bytes, me.target));
+        }
+        Poll::Ready(Ok(()))
+    }
+}
+
+struct MockRecvFut<'a> {
+    pipe: Arc<MockPipe>,
+    buf: &'a mut [u8],
+}
+
+impl Future for MockRecvFut<'_> {
+    type Output = Result<ReceivedDatagram, TransportError>;
+    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        let entry = me.pipe.inbound.lock().unwrap().pop_front();
+        match entry {
+            Some((bytes, source)) => {
+                let n = bytes.len().min(me.buf.len());
+                me.buf[..n].copy_from_slice(&bytes[..n]);
+                Poll::Ready(Ok(ReceivedDatagram {
+                    bytes_received: n,
+                    source,
+                    truncated: n < bytes.len(),
+                }))
+            }
+            None => {
+                // Park on the pipe's waker. Real bare-metal impls park
+                // the task on an interrupt-driven waker;
+                // wake_by_ref-on-empty would CPU-peg the test runtime.
+                *me.pipe.inbound_waker.lock().unwrap() = Some(cx.waker().clone());
+                // Re-check after registering to close the lost-wakeup
+                // window between the pop_front above and the waker
+                // store here.
+                if let Some((bytes, source)) = me.pipe.inbound.lock().unwrap().pop_front() {
+                    let n = bytes.len().min(me.buf.len());
+                    me.buf[..n].copy_from_slice(&bytes[..n]);
+                    return Poll::Ready(Ok(ReceivedDatagram {
+                        bytes_received: n,
+                        source,
+                        truncated: n < bytes.len(),
+                    }));
+                }
+                Poll::Pending
+            }
+        }
+    }
+}
+
+impl TransportSocket for MockSocket {
+    type SendFuture<'a> = MockSendFut;
+    type RecvFuture<'a> = MockRecvFut<'a>;
+
+    fn send_to<'a>(&'a self, buf: &'a [u8], target: SocketAddrV4) -> Self::SendFuture<'a> {
+        MockSendFut {
+            pipe: Arc::clone(&self.pipe),
+            bytes: Some(buf.to_vec()),
+            target,
+        }
+    }
+
+    fn recv_from<'a>(&'a self, buf: &'a mut [u8]) -> Self::RecvFuture<'a> {
+        MockRecvFut {
+            pipe: Arc::clone(&self.pipe),
+            buf,
+        }
+    }
+
+    fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+        Ok(self.local)
+    }
+
+    fn join_multicast_v4(&self, _group: Ipv4Addr, _iface: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+
+    fn leave_multicast_v4(&self, _group: Ipv4Addr, _iface: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+}
+
+// ── Mock Timer ────────────────────────────────────────────────────────
+
+struct MockTimer;
+impl Timer for MockTimer {
+    type SleepFuture<'a> = core::pin::Pin<Box<dyn Future<Output = ()> + Send + 'a>>;
+    fn sleep(&self, duration: Duration) -> Self::SleepFuture<'_> {
+        // Honor `duration` — the `Timer` trait's contract is that
+        // implementations MAY overshoot but MUST NOT undershoot. The
+        // test runtime is `#[tokio::test]` (tokio is a `dev-dependency`),
+        // so using `tokio::time::sleep` is fine — it only proves the
+        // production crate's no-tokio path compiles. A real bare-metal
+        // impl would replace this with `embassy_time::Timer::after`.
+        Box::pin(async move {
+            tokio::time::sleep(duration).await;
+        })
+    }
+}
+
+// ── Spawner that delegates to tokio::spawn (test-runtime executor) ──
+
+struct TokioBackedSpawner;
+impl Spawner for TokioBackedSpawner {
+    fn spawn(&self, future: impl Future<Output = ()> + Send + 'static) {
+        drop(tokio::spawn(future));
+    }
+}
+
+// ── Test ──────────────────────────────────────────────────────────────
+
+#[tokio::test]
+async fn client_constructible_without_client_tokio_feature() {
+    let pipe = Arc::new(MockPipe::default());
+    let factory = MockFactory {
+        pipe: Arc::clone(&pipe),
+        local_port: Arc::new(Mutex::new(0)),
+    };
+
+    // Custom InterfaceHandle and E2ERegistryHandle that don't require
+    // tokio. We use std Arc/Mutex/RwLock impls (which are gated by
+    // `feature = "std"`, not by `client-tokio`).
+    let interface_handle: Arc<std::sync::RwLock<Ipv4Addr>> =
+        Arc::new(std::sync::RwLock::new(Ipv4Addr::LOCALHOST));
+    let e2e_handle: Arc<Mutex<E2ERegistry>> = Arc::new(Mutex::new(E2ERegistry::new()));
+
+    let (client, _updates, run_fut) = Client::<
+        RawPayload,
+        Arc<Mutex<E2ERegistry>>,
+        Arc<std::sync::RwLock<Ipv4Addr>>,
+        TestStaticChannels,
+    >::new_with_deps(
+        ClientDeps {
+            factory,
+            spawner: TokioBackedSpawner,
+            timer: MockTimer,
+            e2e_registry: e2e_handle,
+            interface: interface_handle,
+        },
+        false,
+    );
+
+    // Compile-time witness: the constructor accepts no-tokio types,
+    // returns a `Client` + updates triple, and the run-loop future
+    // is `Send + 'static` (proven by the `tokio::spawn` below).
+    let run_handle = tokio::spawn(run_fut);
+
+    // Verify the Client handle is usable: read its interface address.
+    assert_eq!(client.interface(), Ipv4Addr::LOCALHOST);
+
+    // Tear down. `TestStaticChannels`'s bounded sender Drop sets the
+    // slot's `closed` flag and wakes the receiver, so dropping all
+    // `Client` clones lets the run loop's control-channel `recv`
+    // resolve to `None` and the loop exits naturally — but it's
+    // simpler to abort the spawned task directly here. The witness
+    // goal is the compile + start-up sanity check, not graceful
+    // shutdown semantics.
+    run_handle.abort();
+    drop(client);
+
+    tokio::time::sleep(Duration::from_millis(50)).await;
+}
diff --git a/tests/bare_metal_client_local.rs b/tests/bare_metal_client_local.rs
new file mode 100644
index 0000000..b670436
--- /dev/null
+++ b/tests/bare_metal_client_local.rs
@@ -0,0 +1,223 @@
+//! Witness that `Client::new_with_deps_local` accepts a [`LocalSpawner`]
+//! and returns a (possibly `!Send`) run-loop future. Sibling test file
+//! to `bare_metal_client.rs` — kept separate so it has its own static
+//! channel pool and can't collide with the Send-flavored Client
+//! construction witness when cargo runs the tests in parallel.
+#![cfg(all(feature = "client", feature = "bare_metal"))]
+
+use core::future::Future;
+use core::net::{Ipv4Addr, SocketAddrV4};
+use core::pin::Pin;
+use core::task::{Context, Poll};
+use core::time::Duration;
+use std::collections::VecDeque;
+use std::sync::{Arc, Mutex};
+
+use simple_someip::client::Error as ClientError;
+use simple_someip::client::{ClientUpdate, ControlMessage, ReceivedMessage, SendMessage};
+use simple_someip::define_static_channels;
+use simple_someip::e2e::E2ERegistry;
+use simple_someip::protocol::sd::RebootFlag;
+use simple_someip::transport::{
+    LocalSpawner, ReceivedDatagram, SocketOptions, Timer, TransportError, TransportFactory,
+    TransportSocket,
+};
+use simple_someip::{Client, ClientDeps, RawPayload};
+
+define_static_channels! {
+    name: LocalChannels,
+    oneshot: [
+        (Result<(), ClientError>, 4),
+        (Result<RawPayload, ClientError>, 2),
+        (Result<RebootFlag, ClientError>, 2),
+    ],
+    bounded: [
+        ((ControlMessage<RawPayload, LocalChannels>, 4), 2),
+        ((SendMessage<RawPayload, LocalChannels>, 16), 2),
+        ((Result<ReceivedMessage<RawPayload>, ClientError>, 16), 2),
+    ],
+    unbounded: [
+        (ClientUpdate<RawPayload>, 2),
+    ],
+}
+
+// ── Mock transport (mirrors bare_metal_client.rs) ─────────────────────
+
+#[derive(Default)]
+struct MockPipe {
+    sent: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound_waker: Mutex<Option<core::task::Waker>>,
+}
+
+#[derive(Clone)]
+struct MockFactory {
+    pipe: Arc<MockPipe>,
+    local_port: Arc<Mutex<u16>>,
+}
+
+impl TransportFactory for MockFactory {
+    type Socket = MockSocket;
+    type BindFuture<'a> =
+        core::pin::Pin<Box<dyn Future<Output = Result<Self::Socket, TransportError>> + 'a>>;
+    fn bind<'a>(&'a self, addr: SocketAddrV4, _options: &'a SocketOptions) -> Self::BindFuture<'a> {
+        let pipe = Arc::clone(&self.pipe);
+        let mut p = self.local_port.lock().unwrap();
+        let port = if addr.port() == 0 {
+            let next = *p + 1;
+            *p = next;
+            40000 + next
+        } else {
+            addr.port()
+        };
+        let local = SocketAddrV4::new(*addr.ip(), port);
+        Box::pin(async move { Ok(MockSocket { pipe, local }) })
+    }
+}
+
+struct MockSocket {
+    pipe: Arc<MockPipe>,
+    local: SocketAddrV4,
+}
+
+struct MockSendFut {
+    pipe: Arc<MockPipe>,
+    bytes: Option<Vec<u8>>,
+    target: SocketAddrV4,
+}
+
+impl Future for MockSendFut {
+    type Output = Result<(), TransportError>;
+    fn poll(self: Pin<&mut Self>, _cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        if let Some(bytes) = me.bytes.take() {
+            me.pipe.sent.lock().unwrap().push_back((bytes, me.target));
+        }
+        Poll::Ready(Ok(()))
+    }
+}
+
+struct MockRecvFut<'a> {
+    pipe: Arc<MockPipe>,
+    buf: &'a mut [u8],
+}
+
+impl Future for MockRecvFut<'_> {
+    type Output = Result<ReceivedDatagram, TransportError>;
+    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        let entry = me.pipe.inbound.lock().unwrap().pop_front();
+        match entry {
+            Some((bytes, source)) => {
+                let n = bytes.len().min(me.buf.len());
+                me.buf[..n].copy_from_slice(&bytes[..n]);
+                Poll::Ready(Ok(ReceivedDatagram {
+                    bytes_received: n,
+                    source,
+                    truncated: n < bytes.len(),
+                }))
+            }
+            None => {
+                *me.pipe.inbound_waker.lock().unwrap() = Some(cx.waker().clone());
+                if let Some((bytes, source)) = me.pipe.inbound.lock().unwrap().pop_front() {
+                    let n = bytes.len().min(me.buf.len());
+                    me.buf[..n].copy_from_slice(&bytes[..n]);
+                    return Poll::Ready(Ok(ReceivedDatagram {
+                        bytes_received: n,
+                        source,
+                        truncated: n < bytes.len(),
+                    }));
+                }
+                Poll::Pending
+            }
+        }
+    }
+}
+
+impl TransportSocket for MockSocket {
+    type SendFuture<'a> = MockSendFut;
+    type RecvFuture<'a> = MockRecvFut<'a>;
+
+    fn send_to<'a>(&'a self, buf: &'a [u8], target: SocketAddrV4) -> Self::SendFuture<'a> {
+        MockSendFut {
+            pipe: Arc::clone(&self.pipe),
+            bytes: Some(buf.to_vec()),
+            target,
+        }
+    }
+
+    fn recv_from<'a>(&'a self, buf: &'a mut [u8]) -> Self::RecvFuture<'a> {
+        MockRecvFut {
+            pipe: Arc::clone(&self.pipe),
+            buf,
+        }
+    }
+
+    fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+        Ok(self.local)
+    }
+
+    fn join_multicast_v4(&self, _g: Ipv4Addr, _i: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+    fn leave_multicast_v4(&self, _g: Ipv4Addr, _i: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+}
+
+struct MockTimer;
+impl Timer for MockTimer {
+    type SleepFuture<'a> = core::pin::Pin<Box<dyn Future<Output = ()> + 'a>>;
+    fn sleep(&self, duration: Duration) -> Self::SleepFuture<'_> {
+        Box::pin(async move {
+            tokio::time::sleep(duration).await;
+        })
+    }
+}
+
+struct LocalTokioSpawner;
+impl LocalSpawner for LocalTokioSpawner {
+    fn spawn_local(&self, future: impl Future<Output = ()> + 'static) {
+        drop(tokio::task::spawn_local(future));
+    }
+}
+
+#[tokio::test]
+async fn client_constructible_with_local_spawner() {
+    tokio::task::LocalSet::new()
+        .run_until(async move {
+            let pipe = Arc::new(MockPipe::default());
+            let factory = MockFactory {
+                pipe: Arc::clone(&pipe),
+                local_port: Arc::new(Mutex::new(0)),
+            };
+
+            let interface_handle: Arc<std::sync::RwLock<Ipv4Addr>> =
+                Arc::new(std::sync::RwLock::new(Ipv4Addr::LOCALHOST));
+            let e2e_handle: Arc<Mutex<E2ERegistry>> = Arc::new(Mutex::new(E2ERegistry::new()));
+
+            let (client, _updates, run_fut) = Client::<
+                RawPayload,
+                Arc<Mutex<E2ERegistry>>,
+                Arc<std::sync::RwLock<Ipv4Addr>>,
+                LocalChannels,
+            >::new_with_deps_local(
+                ClientDeps {
+                    factory,
+                    spawner: LocalTokioSpawner,
+                    timer: MockTimer,
+                    e2e_registry: e2e_handle,
+                    interface: interface_handle,
+                },
+                false,
+            );
+
+            let run_handle = tokio::task::spawn_local(run_fut);
+            assert_eq!(client.interface(), Ipv4Addr::LOCALHOST);
+
+            run_handle.abort();
+            drop(client);
+            tokio::time::sleep(Duration::from_millis(50)).await;
+        })
+        .await;
+}
diff --git a/tests/bare_metal_e2e.rs b/tests/bare_metal_e2e.rs
new file mode 100644
index 0000000..a90a253
--- /dev/null
+++ b/tests/bare_metal_e2e.rs
@@ -0,0 +1,563 @@
+//! End-to-end bare-metal test: wire a no-tokio Client and Server through
+//! a shared mock pipe and drive a request/response roundtrip.
+//!
+//! This test proves that the full `Client` + `Server` path works without
+//! the `client-tokio` / `server-tokio` features. Both sides use:
+//! - A shared `MockPipe` for transport (bytes sent by one side appear in
+//!   the other's inbound queue)
+//! - `define_static_channels!` for the client's channel factory
+//! - `Arc<Mutex<E2ERegistry>>` for E2E (the std-backed impl)
+//! - A test-runtime tokio spawner/timer (proving the *trait* compiles,
+//!   not that tokio is absent from the test harness)
+//!
+//! The test exercises:
+//! 1. Server startup and SD announcement broadcast
+//! 2. Client receiving the SD offer (via the shared pipe)
+//! 3. Client sending a request to the server
+//! 4. Server run-loop receiving and echoing the request
+//! 5. Client receiving the response
+#![cfg(all(feature = "client", feature = "server", feature = "bare_metal"))]
+
+use core::future::Future;
+use core::net::{Ipv4Addr, SocketAddrV4};
+use core::pin::Pin;
+use core::task::{Context, Poll};
+use core::time::Duration;
+use std::collections::VecDeque;
+use std::sync::{Arc, Mutex, RwLock};
+
+use simple_someip::PayloadWireFormat;
+use simple_someip::client::Error as ClientError;
+use simple_someip::client::{ClientUpdate, ControlMessage, ReceivedMessage, SendMessage};
+use simple_someip::define_static_channels;
+use simple_someip::e2e::E2ERegistry;
+use simple_someip::protocol::sd::RebootFlag;
+use simple_someip::protocol::{
+    Header, Message, MessageId, MessageType, MessageTypeField, ReturnCode,
+};
+use simple_someip::server::{ServerConfig, SubscribeError, Subscriber, SubscriptionHandle};
+use simple_someip::transport::{
+    ReceivedDatagram, SocketOptions, Spawner, Timer, TransportError, TransportFactory,
+    TransportSocket,
+};
+use simple_someip::{Client, ClientDeps, RawPayload, Server, ServerDeps};
+
+// ── Static-pool channel factory ───────────────────────────────────────
+
+define_static_channels! {
+    name: E2ETestChannels,
+    oneshot: [
+        (Result<(), ClientError>, 16),
+        (Result<RawPayload, ClientError>, 8),
+        (Result<RebootFlag, ClientError>, 8),
+    ],
+    bounded: [
+        ((ControlMessage<RawPayload, E2ETestChannels>, 4), 4),
+        ((SendMessage<RawPayload, E2ETestChannels>, 16), 8),
+        ((Result<ReceivedMessage<RawPayload>, ClientError>, 16), 8),
+    ],
+    unbounded: [
+        (ClientUpdate<RawPayload>, 4),
+    ],
+}
+
+// ── Shared mock pipe (bidirectional) ──────────────────────────────────
+//
+// The "network" is modeled as two separate pipes:
+// - `client_to_server`: bytes sent by client, received by server
+// - `server_to_client`: bytes sent by server, received by client
+//
+// Each side's MockSocket is configured to send to one pipe and receive
+// from the other.
+
+#[derive(Default)]
+struct MockPipe {
+    queue: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    waker: Mutex<Option<core::task::Waker>>,
+}
+
+impl MockPipe {
+    fn send(&self, bytes: Vec<u8>, source: SocketAddrV4) {
+        self.queue.lock().unwrap().push_back((bytes, source));
+        let waker = self.waker.lock().unwrap().take();
+        if let Some(waker) = waker {
+            waker.wake();
+        }
+    }
+
+    fn try_recv(&self) -> Option<(Vec<u8>, SocketAddrV4)> {
+        self.queue.lock().unwrap().pop_front()
+    }
+
+    fn register_waker(&self, waker: core::task::Waker) {
+        *self.waker.lock().unwrap() = Some(waker);
+    }
+}
+
+struct SharedNetwork {
+    client_to_server: Arc<MockPipe>,
+    server_to_client: Arc<MockPipe>,
+}
+
+impl SharedNetwork {
+    fn new() -> Self {
+        Self {
+            client_to_server: Arc::new(MockPipe::default()),
+            server_to_client: Arc::new(MockPipe::default()),
+        }
+    }
+}
+
+// ── Mock transport factory ────────────────────────────────────────────
+
+#[derive(Clone)]
+struct MockFactory {
+    /// Pipe to send to
+    tx_pipe: Arc<MockPipe>,
+    /// Pipe to receive from
+    rx_pipe: Arc<MockPipe>,
+    /// Port counter for ephemeral binds
+    next_port: Arc<Mutex<u16>>,
+}
+
+impl TransportFactory for MockFactory {
+    type Socket = MockSocket;
+    type BindFuture<'a> =
+        core::pin::Pin<Box<dyn Future<Output = Result<Self::Socket, TransportError>> + Send + 'a>>;
+
+    fn bind<'a>(&'a self, addr: SocketAddrV4, _options: &'a SocketOptions) -> Self::BindFuture<'a> {
+        let tx = Arc::clone(&self.tx_pipe);
+        let rx = Arc::clone(&self.rx_pipe);
+        let port = if addr.port() == 0 {
+            let mut p = self.next_port.lock().unwrap();
+            *p += 1;
+            40000 + *p
+        } else {
+            addr.port()
+        };
+        let local = SocketAddrV4::new(*addr.ip(), port);
+        Box::pin(async move {
+            Ok(MockSocket {
+                tx_pipe: tx,
+                rx_pipe: rx,
+                local,
+            })
+        })
+    }
+}
+
+struct MockSocket {
+    tx_pipe: Arc<MockPipe>,
+    rx_pipe: Arc<MockPipe>,
+    local: SocketAddrV4,
+}
+
+struct MockSendFut {
+    pipe: Arc<MockPipe>,
+    bytes: Option<Vec<u8>>,
+    source: SocketAddrV4,
+}
+
+impl Future for MockSendFut {
+    type Output = Result<(), TransportError>;
+    fn poll(self: Pin<&mut Self>, _cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        if let Some(bytes) = me.bytes.take() {
+            me.pipe.send(bytes, me.source);
+        }
+        Poll::Ready(Ok(()))
+    }
+}
+
+struct MockRecvFut<'a> {
+    pipe: Arc<MockPipe>,
+    buf: &'a mut [u8],
+}
+
+impl Future for MockRecvFut<'_> {
+    type Output = Result<ReceivedDatagram, TransportError>;
+    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        if let Some((bytes, source)) = me.pipe.try_recv() {
+            let n = bytes.len().min(me.buf.len());
+            me.buf[..n].copy_from_slice(&bytes[..n]);
+            return Poll::Ready(Ok(ReceivedDatagram {
+                bytes_received: n,
+                source,
+                truncated: n < bytes.len(),
+            }));
+        }
+        me.pipe.register_waker(cx.waker().clone());
+        // Re-check after registering
+        if let Some((bytes, source)) = me.pipe.try_recv() {
+            let n = bytes.len().min(me.buf.len());
+            me.buf[..n].copy_from_slice(&bytes[..n]);
+            return Poll::Ready(Ok(ReceivedDatagram {
+                bytes_received: n,
+                source,
+                truncated: n < bytes.len(),
+            }));
+        }
+        Poll::Pending
+    }
+}
+
+impl TransportSocket for MockSocket {
+    type SendFuture<'a> = MockSendFut;
+    type RecvFuture<'a> = MockRecvFut<'a>;
+
+    fn send_to<'a>(&'a self, buf: &'a [u8], _target: SocketAddrV4) -> Self::SendFuture<'a> {
+        MockSendFut {
+            pipe: Arc::clone(&self.tx_pipe),
+            bytes: Some(buf.to_vec()),
+            source: self.local,
+        }
+    }
+
+    fn recv_from<'a>(&'a self, buf: &'a mut [u8]) -> Self::RecvFuture<'a> {
+        MockRecvFut {
+            pipe: Arc::clone(&self.rx_pipe),
+            buf,
+        }
+    }
+
+    fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+        Ok(self.local)
+    }
+
+    fn join_multicast_v4(&self, _group: Ipv4Addr, _iface: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+
+    fn leave_multicast_v4(&self, _group: Ipv4Addr, _iface: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+}
+
+// ── Mock Timer ────────────────────────────────────────────────────────
+
+#[derive(Clone)]
+struct MockTimer;
+
+impl Timer for MockTimer {
+    type SleepFuture<'a> = core::pin::Pin<Box<dyn Future<Output = ()> + Send + 'a>>;
+    fn sleep(&self, duration: Duration) -> Self::SleepFuture<'_> {
+        Box::pin(async move {
+            tokio::time::sleep(duration).await;
+        })
+    }
+}
+
+// ── Mock Spawner ──────────────────────────────────────────────────────
+
+struct TokioBackedSpawner;
+
+impl Spawner for TokioBackedSpawner {
+    fn spawn(&self, future: impl Future<Output = ()> + Send + 'static) {
+        drop(tokio::spawn(future));
+    }
+}
+
+// ── Mock SubscriptionHandle ───────────────────────────────────────────
+
+type SubKey = (u16, u16, u16, SocketAddrV4);
+
+#[derive(Clone, Default)]
+struct MockSubscriptions(Arc<Mutex<Vec<SubKey>>>);
+
+impl SubscriptionHandle for MockSubscriptions {
+    fn subscribe(
+        &self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        subscriber_addr: SocketAddrV4,
+    ) -> impl Future<Output = Result<(), SubscribeError>> + '_ {
+        let this = self.0.clone();
+        async move {
+            let mut guard = this.lock().unwrap();
+            let key = (service_id, instance_id, event_group_id, subscriber_addr);
+            if !guard.contains(&key) {
+                guard.push(key);
+            }
+            Ok(())
+        }
+    }
+
+    fn unsubscribe(
+        &self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        subscriber_addr: SocketAddrV4,
+    ) -> impl Future<Output = ()> + '_ {
+        let this = self.0.clone();
+        async move {
+            let mut guard = this.lock().unwrap();
+            guard.retain(|e| *e != (service_id, instance_id, event_group_id, subscriber_addr));
+        }
+    }
+
+    fn for_each_subscriber<'a, F>(
+        &'a self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        mut f: F,
+    ) -> impl Future<Output = usize> + 'a
+    where
+        F: FnMut(&Subscriber) + 'a,
+    {
+        let this = self.0.clone();
+        async move {
+            let guard = this.lock().unwrap();
+            let mut count = 0;
+            for (s, i, e, addr) in guard.iter() {
+                if *s == service_id && *i == instance_id && *e == event_group_id {
+                    let sub = Subscriber::new(*addr, *s, *i, *e);
+                    f(&sub);
+                    count += 1;
+                }
+            }
+            count
+        }
+    }
+}
+
+// ── Tests ─────────────────────────────────────────────────────────────
+
+/// Proves that a bare-metal Client and Server can be wired together
+/// through a shared mock transport and that the Server's SD announcement
+/// is visible to the Client.
+#[tokio::test]
+async fn client_receives_server_sd_announcement() {
+    let network = SharedNetwork::new();
+
+    // Server sends to server_to_client, receives from client_to_server
+    let server_factory = MockFactory {
+        tx_pipe: Arc::clone(&network.server_to_client),
+        rx_pipe: Arc::clone(&network.client_to_server),
+        next_port: Arc::new(Mutex::new(0)),
+    };
+
+    // Client sends to client_to_server, receives from server_to_client
+    let client_factory = MockFactory {
+        tx_pipe: Arc::clone(&network.client_to_server),
+        rx_pipe: Arc::clone(&network.server_to_client),
+        next_port: Arc::new(Mutex::new(100)),
+    };
+
+    // Create server
+    let server_e2e: Arc<Mutex<E2ERegistry>> = Arc::new(Mutex::new(E2ERegistry::new()));
+    let server_subs = MockSubscriptions::default();
+    let server_config = ServerConfig::new(Ipv4Addr::LOCALHOST, 30500, 0x1234, 1);
+
+    let server_deps = ServerDeps {
+        factory: server_factory,
+        timer: MockTimer,
+        e2e_registry: server_e2e,
+        subscriptions: server_subs,
+    };
+
+    let server: Server<Arc<Mutex<E2ERegistry>>, MockSubscriptions, MockFactory, MockTimer> =
+        Server::new_with_deps(server_deps, server_config, false)
+            .await
+            .expect("server creation");
+
+    // Start server announcement loop
+    let announce_fut = server.announcement_loop().expect("announcement_loop");
+    let announce_handle = tokio::spawn(announce_fut);
+
+    // Create client
+    let client_e2e: Arc<Mutex<E2ERegistry>> = Arc::new(Mutex::new(E2ERegistry::new()));
+    let client_iface: Arc<RwLock<Ipv4Addr>> = Arc::new(RwLock::new(Ipv4Addr::LOCALHOST));
+
+    let client_deps = ClientDeps {
+        factory: client_factory,
+        spawner: TokioBackedSpawner,
+        timer: MockTimer,
+        e2e_registry: client_e2e,
+        interface: client_iface,
+    };
+
+    let (client, mut updates, run_fut) = Client::<
+        RawPayload,
+        Arc<Mutex<E2ERegistry>>,
+        Arc<RwLock<Ipv4Addr>>,
+        E2ETestChannels,
+    >::new_with_deps(client_deps, false);
+
+    let run_handle = tokio::spawn(run_fut);
+
+    // Bind client discovery socket
+    client.bind_discovery().await.expect("bind_discovery");
+
+    // Wait for server's SD announcement to propagate through the mock
+    // network and arrive at the client's update stream.
+    let timeout = tokio::time::timeout(Duration::from_secs(2), async {
+        while let Some(update) = updates.recv().await {
+            if let ClientUpdate::DiscoveryUpdated(_msg) = update {
+                // Got an SD message — the e2e path works!
+                return true;
+            }
+        }
+        false
+    })
+    .await;
+
+    assert!(
+        timeout.unwrap_or(false),
+        "client should have received server's SD announcement"
+    );
+
+    // Cleanup
+    announce_handle.abort();
+    run_handle.abort();
+}
+
+/// Proves that the client can send a SOME/IP request through the mock network
+/// using `add_endpoint` + `send_to_service`, and the server run-loop stays
+/// stable under load. Response delivery is not verified here because the
+/// server has no registered request handler; see the doc-level test list for
+/// items that remain.
+#[tokio::test]
+async fn client_send_request_server_runloop_stable() {
+    let network = SharedNetwork::new();
+
+    let server_factory = MockFactory {
+        tx_pipe: Arc::clone(&network.server_to_client),
+        rx_pipe: Arc::clone(&network.client_to_server),
+        next_port: Arc::new(Mutex::new(0)),
+    };
+
+    let client_factory = MockFactory {
+        tx_pipe: Arc::clone(&network.client_to_server),
+        rx_pipe: Arc::clone(&network.server_to_client),
+        next_port: Arc::new(Mutex::new(100)),
+    };
+
+    // Create server (passive — no SD announcements)
+    let server_e2e: Arc<Mutex<E2ERegistry>> = Arc::new(Mutex::new(E2ERegistry::new()));
+    let server_subs = MockSubscriptions::default();
+    let service_id = 0x5678_u16;
+    let instance_id = 1_u16;
+    let server_port = 30600_u16;
+    let server_config =
+        ServerConfig::new(Ipv4Addr::LOCALHOST, server_port, service_id, instance_id);
+
+    let server_deps = ServerDeps {
+        factory: server_factory,
+        timer: MockTimer,
+        e2e_registry: server_e2e,
+        subscriptions: server_subs,
+    };
+
+    let mut server: Server<Arc<Mutex<E2ERegistry>>, MockSubscriptions, MockFactory, MockTimer> =
+        Server::new_passive_with_deps(server_deps, server_config)
+            .await
+            .expect("passive server creation");
+
+    // Start server run loop
+    let run_handle = tokio::spawn(async move {
+        let _ = server.run().await;
+    });
+
+    // Create client
+    let client_e2e: Arc<Mutex<E2ERegistry>> = Arc::new(Mutex::new(E2ERegistry::new()));
+    let client_iface: Arc<RwLock<Ipv4Addr>> = Arc::new(RwLock::new(Ipv4Addr::LOCALHOST));
+
+    let client_deps = ClientDeps {
+        factory: client_factory,
+        spawner: TokioBackedSpawner,
+        timer: MockTimer,
+        e2e_registry: client_e2e,
+        interface: client_iface,
+    };
+
+    let (client, mut updates, client_run_fut) = Client::<
+        RawPayload,
+        Arc<Mutex<E2ERegistry>>,
+        Arc<RwLock<Ipv4Addr>>,
+        E2ETestChannels,
+    >::new_with_deps(client_deps, false);
+
+    let client_run_handle = tokio::spawn(client_run_fut);
+
+    // Register the server endpoint with the client
+    let server_addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, server_port);
+    client
+        .add_endpoint(service_id, instance_id, server_addr, 0)
+        .await
+        .expect("add_endpoint");
+
+    // Build a request message using the correct API
+    let msg_id = MessageId::new_from_service_and_method(service_id, 0x0001);
+    let payload_bytes = [0x01_u8, 0x02, 0x03, 0x04];
+    let payload = RawPayload::from_payload_bytes(msg_id, &payload_bytes).expect("create payload");
+    let request = Message::<RawPayload>::new(
+        Header::new(
+            msg_id,
+            0x0001_0001, // request_id: client_id << 16 | session_id
+            1,           // protocol_version
+            1,           // interface_version
+            MessageTypeField::new(MessageType::Request, false),
+            ReturnCode::Ok,
+            payload_bytes.len(),
+        ),
+        payload,
+    );
+
+    // Send request via the client API
+    let pending = client
+        .send_to_service(service_id, instance_id, request)
+        .await
+        .expect("send_to_service");
+
+    // Give the server time to process
+    tokio::time::sleep(Duration::from_millis(100)).await;
+
+    // Check for any updates — server won't respond without a handler,
+    // but this proves the send path compiles and runs.
+    let timeout_result = tokio::time::timeout(Duration::from_millis(500), async {
+        while let Some(update) = updates.recv().await {
+            match update {
+                ClientUpdate::Unicast { message, .. } => {
+                    return Some(message);
+                }
+                ClientUpdate::Error(e) => {
+                    eprintln!("Client error: {:?}", e);
+                }
+                _ => {}
+            }
+        }
+        None
+    })
+    .await;
+
+    // The test passes if:
+    // 1. add_endpoint succeeded
+    // 2. send_to_service succeeded (already asserted)
+    // 3. No panics in either run loop
+    // A response is not guaranteed without a server-side request handler.
+
+    match timeout_result {
+        Ok(Some(msg)) => {
+            println!(
+                "Received response: service=0x{:04X}, method=0x{:04X}",
+                msg.header().message_id().service_id(),
+                msg.header().message_id().method_id()
+            );
+        }
+        Ok(None) | Err(_) => {
+            println!("No response (expected — server has no request handler)");
+        }
+    }
+
+    // Verify the pending response handle is usable (won't resolve without
+    // a server reply, but the type should be correct)
+    drop(pending);
+
+    // Cleanup
+    run_handle.abort();
+    client_run_handle.abort();
+}
diff --git a/tests/bare_metal_example_builds.rs b/tests/bare_metal_example_builds.rs
new file mode 100644
index 0000000..7b404f6
--- /dev/null
+++ b/tests/bare_metal_example_builds.rs
@@ -0,0 +1,22 @@
+//! Integration test: documents the intent that the `bare_metal_client` and
+//! `bare_metal_server` example workspace members must compile cleanly.
+//! Guards against regressions in the `transport`/`tokio_transport`/`Timer`
+//! trait surface that would break bare-metal consumers.
+//!
+//! Compilation of those examples is already covered by workspace-wide Cargo
+//! commands such as `cargo build --workspace`, `cargo test --workspace`, or
+//! CI's `cargo clippy --workspace`, so this file does not spawn a nested
+//! `cargo build` — nested cargo invocations are redundant and flaky under
+//! lock contention. The test body below is a minimal sanity check that the
+//! test harness ran at all; the real coverage comes from those outer
+//! workspace-wide checks. Keep this file so the regression's intent stays
+//! documented.
+
+#[test]
+fn bare_metal_workspace_member_compiles() {
+    // Minimal canary: the test harness executed this test. Compilation of
+    // the `bare_metal` example itself is enforced by explicit
+    // workspace-wide checks (for example `cargo build --workspace`),
+    // not by spawning a nested `cargo build` here — so an empty body is
+    // sufficient.
+}
diff --git a/tests/bare_metal_server.rs b/tests/bare_metal_server.rs
new file mode 100644
index 0000000..986c202
--- /dev/null
+++ b/tests/bare_metal_server.rs
@@ -0,0 +1,336 @@
+//! Witness test: prove that `Server` can be constructed and
+//! driven without the `server-tokio` feature, using only the trait
+//! surface (`TransportFactory`, `Timer`, `E2ERegistryHandle`,
+//! `SubscriptionHandle`).
+//!
+//! `simple-someip` is compiled with `default-features = false,
+//! features = ["server", "bare_metal"]` per the `required-features`
+//! gate below — i.e. NO tokio, NO socket2 pulled in via the crate
+//! itself. The test still uses the host's tokio runtime as a generic
+//! executor (tokio is a `dev-dependency`), but every type fed to
+//! `simple-someip::Server::new_with_deps` comes from the no-tokio side:
+//! a hand-rolled mock `TransportFactory`, a hand-rolled `Timer`, a
+//! hand-rolled `SubscriptionHandle`, and the std-backed
+//! `Arc<Mutex<E2ERegistry>>` impl that ships under the bare `transport`
+//! module.
+//!
+//! This is the gate witness for the claim that `Server` is reachable
+//! on a no-tokio build. Compile-witness alone (Cargo `required-features`
+//! proving the test crate compiles without `server-tokio`) is the
+//! load-bearing assertion; the `tokio::spawn` at the end is a sanity
+//! check that the announcement-loop future is `Send + 'static` and
+//! the trait surface drives a working pipeline.
+#![cfg(all(feature = "server", feature = "bare_metal"))]
+
+use core::future::Future;
+use core::net::{Ipv4Addr, SocketAddrV4};
+use core::pin::Pin;
+use core::task::{Context, Poll};
+use core::time::Duration;
+use std::collections::VecDeque;
+use std::sync::{Arc, Mutex};
+use std::vec::Vec;
+
+use simple_someip::e2e::E2ERegistry;
+use simple_someip::server::ServerConfig;
+use simple_someip::server::{SubscribeError, Subscriber, SubscriptionHandle};
+use simple_someip::transport::{
+    ReceivedDatagram, SocketOptions, Timer, TransportError, TransportFactory, TransportSocket,
+};
+use simple_someip::{Server, ServerDeps};
+
+// ── Mock transport ─────────────────────────────────────────────────────
+
+#[derive(Default)]
+struct MockPipe {
+    sent: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound_waker: Mutex<Option<core::task::Waker>>,
+}
+
+#[derive(Clone)]
+struct MockFactory {
+    pipe: Arc<MockPipe>,
+    next_port: Arc<Mutex<u16>>,
+}
+
+impl TransportFactory for MockFactory {
+    type Socket = MockSocket;
+    type BindFuture<'a> =
+        core::pin::Pin<Box<dyn Future<Output = Result<Self::Socket, TransportError>> + Send + 'a>>;
+    fn bind<'a>(&'a self, addr: SocketAddrV4, _options: &'a SocketOptions) -> Self::BindFuture<'a> {
+        let pipe = Arc::clone(&self.pipe);
+        // Mock: assign port deterministically. If caller asked for 0,
+        // hand out an incrementing fake ephemeral port.
+        let port = if addr.port() == 0 {
+            let mut p = self.next_port.lock().unwrap();
+            let next = *p + 1;
+            *p = next;
+            40000 + next
+        } else {
+            addr.port()
+        };
+        let local = SocketAddrV4::new(*addr.ip(), port);
+        Box::pin(async move { Ok(MockSocket { pipe, local }) })
+    }
+}
+
+struct MockSocket {
+    pipe: Arc<MockPipe>,
+    local: SocketAddrV4,
+}
+
+struct MockSendFut {
+    pipe: Arc<MockPipe>,
+    bytes: Option<Vec<u8>>,
+    target: SocketAddrV4,
+}
+
+impl Future for MockSendFut {
+    type Output = Result<(), TransportError>;
+    fn poll(self: Pin<&mut Self>, _cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        if let Some(bytes) = me.bytes.take() {
+            me.pipe.sent.lock().unwrap().push_back((bytes, me.target));
+        }
+        Poll::Ready(Ok(()))
+    }
+}
+
+struct MockRecvFut<'a> {
+    pipe: Arc<MockPipe>,
+    buf: &'a mut [u8],
+}
+
+impl Future for MockRecvFut<'_> {
+    type Output = Result<ReceivedDatagram, TransportError>;
+    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        let entry = me.pipe.inbound.lock().unwrap().pop_front();
+        match entry {
+            Some((bytes, source)) => {
+                let n = bytes.len().min(me.buf.len());
+                me.buf[..n].copy_from_slice(&bytes[..n]);
+                Poll::Ready(Ok(ReceivedDatagram {
+                    bytes_received: n,
+                    source,
+                    truncated: n < bytes.len(),
+                }))
+            }
+            None => {
+                // Park on the pipe's waker. Real bare-metal impls park
+                // the task on an interrupt-driven waker;
+                // wake_by_ref-on-empty would CPU-peg the test runtime.
+                *me.pipe.inbound_waker.lock().unwrap() = Some(cx.waker().clone());
+                if let Some((bytes, source)) = me.pipe.inbound.lock().unwrap().pop_front() {
+                    let n = bytes.len().min(me.buf.len());
+                    me.buf[..n].copy_from_slice(&bytes[..n]);
+                    return Poll::Ready(Ok(ReceivedDatagram {
+                        bytes_received: n,
+                        source,
+                        truncated: n < bytes.len(),
+                    }));
+                }
+                Poll::Pending
+            }
+        }
+    }
+}
+
+impl TransportSocket for MockSocket {
+    type SendFuture<'a> = MockSendFut;
+    type RecvFuture<'a> = MockRecvFut<'a>;
+
+    fn send_to<'a>(&'a self, buf: &'a [u8], target: SocketAddrV4) -> Self::SendFuture<'a> {
+        MockSendFut {
+            pipe: Arc::clone(&self.pipe),
+            bytes: Some(buf.to_vec()),
+            target,
+        }
+    }
+
+    fn recv_from<'a>(&'a self, buf: &'a mut [u8]) -> Self::RecvFuture<'a> {
+        MockRecvFut {
+            pipe: Arc::clone(&self.pipe),
+            buf,
+        }
+    }
+
+    fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+        Ok(self.local)
+    }
+
+    fn join_multicast_v4(&self, _group: Ipv4Addr, _iface: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+
+    fn leave_multicast_v4(&self, _group: Ipv4Addr, _iface: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+}
+
+// ── Mock Timer ────────────────────────────────────────────────────────
+
+#[derive(Clone)]
+struct MockTimer;
+impl Timer for MockTimer {
+    type SleepFuture<'a> = core::pin::Pin<Box<dyn Future<Output = ()> + Send + 'a>>;
+    fn sleep(&self, duration: Duration) -> Self::SleepFuture<'_> {
+        // Honor `duration` per the `Timer` trait contract (MAY
+        // overshoot, MUST NOT undershoot). The test runtime is
+        // `#[tokio::test]`; this only demonstrates the no-tokio
+        // production path compiles. A real bare-metal impl would
+        // replace this with `embassy_time::Timer::after`.
+        Box::pin(async move {
+            tokio::time::sleep(duration).await;
+        })
+    }
+}
+
+// ── Mock SubscriptionHandle ───────────────────────────────────────────
+//
+// On `server-tokio`, `Arc<RwLock<SubscriptionManager>>` is a built-in
+// impl. Bare-metal callers supply their own. A real bare-metal impl
+// would back this with a `critical_section::Mutex<RefCell<...>>` or a
+// `spin::Mutex<...>` over a `heapless`-backed table; here we use
+// `std::sync::Mutex` over a tiny inline table because the test runtime
+// has `std`. The point is the *trait* impl, not the concurrency
+// primitive.
+
+type SubKey = (u16, u16, u16, SocketAddrV4);
+
+#[derive(Clone, Default)]
+#[allow(clippy::type_complexity)]
+struct MockSubscriptions(Arc<Mutex<Vec<SubKey>>>);
+
+impl SubscriptionHandle for MockSubscriptions {
+    fn subscribe(
+        &self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        subscriber_addr: SocketAddrV4,
+    ) -> impl Future<Output = Result<(), SubscribeError>> + '_ {
+        let this = self.0.clone();
+        async move {
+            let mut guard = this.lock().unwrap();
+            let key = (service_id, instance_id, event_group_id, subscriber_addr);
+            if !guard.contains(&key) {
+                guard.push(key);
+            }
+            Ok(())
+        }
+    }
+
+    fn unsubscribe(
+        &self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        subscriber_addr: SocketAddrV4,
+    ) -> impl Future<Output = ()> + '_ {
+        let this = self.0.clone();
+        async move {
+            let mut guard = this.lock().unwrap();
+            guard.retain(|e| *e != (service_id, instance_id, event_group_id, subscriber_addr));
+        }
+    }
+
+    fn for_each_subscriber<'a, F>(
+        &'a self,
+        service_id: u16,
+        instance_id: u16,
+        event_group_id: u16,
+        mut f: F,
+    ) -> impl Future<Output = usize> + 'a
+    where
+        F: FnMut(&Subscriber) + 'a,
+    {
+        let this = self.0.clone();
+        async move {
+            let guard = this.lock().unwrap();
+            let mut count = 0;
+            for (s, i, e, addr) in guard.iter() {
+                if *s == service_id && *i == instance_id && *e == event_group_id {
+                    let sub = Subscriber::new(*addr, *s, *i, *e);
+                    f(&sub);
+                    count += 1;
+                }
+            }
+            count
+        }
+    }
+}
+
+// ── Test ──────────────────────────────────────────────────────────────
+
+#[tokio::test]
+async fn server_constructible_without_server_tokio_feature() {
+    let pipe = Arc::new(MockPipe::default());
+    let factory = MockFactory {
+        pipe: Arc::clone(&pipe),
+        next_port: Arc::new(Mutex::new(0)),
+    };
+
+    let e2e_handle: Arc<Mutex<E2ERegistry>> = Arc::new(Mutex::new(E2ERegistry::new()));
+    let subs = MockSubscriptions::default();
+
+    let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 30490, 0x5B, 1);
+
+    let deps: ServerDeps<MockFactory, MockTimer, Arc<Mutex<E2ERegistry>>, MockSubscriptions> =
+        ServerDeps {
+            factory,
+            timer: MockTimer,
+            e2e_registry: e2e_handle,
+            subscriptions: subs,
+        };
+
+    let server: Server<Arc<Mutex<E2ERegistry>>, MockSubscriptions, MockFactory, MockTimer> =
+        Server::new_with_deps(deps, config, false)
+            .await
+            .expect("Server::new_with_deps must succeed with no-tokio mocks");
+
+    // Build the announcement-loop future and prove it's `Send + 'static`
+    // by spawning it on tokio. The witness is purely structural: if this
+    // line compiles, `Server` is reachable on a no-tokio build.
+    let announce_fut = server
+        .announcement_loop()
+        .expect("announcement_loop must build on a non-passive server");
+    let handle = tokio::spawn(announce_fut);
+
+    // Yield once so the spawned future has a chance to poll (its first
+    // tick fires `send_to` immediately, before the timer sleep).
+    tokio::task::yield_now().await;
+    tokio::task::yield_now().await;
+
+    // Tear down: abort the announce loop.
+    handle.abort();
+    let _ = handle.await;
+}
+
+#[tokio::test]
+async fn passive_server_constructible_without_server_tokio_feature() {
+    let pipe = Arc::new(MockPipe::default());
+    let factory = MockFactory {
+        pipe: Arc::clone(&pipe),
+        next_port: Arc::new(Mutex::new(0)),
+    };
+
+    let e2e_handle: Arc<Mutex<E2ERegistry>> = Arc::new(Mutex::new(E2ERegistry::new()));
+    let subs = MockSubscriptions::default();
+
+    let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 0, 0x5C, 2);
+
+    let deps: ServerDeps<MockFactory, MockTimer, Arc<Mutex<E2ERegistry>>, MockSubscriptions> =
+        ServerDeps {
+            factory,
+            timer: MockTimer,
+            e2e_registry: e2e_handle,
+            subscriptions: subs,
+        };
+
+    let _server: Server<Arc<Mutex<E2ERegistry>>, MockSubscriptions, MockFactory, MockTimer> =
+        Server::new_passive_with_deps(deps, config)
+            .await
+            .expect("Server::new_passive_with_deps must succeed with no-tokio mocks");
+}
diff --git a/tests/client_server.rs b/tests/client_server.rs
index ffd6d34..459f6bb 100644
--- a/tests/client_server.rs
+++ b/tests/client_server.rs
@@ -1,10 +1,48 @@
 //! Integration tests exercising the Client and Server together on localhost.
+//!
+//! # Parallel execution caveat
+//!
+//! These tests share `sd::MULTICAST_PORT` (30490) and bind it via
+//! `SO_REUSEPORT`. Linux's reuseport hashing then load-balances incoming
+//! Subscribe / SD multicast traffic across whichever sockets are
+//! currently bound, which means one test's Subscribe message can be
+//! delivered to a *different* test's server. Each test verifies its own
+//! `EventPublisher::has_subscribers` (per-server `SubscriptionManager`
+//! state, not a shared one), so the cross-routing produces flaky
+//! failures when the suite runs with cargo's default parallelism.
+//!
+//! Until we can give each test its own SD port (which would require
+//! widening the protocol layer's `MULTICAST_PORT` constant to a runtime
+//! config) or its own network namespace, **run this binary with
+//! `--test-threads=1`** to serialise the SD-port contention:
+//!
+//! ```text
+//! cargo test --test client_server -- --test-threads=1
+//! ```
+//!
+//! `cargo test --workspace` (parallel default) is expected to flake on
+//! ~half of the tests in this file. The unit-test suite under
+//! `cargo test --lib` does not have this issue and runs reliably in
+//! parallel. The fix is tracked alongside the bare-metal refactor
+//! (which will need to abstract the port anyway).
 
 use simple_someip::e2e::{E2ECheckStatus, E2EKey, E2EProfile, Profile4Config};
 use simple_someip::protocol::{Header, Message, MessageId, sd};
 use simple_someip::server::ServerConfig;
-use simple_someip::{Client, ClientUpdate, PayloadWireFormat, RawPayload, Server, VecSdHeader};
+use simple_someip::{
+    Client, ClientUpdate, PayloadWireFormat, RawPayload, Server, TokioChannels, VecSdHeader,
+};
 use std::net::{Ipv4Addr, SocketAddrV4};
+use std::sync::atomic::{AtomicU16, Ordering};
+
+/// Allocate a unique service ID per test invocation. Multiple
+/// integration tests in this file run in parallel (cargo's default) and
+/// would otherwise collide on the SD multicast group + a shared service
+/// ID, causing cross-test SubscribeAck bleed-through.
+fn next_service_id() -> u16 {
+    static NEXT: AtomicU16 = AtomicU16::new(0x5B);
+    NEXT.fetch_add(1, Ordering::Relaxed)
+}
 
 fn empty_sd_header() -> VecSdHeader {
     VecSdHeader {
@@ -14,12 +52,35 @@ fn empty_sd_header() -> VecSdHeader {
     }
 }
 
-type TestClient = Client<RawPayload>;
+type TestClient = Client<
+    RawPayload,
+    std::sync::Arc<std::sync::Mutex<simple_someip::e2e::E2ERegistry>>,
+    std::sync::Arc<std::sync::RwLock<Ipv4Addr>>,
+    TokioChannels,
+>;
+
+/// Type alias bringing the tokio-flavor concrete type parameters back into
+/// scope so callers can spell `TestServer::new(...)` without chasing the
+/// four-type-parameter signature on every call site.
+type TestServer = Server<
+    std::sync::Arc<std::sync::Mutex<simple_someip::e2e::E2ERegistry>>,
+    std::sync::Arc<tokio::sync::RwLock<simple_someip::server::SubscriptionManager>>,
+    simple_someip::TokioTransport,
+    simple_someip::TokioTimer,
+>;
+
+/// Type alias for the event publisher concrete type used by `TestServer`'s
+/// publisher. Same shape rationale as [`TestServer`].
+type TestEventPublisher = simple_someip::server::EventPublisher<
+    std::sync::Arc<std::sync::Mutex<simple_someip::e2e::E2ERegistry>>,
+    std::sync::Arc<tokio::sync::RwLock<simple_someip::server::SubscriptionManager>>,
+    simple_someip::TokioSocket,
+>;
 
 /// Create a server on an ephemeral unicast port, returning (Server, actual_port).
-async fn create_server(service_id: u16, instance_id: u16) -> (Server, u16) {
+async fn create_server(service_id: u16, instance_id: u16) -> (TestServer, u16) {
     let config = ServerConfig::new(Ipv4Addr::LOCALHOST, 0, service_id, instance_id);
-    let mut server: Server = Server::new(config).await.expect("Server::new failed");
+    let mut server: TestServer = TestServer::new(config).await.expect("Server::new failed");
     let port = match server.unicast_local_addr().expect("local_addr failed") {
         std::net::SocketAddr::V4(a) => a.port(),
         _ => panic!("expected IPv4"),
@@ -31,7 +92,7 @@ async fn create_server(service_id: u16, instance_id: u16) -> (Server, u16) {
 /// Poll `has_subscribers` with retries until the server has processed the
 /// subscription. Returns true if subscribers appeared within the deadline.
 async fn wait_for_subscribers(
-    publisher: &simple_someip::server::EventPublisher,
+    publisher: &TestEventPublisher,
     service_id: u16,
     instance_id: u16,
     event_group_id: u16,
@@ -51,18 +112,26 @@ async fn wait_for_subscribers(
 #[tokio::test]
 async fn test_client_server_subscribe_and_receive_event() {
     // Start server on ephemeral port
-    let (mut server, server_port) = create_server(0x5B, 1).await;
+    let service_id = next_service_id();
+    let (mut server, server_port) = create_server(service_id, 1).await;
     let publisher = server.publisher();
     let server_handle = tokio::spawn(async move { server.run().await });
 
     // Create client and subscribe to the server's event group
-    let (client, mut updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let (client, mut updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let _run_handle = tokio::spawn(run_fut);
     let server_addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, server_port);
-    client.add_endpoint(0x5B, 1, server_addr, 0).await.unwrap();
-    client.subscribe(0x5B, 1, 1, 3, 0x01, 0).await.unwrap();
+    client
+        .add_endpoint(service_id, 1, server_addr, 0)
+        .await
+        .unwrap();
+    client
+        .subscribe(service_id, 1, 1, 3, 0x01, 0)
+        .await
+        .unwrap();
 
     assert!(
-        wait_for_subscribers(&publisher, 0x5B, 1, 0x01).await,
+        wait_for_subscribers(&publisher, service_id, 1, 0x01).await,
         "server should have registered the subscriber"
     );
 
@@ -72,7 +141,7 @@ async fn test_client_server_subscribe_and_receive_event() {
     // Publish an event from the server to the client's unicast port
     let event_msg = Message::<RawPayload>::new_sd(0x0001, &empty_sd_header());
     let sent = publisher
-        .publish_event(0x5B, 1, 0x01, &event_msg)
+        .publish_event(service_id, 1, 0x01, &event_msg)
         .await
         .expect("publish_event failed");
     assert_eq!(sent, 1);
@@ -95,17 +164,19 @@ async fn test_client_server_subscribe_and_receive_event() {
 #[tokio::test]
 async fn test_client_send_sd_auto_binds_discovery() {
     // Create server so there is something to send to
-    let (mut server, server_port) = create_server(0x5B, 1).await;
+    let service_id = next_service_id();
+    let (mut server, server_port) = create_server(service_id, 1).await;
     let server_handle = tokio::spawn(async move { server.run().await });
 
     // Create client — NO bind_discovery
-    let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let _run_handle = tokio::spawn(run_fut);
 
     // send_sd_message should auto-bind discovery and succeed
     let sd_header = VecSdHeader {
         flags: sd::Flags::new_sd(sd::RebootFlag::RecentlyRebooted),
         entries: vec![sd::Entry::SubscribeEventGroup(sd::EventGroupEntry::new(
-            0x5B, 1, 1, 3, 0x01,
+            service_id, 1, 1, 3, 0x01,
         ))],
         options: vec![sd::Options::IpV4Endpoint {
             ip: Ipv4Addr::LOCALHOST,
@@ -127,16 +198,24 @@ async fn test_client_send_sd_auto_binds_discovery() {
 /// while an SD message round-trip is in flight.
 #[tokio::test]
 async fn test_client_bind_unbind_lifecycle_with_server() {
-    let (mut server, server_port) = create_server(0x5B, 1).await;
+    let service_id = next_service_id();
+    let (mut server, server_port) = create_server(service_id, 1).await;
     let server_handle = tokio::spawn(async move { server.run().await });
 
-    let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let _run_handle = tokio::spawn(run_fut);
 
     // Bind discovery, subscribe, then unbind and rebind
     client.bind_discovery().await.unwrap();
     let server_addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, server_port);
-    client.add_endpoint(0x5B, 1, server_addr, 0).await.unwrap();
-    client.subscribe(0x5B, 1, 1, 3, 0x01, 0).await.unwrap();
+    client
+        .add_endpoint(service_id, 1, server_addr, 0)
+        .await
+        .unwrap();
+    client
+        .subscribe(service_id, 1, 1, 3, 0x01, 0)
+        .await
+        .unwrap();
 
     // Unbind and rebind discovery — covers unbind_discovery + re-bind path
     client.unbind_discovery().await.unwrap();
@@ -154,23 +233,31 @@ async fn test_client_bind_unbind_lifecycle_with_server() {
 /// registry, auto-binds unicast, sends the request, and receives a response.
 #[tokio::test]
 async fn test_add_endpoint_and_send_to_service() {
-    let (mut server, server_port) = create_server(0x5B, 1).await;
+    let service_id = next_service_id();
+    let (mut server, server_port) = create_server(service_id, 1).await;
     let publisher = server.publisher();
     let server_handle = tokio::spawn(async move { server.run().await });
 
-    let (client, mut updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let (client, mut updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let _run_handle = tokio::spawn(run_fut);
     client.bind_discovery().await.unwrap();
 
     // Register the server's endpoint manually (simulating non-broadcasting service)
     let server_addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, server_port);
-    client.add_endpoint(0x5B, 1, server_addr, 0).await.unwrap();
+    client
+        .add_endpoint(service_id, 1, server_addr, 0)
+        .await
+        .unwrap();
 
     // Subscribe to server's event group (auto-binds unicast internally)
-    client.subscribe(0x5B, 1, 1, 3, 0x01, 0).await.unwrap();
+    client
+        .subscribe(service_id, 1, 1, 3, 0x01, 0)
+        .await
+        .unwrap();
 
     // Wait for the server to process the subscription
     assert!(
-        wait_for_subscribers(&publisher, 0x5B, 1, 0x01).await,
+        wait_for_subscribers(&publisher, service_id, 1, 0x01).await,
         "server should have registered the subscriber"
     );
 
@@ -180,7 +267,7 @@ async fn test_add_endpoint_and_send_to_service() {
     // Publish an event from the server
     let event_msg = Message::<RawPayload>::new_sd(0x0001, &empty_sd_header());
     let sent = publisher
-        .publish_event(0x5B, 1, 0x01, &event_msg)
+        .publish_event(service_id, 1, 0x01, &event_msg)
         .await
         .expect("publish_event failed");
     assert_eq!(sent, 1);
@@ -195,15 +282,15 @@ async fn test_add_endpoint_and_send_to_service() {
     );
 
     // Remove the endpoint and verify send_to_service returns ServiceNotFound
-    client.remove_endpoint(0x5B, 1).await.unwrap();
+    client.remove_endpoint(service_id, 1).await.unwrap();
     let msg = Message::<RawPayload>::new_sd(0x0001, &empty_sd_header());
-    let result = client.send_to_service(0x5B, 1, msg).await;
+    let result = client.send_to_service(service_id, 1, msg).await;
     assert!(
         matches!(result, Err(simple_someip::client::Error::ServiceNotFound)),
         "expected ServiceNotFound after remove, got {result:?}"
     );
     // Verify that PendingResponse is importable from the crate root
-    let _: fn() -> Option<simple_someip::PendingResponse<RawPayload>> = || None;
+    let _: fn() -> Option<simple_someip::PendingResponse<RawPayload, TokioChannels>> = || None;
 
     client.shut_down();
     server_handle.abort();
@@ -213,19 +300,27 @@ async fn test_add_endpoint_and_send_to_service() {
 /// Exercises the Subscribe auto-bind discovery path in inner.rs.
 #[tokio::test]
 async fn test_subscribe_auto_binds_discovery() {
-    let (mut server, server_port) = create_server(0x5B, 1).await;
+    let service_id = next_service_id();
+    let (mut server, server_port) = create_server(service_id, 1).await;
     let publisher = server.publisher();
     let server_handle = tokio::spawn(async move { server.run().await });
 
     // Create client — do NOT bind discovery manually
-    let (client, mut updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let (client, mut updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let _run_handle = tokio::spawn(run_fut);
     let server_addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, server_port);
-    client.add_endpoint(0x5B, 1, server_addr, 0).await.unwrap();
+    client
+        .add_endpoint(service_id, 1, server_addr, 0)
+        .await
+        .unwrap();
     // Subscribe should auto-bind discovery internally
-    client.subscribe(0x5B, 1, 1, 3, 0x01, 0).await.unwrap();
+    client
+        .subscribe(service_id, 1, 1, 3, 0x01, 0)
+        .await
+        .unwrap();
 
     assert!(
-        wait_for_subscribers(&publisher, 0x5B, 1, 0x01).await,
+        wait_for_subscribers(&publisher, service_id, 1, 0x01).await,
         "server should have registered the subscriber"
     );
 
@@ -235,7 +330,7 @@ async fn test_subscribe_auto_binds_discovery() {
     // Publish an event and verify the client can receive it
     let event_msg = Message::<RawPayload>::new_sd(0x0001, &empty_sd_header());
     let sent = publisher
-        .publish_event(0x5B, 1, 0x01, &event_msg)
+        .publish_event(service_id, 1, 0x01, &event_msg)
         .await
         .expect("publish_event failed");
     assert_eq!(sent, 1);
@@ -256,17 +351,25 @@ async fn test_subscribe_auto_binds_discovery() {
 /// Exercises the pending_responses HashMap matching path in inner.rs.
 #[tokio::test]
 async fn test_client_request_resolves_via_unicast_reply() {
-    let (mut server, server_port) = create_server(0x5B, 1).await;
+    let service_id = next_service_id();
+    let (mut server, server_port) = create_server(service_id, 1).await;
     let publisher = server.publisher();
     let server_handle = tokio::spawn(async move { server.run().await });
 
-    let (client, mut updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let (client, mut updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let _run_handle = tokio::spawn(run_fut);
     let server_addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, server_port);
-    client.add_endpoint(0x5B, 1, server_addr, 0).await.unwrap();
-    client.subscribe(0x5B, 1, 1, 3, 0x01, 0).await.unwrap();
+    client
+        .add_endpoint(service_id, 1, server_addr, 0)
+        .await
+        .unwrap();
+    client
+        .subscribe(service_id, 1, 1, 3, 0x01, 0)
+        .await
+        .unwrap();
 
     assert!(
-        wait_for_subscribers(&publisher, 0x5B, 1, 0x01).await,
+        wait_for_subscribers(&publisher, service_id, 1, 0x01).await,
         "server should have registered the subscriber"
     );
 
@@ -277,14 +380,14 @@ async fn test_client_request_resolves_via_unicast_reply() {
     // which has a matching request_id, resolving it.
     let msg = Message::<RawPayload>::new_sd(0x0001, &empty_sd_header());
     let pending = client
-        .send_to_service(0x5B, 1, msg)
+        .send_to_service(service_id, 1, msg)
         .await
         .expect("send_to_service failed");
 
     // Publish an event that the client unicast socket will receive
     let event_msg = Message::<RawPayload>::new_sd(0x0001, &empty_sd_header());
     publisher
-        .publish_event(0x5B, 1, 0x01, &event_msg)
+        .publish_event(service_id, 1, 0x01, &event_msg)
         .await
         .expect("publish_event failed");
 
@@ -308,12 +411,13 @@ async fn test_client_request_resolves_via_unicast_reply() {
 /// Exercises E2E protect in event_publisher.rs and E2E check in socket_manager.rs.
 #[tokio::test]
 async fn test_e2e_protect_on_publish_and_check_on_receive() {
-    let (mut server, server_port) = create_server(0x5B, 1).await;
+    let service_id = next_service_id();
+    let (mut server, server_port) = create_server(service_id, 1).await;
     let publisher = server.publisher();
 
     // Register E2E profile on server for the event message ID
     let key = E2EKey {
-        service_id: 0x5B,
+        service_id,
         method_or_event_id: 0x0001,
     };
     let profile = E2EProfile::Profile4(Profile4Config::new(0x12345678, 15));
@@ -321,17 +425,24 @@ async fn test_e2e_protect_on_publish_and_check_on_receive() {
 
     let server_handle = tokio::spawn(async move { server.run().await });
 
-    let (client, mut updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let (client, mut updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let _run_handle = tokio::spawn(run_fut);
 
     // Register matching E2E profile on client
     client.register_e2e(key, profile);
 
     let server_addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, server_port);
-    client.add_endpoint(0x5B, 1, server_addr, 0).await.unwrap();
-    client.subscribe(0x5B, 1, 1, 3, 0x01, 0).await.unwrap();
+    client
+        .add_endpoint(service_id, 1, server_addr, 0)
+        .await
+        .unwrap();
+    client
+        .subscribe(service_id, 1, 1, 3, 0x01, 0)
+        .await
+        .unwrap();
 
     assert!(
-        wait_for_subscribers(&publisher, 0x5B, 1, 0x01).await,
+        wait_for_subscribers(&publisher, service_id, 1, 0x01).await,
         "server should have registered the subscriber"
     );
 
@@ -339,14 +450,14 @@ async fn test_e2e_protect_on_publish_and_check_on_receive() {
     let _ = tokio::time::timeout(std::time::Duration::from_millis(250), updates.recv()).await;
 
     // Publish an event — server will E2E-protect it
-    // Construct a non-SD message with service_id=0x5B, method/event_id=0x0001
+    // Construct a non-SD message with service_id=service_id, method/event_id=0x0001
     let payload_bytes = [0xAA, 0xBB];
-    let msg_id = MessageId::new_from_service_and_method(0x5B, 0x0001);
+    let msg_id = MessageId::new_from_service_and_method(service_id, 0x0001);
     let raw_payload = RawPayload::from_payload_bytes(msg_id, &payload_bytes).unwrap();
-    let header = Header::new_event(0x5B, 0x0001, 0, 0x01, 0x01, payload_bytes.len());
+    let header = Header::new_event(service_id, 0x0001, 0, 0x01, 0x01, payload_bytes.len());
     let event_msg = Message::new(header, raw_payload);
     let sent = publisher
-        .publish_event(0x5B, 1, 0x01, &event_msg)
+        .publish_event(service_id, 1, 0x01, &event_msg)
         .await
         .expect("publish_event failed");
     assert_eq!(sent, 1);
@@ -378,31 +489,46 @@ async fn test_e2e_protect_on_publish_and_check_on_receive() {
 /// Exercises multi-subscriber path in event_publisher.rs.
 #[tokio::test]
 async fn test_multiple_subscribers_receive_events() {
-    let (mut server, server_port) = create_server(0x5B, 1).await;
+    let service_id = next_service_id();
+    let (mut server, server_port) = create_server(service_id, 1).await;
     let publisher = server.publisher();
     let server_handle = tokio::spawn(async move { server.run().await });
 
     let server_addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, server_port);
 
     // Client 1
-    let (client1, mut updates1) = TestClient::new(Ipv4Addr::LOCALHOST);
-    client1.add_endpoint(0x5B, 1, server_addr, 0).await.unwrap();
-    client1.subscribe(0x5B, 1, 1, 3, 0x01, 0).await.unwrap();
+    let (client1, mut updates1, run_fut1) = TestClient::new(Ipv4Addr::LOCALHOST);
+    tokio::spawn(run_fut1);
+    client1
+        .add_endpoint(service_id, 1, server_addr, 0)
+        .await
+        .unwrap();
+    client1
+        .subscribe(service_id, 1, 1, 3, 0x01, 0)
+        .await
+        .unwrap();
 
     // Client 2
-    let (client2, mut updates2) = TestClient::new(Ipv4Addr::LOCALHOST);
-    client2.add_endpoint(0x5B, 1, server_addr, 0).await.unwrap();
-    client2.subscribe(0x5B, 1, 1, 3, 0x01, 0).await.unwrap();
+    let (client2, mut updates2, run_fut2) = TestClient::new(Ipv4Addr::LOCALHOST);
+    tokio::spawn(run_fut2);
+    client2
+        .add_endpoint(service_id, 1, server_addr, 0)
+        .await
+        .unwrap();
+    client2
+        .subscribe(service_id, 1, 1, 3, 0x01, 0)
+        .await
+        .unwrap();
 
     // Wait for both subscribers
     for _ in 0..40 {
-        if publisher.subscriber_count(0x5B, 1, 0x01).await >= 2 {
+        if publisher.subscriber_count(service_id, 1, 0x01).await >= 2 {
             break;
         }
         tokio::time::sleep(std::time::Duration::from_millis(50)).await;
     }
     assert!(
-        publisher.subscriber_count(0x5B, 1, 0x01).await >= 2,
+        publisher.subscriber_count(service_id, 1, 0x01).await >= 2,
         "expected at least 2 subscribers"
     );
 
@@ -413,7 +539,7 @@ async fn test_multiple_subscribers_receive_events() {
     // Publish event
     let event_msg = Message::<RawPayload>::new_sd(0x0001, &empty_sd_header());
     let sent = publisher
-        .publish_event(0x5B, 1, 0x01, &event_msg)
+        .publish_event(service_id, 1, 0x01, &event_msg)
         .await
         .expect("publish_event failed");
     assert!(sent >= 2, "expected sent >= 2, got {sent}");
@@ -443,7 +569,8 @@ async fn test_multiple_subscribers_receive_events() {
 /// Verify ClientUpdates returns None after client shutdown.
 #[tokio::test]
 async fn test_updates_drain_after_shutdown() {
-    let (client, mut updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let (client, mut updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let _run_handle = tokio::spawn(run_fut);
     client.shut_down();
 
     let result = tokio::time::timeout(std::time::Duration::from_secs(2), updates.recv())
@@ -455,16 +582,24 @@ async fn test_updates_drain_after_shutdown() {
 /// Verify that cloned client handles work independently.
 #[tokio::test]
 async fn test_cloned_client_works() {
-    let (mut server, server_port) = create_server(0x5B, 1).await;
+    let service_id = next_service_id();
+    let (mut server, server_port) = create_server(service_id, 1).await;
     let server_handle = tokio::spawn(async move { server.run().await });
 
-    let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let _run_handle = tokio::spawn(run_fut);
     let client2 = client.clone();
 
     // Both clones can send commands
     let server_addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, server_port);
-    client.add_endpoint(0x5B, 1, server_addr, 0).await.unwrap();
-    client2.subscribe(0x5B, 1, 1, 3, 0x01, 0).await.unwrap();
+    client
+        .add_endpoint(service_id, 1, server_addr, 0)
+        .await
+        .unwrap();
+    client2
+        .subscribe(service_id, 1, 1, 3, 0x01, 0)
+        .await
+        .unwrap();
 
     client.shut_down();
     // client2 is also dropped
@@ -475,22 +610,27 @@ async fn test_cloned_client_works() {
 /// Exercises the port-reuse path in Subscribe handling.
 #[tokio::test]
 async fn test_subscribe_specific_port_reuse() {
-    let (mut server, server_port) = create_server(0x5B, 1).await;
+    let service_id = next_service_id();
+    let (mut server, server_port) = create_server(service_id, 1).await;
     let server_handle = tokio::spawn(async move { server.run().await });
 
-    let (client, _updates) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let (client, _updates, run_fut) = TestClient::new(Ipv4Addr::LOCALHOST);
+    let _run_handle = tokio::spawn(run_fut);
     let server_addr = SocketAddrV4::new(Ipv4Addr::LOCALHOST, server_port);
-    client.add_endpoint(0x5B, 1, server_addr, 0).await.unwrap();
+    client
+        .add_endpoint(service_id, 1, server_addr, 0)
+        .await
+        .unwrap();
 
     // Use specific port
     let specific_port = 44444;
     client
-        .subscribe(0x5B, 1, 1, 3, 0x01, specific_port)
+        .subscribe(service_id, 1, 1, 3, 0x01, specific_port)
         .await
         .unwrap();
     // Second subscribe reuses the port
     client
-        .subscribe(0x5B, 1, 1, 3, 0x02, specific_port)
+        .subscribe(service_id, 1, 1, 3, 0x02, specific_port)
         .await
         .unwrap();
 
diff --git a/tests/no_alloc_witness.rs b/tests/no_alloc_witness.rs
new file mode 100644
index 0000000..db4c1f2
--- /dev/null
+++ b/tests/no_alloc_witness.rs
@@ -0,0 +1,347 @@
+//! No-alloc CI gate: prove that the bare-metal handle types and
+//! static-pool channels do not invoke the global allocator on the hot path.
+//!
+//! # Why `harness = false`
+//!
+//! `libtest` allocates during process startup — thread-local storage, a
+//! worker thread pool for parallel test execution, and per-test bookkeeping
+//! (the harness wraps each test in heap-allocated state). With a
+//! panic-on-alloc `#[global_allocator]` that would fire before any of our
+//! code runs. `harness = false` removes the harness: this file defines its
+//! own `main()` that runs the witness functions directly on the main thread
+//! and aborts the process on any unexpected allocation.
+//!
+//! # Strategy
+//!
+//! A [`PanicAllocator`] replaces the global allocator. It is disarmed by
+//! default; [`assert_no_alloc`] arms it around a closure, causing any
+//! allocation inside the closure to call `process::abort()` — turning a
+//! latent regression into a hard CI failure. Because `main()` is single-threaded and all witnessed
+//! operations are synchronous (no yield points), no background allocations
+//! can fire while the allocator is armed.
+//!
+//! # What is witnessed
+//!
+//! 1. [`AtomicInterfaceHandle`] `get` / `set` are provably alloc-free (thin
+//!    pointer to a `static AtomicU32`).
+//! 2. [`StaticE2EHandle`] `contains_key` / `protect` / `check` do not
+//!    allocate after the registry is configured. Registration itself may
+//!    allocate (the backing [`E2ERegistry`] uses a `HashMap`); that is
+//!    acceptable as a construction-time cost.
+//! 3. [`define_static_channels!`] oneshot first-claim, warm-claim, and
+//!    receiver-poll paths are alloc-free. First-claim is exercised on a
+//!    pool that has never been touched before (the `u64` variant), which
+//!    is the case that runs once at boot on a real bare-metal target.
+//!    `recv()` is polled with [`Waker::noop`] so we measure the channel
+//!    path without an executor.
+//! 4. Both Profile4 and Profile5 protect/check round-trips through
+//!    [`StaticE2EHandle`] are alloc-free.
+//!
+//! # What this does not witness
+//!
+//! A fully no-alloc `Client` or `Server` run loop additionally requires a
+//! no-alloc `Spawner`, no-alloc transport, and a no-tokio executor. That
+//! end-to-end harness requires further work. The counting allocator in
+//! `tests/static_channels_alloc_witness.rs` covers the channel-storage hot
+//! path in a tokio-hosted context; this file extends it to the handle layer
+//! with a stricter panic harness.
+
+use core::cell::RefCell;
+use core::future::Future;
+use core::net::Ipv4Addr;
+use core::pin::Pin;
+use core::sync::atomic::{AtomicBool, AtomicU32, Ordering};
+use core::task::{Context, Waker};
+use std::alloc::{GlobalAlloc, Layout, System};
+use std::process;
+
+use embassy_sync::blocking_mutex::Mutex as BlockingMutex;
+use embassy_sync::blocking_mutex::raw::CriticalSectionRawMutex;
+
+use simple_someip::e2e::{E2EKey, E2EProfile, E2ERegistry, Profile4Config, Profile5Config};
+use simple_someip::transport::{AtomicInterfaceHandle, OneshotRecv, OneshotSend, StaticE2EHandle};
+use simple_someip::{
+    ChannelFactory, E2ERegistryHandle, InterfaceHandle, StaticE2EStorage, define_static_channels,
+};
+
+// ── Panic allocator ───────────────────────────────────────────────────────
+
+static ARMED: AtomicBool = AtomicBool::new(false);
+
+struct PanicAllocator;
+
+/// Disarm the allocator, print a diagnostic, then abort.
+///
+/// We disarm first so the formatter is allowed to allocate while building
+/// the diagnostic — otherwise the diagnostic would re-trigger the allocator
+/// trap and we'd lose the message. Aborting (rather than panicking) keeps
+/// us off the panic-unwind path, whose machinery also allocates.
+fn diagnose_and_abort(kind: &str, size: usize, align_or_new: usize) -> ! {
+    ARMED.store(false, Ordering::SeqCst);
+    eprintln!("no_alloc_witness: forbidden allocation ({kind}): {size} bytes / {align_or_new}");
+    process::abort();
+}
+
+unsafe impl GlobalAlloc for PanicAllocator {
+    unsafe fn alloc(&self, layout: Layout) -> *mut u8 {
+        if ARMED.load(Ordering::Acquire) {
+            diagnose_and_abort("alloc", layout.size(), layout.align());
+        }
+        // SAFETY: forwarding to System with caller's layout contract.
+        unsafe { System.alloc(layout) }
+    }
+
+    unsafe fn dealloc(&self, ptr: *mut u8, layout: Layout) {
+        // SAFETY: forwarding to System; ptr/layout from System::alloc.
+        unsafe { System.dealloc(ptr, layout) }
+    }
+
+    unsafe fn alloc_zeroed(&self, layout: Layout) -> *mut u8 {
+        if ARMED.load(Ordering::Acquire) {
+            diagnose_and_abort("alloc_zeroed", layout.size(), layout.align());
+        }
+        // SAFETY: forwarding to System.
+        unsafe { System.alloc_zeroed(layout) }
+    }
+
+    unsafe fn realloc(&self, ptr: *mut u8, layout: Layout, new_size: usize) -> *mut u8 {
+        if ARMED.load(Ordering::Acquire) {
+            diagnose_and_abort("realloc", layout.size(), new_size);
+        }
+        // SAFETY: forwarding to System; invariants upheld by caller.
+        unsafe { System.realloc(ptr, layout, new_size) }
+    }
+}
+
+#[global_allocator]
+static GLOBAL: PanicAllocator = PanicAllocator;
+
+/// Arm the panic allocator for the duration of `f`, then disarm.
+///
+/// Any heap allocation inside `f` triggers `diagnose_and_abort`, which
+/// disarms the allocator (so the diagnostic itself can format), prints
+/// the offending kind/size/align to stderr, and then calls
+/// [`std::process::abort`]. The process exits with a non-zero status
+/// without unwinding — CI failure. (Aborting rather than panicking
+/// keeps us off the panic-unwind path, whose machinery would itself
+/// allocate and re-trip the trap.)
+fn assert_no_alloc<T>(label: &str, f: impl FnOnce() -> T) -> T {
+    ARMED.store(true, Ordering::SeqCst);
+    let result = f();
+    ARMED.store(false, Ordering::SeqCst);
+    println!("  [pass] {label}");
+    result
+}
+
+// ── Static channels ───────────────────────────────────────────────────────
+
+define_static_channels! {
+    name: WitnessChannels,
+    oneshot: [
+        (u32, 8),
+        // A separate type used exclusively by the first-claim witness so
+        // its pool has never been touched before we arm the allocator.
+        (u64, 4),
+    ],
+    bounded: [
+        ((u32, 4), 2),
+    ],
+    unbounded: [
+        (u32, 2),
+    ],
+}
+
+// ── Backing statics ───────────────────────────────────────────────────────
+
+static IFACE_ADDR: AtomicU32 = AtomicU32::new(0);
+
+// ── Witness functions ─────────────────────────────────────────────────────
+
+fn witness_atomic_interface_handle() {
+    let handle = AtomicInterfaceHandle::new(&IFACE_ADDR);
+    // Initialize outside the armed window.
+    handle.set(Ipv4Addr::LOCALHOST);
+
+    assert_no_alloc("AtomicInterfaceHandle::set / ::get", || {
+        handle.set(Ipv4Addr::new(192, 168, 1, 1));
+        assert_eq!(handle.get(), Ipv4Addr::new(192, 168, 1, 1));
+        handle.set(Ipv4Addr::LOCALHOST);
+        assert_eq!(handle.get(), Ipv4Addr::LOCALHOST);
+    });
+}
+
+fn witness_static_e2e_handle_reads() {
+    // Box::leak allocates — that is an accepted construction-time cost.
+    let storage: &'static StaticE2EStorage =
+        Box::leak(Box::new(BlockingMutex::<
+            CriticalSectionRawMutex,
+            RefCell<E2ERegistry>,
+        >::new(RefCell::new(E2ERegistry::new()))));
+    let handle = StaticE2EHandle::new(storage);
+
+    // register() allocates into the HashMap — also construction-time.
+    handle.register(
+        E2EKey::new(0x1234, 0x0001),
+        E2EProfile::Profile4(Profile4Config::new(0xDEAD_BEEF, 15)),
+    );
+
+    // Hot-path reads must be alloc-free.
+    assert_no_alloc("StaticE2EHandle::contains_key (hit)", || {
+        assert!(handle.contains_key(&E2EKey::new(0x1234, 0x0001)));
+    });
+
+    assert_no_alloc("StaticE2EHandle::contains_key (miss)", || {
+        assert!(!handle.contains_key(&E2EKey::new(0xFFFF, 0x0000)));
+    });
+
+    assert_no_alloc("StaticE2EHandle::check (absent key → None)", || {
+        assert!(
+            handle
+                .check(E2EKey::new(0xFFFF, 0x0000), b"payload", [0u8; 8])
+                .is_none()
+        );
+    });
+}
+
+fn witness_static_e2e_handle_protect_check() {
+    let storage: &'static StaticE2EStorage =
+        Box::leak(Box::new(BlockingMutex::<
+            CriticalSectionRawMutex,
+            RefCell<E2ERegistry>,
+        >::new(RefCell::new(E2ERegistry::new()))));
+    let handle = StaticE2EHandle::new(storage);
+
+    handle.register(
+        E2EKey::new(0x0001, 0x8001),
+        E2EProfile::Profile4(Profile4Config::new(0x1234_5678, 15)),
+    );
+    // Register a second profile (Profile5) so the protect/check witness
+    // covers both profile families' hot paths, not just Profile4.
+    handle.register(
+        E2EKey::new(0x0002, 0x8002),
+        // data_length must equal payload length (5 = b"hello".len())
+        // — a mismatch routes through `tracing::warn!`, which is fine in
+        // production but adds noise to a no-alloc witness.
+        E2EProfile::Profile5(Profile5Config::new(0xABCD, 5, 15)),
+    );
+
+    let key = E2EKey::new(0x0001, 0x8001);
+    let payload = b"hello";
+    let mut protected = [0u8; 64];
+
+    assert_no_alloc(
+        "StaticE2EHandle::protect + check round-trip (Profile4)",
+        || {
+            let len = handle
+                .protect(key, payload, [0u8; 8], &mut protected)
+                .expect("profile registered")
+                .expect("protect succeeded");
+            let (status, stripped) = handle
+                .check(key, &protected[..len], [0u8; 8])
+                .expect("profile registered");
+            assert_eq!(status, simple_someip::E2ECheckStatus::Ok);
+            assert_eq!(stripped, payload);
+        },
+    );
+
+    let key5 = E2EKey::new(0x0002, 0x8002);
+    let mut protected5 = [0u8; 64];
+    assert_no_alloc(
+        "StaticE2EHandle::protect + check round-trip (Profile5)",
+        || {
+            let len = handle
+                .protect(key5, payload, [0u8; 8], &mut protected5)
+                .expect("profile registered")
+                .expect("protect succeeded");
+            let (status, stripped) = handle
+                .check(key5, &protected5[..len], [0u8; 8])
+                .expect("profile registered");
+            assert_eq!(status, simple_someip::E2ECheckStatus::Ok);
+            assert_eq!(stripped, payload);
+        },
+    );
+}
+
+fn witness_static_channels_oneshot() {
+    // Warm the pool: first claim/release seeds the free-list.
+    {
+        let (tx, _rx) = WitnessChannels::oneshot::<u32>();
+        tx.send(42u32).ok();
+    }
+
+    // Second claim must not allocate.
+    assert_no_alloc("WitnessChannels::oneshot warm claim + send", || {
+        let (tx, _rx) = WitnessChannels::oneshot::<u32>();
+        tx.send(99u32).ok();
+    });
+}
+
+/// First-claim witness: a freshly declared static pool (the `u64` variant
+/// in [`WitnessChannels`], untouched until this point) must seed its
+/// free-list and hand out the first slot without allocating. This is the
+/// case that runs once at boot on a real bare-metal target.
+fn witness_static_channels_first_claim() {
+    assert_no_alloc("WitnessChannels::oneshot::<u64> FIRST claim + send", || {
+        let (tx, _rx) = WitnessChannels::oneshot::<u64>();
+        tx.send(7u64).ok();
+    });
+}
+
+/// Receiver hot-path witness: polling the recv future once on a slot that
+/// already has a value must not allocate. Uses [`Waker::noop`] so we don't
+/// drag in an executor.
+fn witness_static_channels_oneshot_recv() {
+    // Warm the pool first so this witness measures only the recv path.
+    {
+        let (tx, _rx) = WitnessChannels::oneshot::<u32>();
+        tx.send(1u32).ok();
+    }
+
+    assert_no_alloc(
+        "WitnessChannels::oneshot recv (value already pending)",
+        || {
+            let (tx, rx) = WitnessChannels::oneshot::<u32>();
+            tx.send(123u32).ok();
+            let mut fut = rx.recv();
+            // SAFETY: `fut` is stack-pinned and dropped before this scope ends;
+            // no reference escapes.
+            let pinned = unsafe { Pin::new_unchecked(&mut fut) };
+            let waker = Waker::noop();
+            let mut cx = Context::from_waker(waker);
+            match pinned.poll(&mut cx) {
+                core::task::Poll::Ready(Ok(v)) => assert_eq!(v, 123),
+                other => panic!("expected Ready(Ok(123)), got {other:?}"),
+            }
+        },
+    );
+}
+
+// ── Entry point ───────────────────────────────────────────────────────────
+
+fn main() {
+    // cargo-nextest runs `--list --format terse` for test discovery. A
+    // `harness = false` binary must print each test name followed by
+    // `: test` or `: benchmark`. We expose a single pseudo-test named
+    // `no_alloc_witness` so nextest can schedule us.
+    let args: Vec<String> = std::env::args().collect();
+    if args.iter().any(|a| a == "--list") {
+        // nextest calls --list twice: once for normal tests and once with
+        // --ignored. Print nothing for the --ignored pass so nextest does
+        // not classify this test as ignored and skip it by default.
+        if !args.iter().any(|a| a == "--ignored") {
+            println!("no_alloc_witness: test");
+        }
+        return;
+    }
+
+    println!("no-alloc witness:");
+
+    witness_atomic_interface_handle();
+    witness_static_e2e_handle_reads();
+    witness_static_e2e_handle_protect_check();
+    witness_static_channels_first_claim();
+    witness_static_channels_oneshot();
+    witness_static_channels_oneshot_recv();
+
+    println!("all witnesses passed");
+}
diff --git a/tests/static_channels_alloc_witness.rs b/tests/static_channels_alloc_witness.rs
new file mode 100644
index 0000000..6db9ea5
--- /dev/null
+++ b/tests/static_channels_alloc_witness.rs
@@ -0,0 +1,336 @@
+//! Allocation witness: prove that the static-pool [`ChannelFactory`]
+//! generated by [`define_static_channels!`] does not invoke the global
+//! allocator on the request/response hot path.
+//!
+//! [`ChannelFactory`]: simple_someip::transport::ChannelFactory
+//! [`define_static_channels!`]: simple_someip::define_static_channels
+//!
+//! # What this test asserts
+//!
+//! 1. `Client::new_with_deps` is allowed to allocate — the std-flavored
+//!    `Arc<Mutex<E2ERegistry>>` and `Arc<RwLock<Ipv4Addr>>` handles
+//!    used here, plus tokio's task-spawning machinery, all heap-backed.
+//!    The strategic-goal claim is "zero heap **after** `Client::new`
+//!    returns," not "zero heap, period."
+//! 2. After construction, calling [`Client::interface`] (a pure handle
+//!    read) does not allocate.
+//! 3. After construction, claiming + dropping a oneshot through the
+//!    macro-declared static pool does not allocate. This is the
+//!    direct witness for the strategic-goal claim about per-call
+//!    channel storage.
+//!
+//! # Why a counting allocator and not a panicking one
+//!
+//! The design specifies a `#[global_allocator]` shim that **panics**
+//! on allocation after `Client::new` returns. That requires a no-alloc
+//! test executor (tokio's runtime allocates on its own), no-alloc
+//! `Spawner` impl for the per-socket loops, and stack-based
+//! `E2ERegistryHandle` / `InterfaceHandle` impls. Each of those is a
+//! real piece of work and lives under the CI harness umbrella.
+//!
+//! The counting allocator here is a softer witness: it instruments
+//! every allocation through a [`std::sync::atomic::AtomicUsize`]
+//! counter and checks the delta across specific operations. It
+//! catches regressions where a channel construction starts heap-
+//! allocating; it does not catch "tokio runtime allocated to drive
+//! a sleep" because that allocation is acceptable in the host-test
+//! context. The panicking harness will catch both.
+#![cfg(all(feature = "client", feature = "bare_metal"))]
+
+use core::future::Future;
+use core::net::{Ipv4Addr, SocketAddrV4};
+use core::pin::Pin;
+use core::task::{Context, Poll};
+use core::time::Duration;
+use std::alloc::{GlobalAlloc, Layout, System};
+use std::collections::VecDeque;
+use std::sync::atomic::{AtomicUsize, Ordering};
+use std::sync::{Arc, Mutex};
+
+use simple_someip::client::Error as ClientError;
+use simple_someip::client::{ClientUpdate, ControlMessage, ReceivedMessage, SendMessage};
+use simple_someip::define_static_channels;
+use simple_someip::e2e::E2ERegistry;
+use simple_someip::protocol::sd::RebootFlag;
+use simple_someip::transport::{
+    ChannelFactory, OneshotSend, ReceivedDatagram, SocketOptions, Spawner, Timer, TransportError,
+    TransportFactory, TransportSocket,
+};
+use simple_someip::{Client, ClientDeps, RawPayload};
+
+// ── Counting global allocator ─────────────────────────────────────────
+
+static ALLOC_COUNT: AtomicUsize = AtomicUsize::new(0);
+
+/// Serializes the alloc-measurement region across `#[tokio::test]`s in
+/// this file. Without it, parallel test execution would interleave
+/// allocations from one test into another's `(baseline, end)` window.
+static MEASURE_LOCK: Mutex<()> = Mutex::new(());
+
+struct CountingAllocator;
+
+unsafe impl GlobalAlloc for CountingAllocator {
+    unsafe fn alloc(&self, layout: Layout) -> *mut u8 {
+        ALLOC_COUNT.fetch_add(1, Ordering::Relaxed);
+        // SAFETY: forwarding to System with caller's layout
+        // contract preserved.
+        unsafe { System.alloc(layout) }
+    }
+    unsafe fn dealloc(&self, ptr: *mut u8, layout: Layout) {
+        // SAFETY: forwarding to System; ptr/layout came from System::alloc
+        // (we only delegate forward).
+        unsafe { System.dealloc(ptr, layout) }
+    }
+    unsafe fn alloc_zeroed(&self, layout: Layout) -> *mut u8 {
+        ALLOC_COUNT.fetch_add(1, Ordering::Relaxed);
+        // SAFETY: forwarding to System.
+        unsafe { System.alloc_zeroed(layout) }
+    }
+    unsafe fn realloc(&self, ptr: *mut u8, layout: Layout, new_size: usize) -> *mut u8 {
+        ALLOC_COUNT.fetch_add(1, Ordering::Relaxed);
+        // SAFETY: forwarding to System; ptr/layout/new_size invariants
+        // upheld by caller.
+        unsafe { System.realloc(ptr, layout, new_size) }
+    }
+}
+
+#[global_allocator]
+static GLOBAL: CountingAllocator = CountingAllocator;
+
+fn alloc_count() -> usize {
+    ALLOC_COUNT.load(Ordering::Relaxed)
+}
+
+// ── Static channels declaration ───────────────────────────────────────
+
+define_static_channels! {
+    name: WitnessChannels,
+    oneshot: [
+        (Result<(), ClientError>, 8),
+        (Result<RawPayload, ClientError>, 4),
+        (Result<RebootFlag, ClientError>, 4),
+    ],
+    bounded: [
+        ((ControlMessage<RawPayload, WitnessChannels>, 4), 1),
+        ((SendMessage<RawPayload, WitnessChannels>, 16), 4),
+        ((Result<ReceivedMessage<RawPayload>, ClientError>, 16), 4),
+    ],
+    unbounded: [
+        (ClientUpdate<RawPayload>, 1),
+    ],
+}
+
+// ── Mock transport (mirrors tests/bare_metal_client.rs) ───────────────
+
+#[derive(Default)]
+struct MockPipe {
+    sent: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound: Mutex<VecDeque<(Vec<u8>, SocketAddrV4)>>,
+    inbound_waker: Mutex<Option<core::task::Waker>>,
+}
+
+#[derive(Clone)]
+struct MockFactory {
+    pipe: Arc<MockPipe>,
+    local_port: Arc<Mutex<u16>>,
+}
+
+impl TransportFactory for MockFactory {
+    type Socket = MockSocket;
+    type BindFuture<'a> = core::future::Ready<Result<Self::Socket, TransportError>>;
+    fn bind<'a>(&'a self, addr: SocketAddrV4, _options: &'a SocketOptions) -> Self::BindFuture<'a> {
+        let pipe = Arc::clone(&self.pipe);
+        let mut p = self.local_port.lock().unwrap();
+        let port = if addr.port() == 0 {
+            let next = *p + 1;
+            *p = next;
+            30000 + next
+        } else {
+            addr.port()
+        };
+        let local = SocketAddrV4::new(*addr.ip(), port);
+        core::future::ready(Ok(MockSocket { pipe, local }))
+    }
+}
+
+struct MockSocket {
+    pipe: Arc<MockPipe>,
+    local: SocketAddrV4,
+}
+
+struct MockSendFut {
+    pipe: Arc<MockPipe>,
+    bytes: Option<Vec<u8>>,
+    target: SocketAddrV4,
+}
+
+impl Future for MockSendFut {
+    type Output = Result<(), TransportError>;
+    fn poll(self: Pin<&mut Self>, _cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        if let Some(bytes) = me.bytes.take() {
+            me.pipe.sent.lock().unwrap().push_back((bytes, me.target));
+        }
+        Poll::Ready(Ok(()))
+    }
+}
+
+struct MockRecvFut<'a> {
+    pipe: Arc<MockPipe>,
+    buf: &'a mut [u8],
+}
+
+impl Future for MockRecvFut<'_> {
+    type Output = Result<ReceivedDatagram, TransportError>;
+    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
+        let me = self.get_mut();
+        let entry = me.pipe.inbound.lock().unwrap().pop_front();
+        match entry {
+            Some((bytes, source)) => {
+                let n = bytes.len().min(me.buf.len());
+                me.buf[..n].copy_from_slice(&bytes[..n]);
+                Poll::Ready(Ok(ReceivedDatagram {
+                    bytes_received: n,
+                    source,
+                    truncated: n < bytes.len(),
+                }))
+            }
+            None => {
+                *me.pipe.inbound_waker.lock().unwrap() = Some(cx.waker().clone());
+                if let Some((bytes, source)) = me.pipe.inbound.lock().unwrap().pop_front() {
+                    let n = bytes.len().min(me.buf.len());
+                    me.buf[..n].copy_from_slice(&bytes[..n]);
+                    return Poll::Ready(Ok(ReceivedDatagram {
+                        bytes_received: n,
+                        source,
+                        truncated: n < bytes.len(),
+                    }));
+                }
+                Poll::Pending
+            }
+        }
+    }
+}
+
+impl TransportSocket for MockSocket {
+    type SendFuture<'a> = MockSendFut;
+    type RecvFuture<'a> = MockRecvFut<'a>;
+
+    fn send_to<'a>(&'a self, buf: &'a [u8], target: SocketAddrV4) -> Self::SendFuture<'a> {
+        MockSendFut {
+            pipe: Arc::clone(&self.pipe),
+            bytes: Some(buf.to_vec()),
+            target,
+        }
+    }
+
+    fn recv_from<'a>(&'a self, buf: &'a mut [u8]) -> Self::RecvFuture<'a> {
+        MockRecvFut {
+            pipe: Arc::clone(&self.pipe),
+            buf,
+        }
+    }
+
+    fn local_addr(&self) -> Result<SocketAddrV4, TransportError> {
+        Ok(self.local)
+    }
+
+    fn join_multicast_v4(&self, _g: Ipv4Addr, _i: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+    fn leave_multicast_v4(&self, _g: Ipv4Addr, _i: Ipv4Addr) -> Result<(), TransportError> {
+        Ok(())
+    }
+}
+
+struct MockTimer;
+impl Timer for MockTimer {
+    type SleepFuture<'a> = core::pin::Pin<Box<dyn Future<Output = ()> + Send + 'a>>;
+    fn sleep(&self, duration: Duration) -> Self::SleepFuture<'_> {
+        Box::pin(async move {
+            tokio::time::sleep(duration).await;
+        })
+    }
+}
+
+struct TokioBackedSpawner;
+impl Spawner for TokioBackedSpawner {
+    fn spawn(&self, future: impl Future<Output = ()> + Send + 'static) {
+        drop(tokio::spawn(future));
+    }
+}
+
+// ── Witnesses ─────────────────────────────────────────────────────────
+
+#[tokio::test]
+async fn no_alloc_when_claiming_oneshot_through_static_pool() {
+    let _guard = MEASURE_LOCK.lock().unwrap();
+    // Warm any one-time tokio-runtime / first-claim seeding allocations
+    // before measuring.
+    {
+        let (tx, _rx) = WitnessChannels::oneshot::<Result<(), ClientError>>();
+        tx.send(Ok(())).unwrap();
+    }
+
+    let baseline = alloc_count();
+    {
+        // A second claim/release cycle must not allocate. The pool is
+        // already seeded; the slot returned from the first claim is on
+        // the free list.
+        let (tx, _rx) = WitnessChannels::oneshot::<Result<(), ClientError>>();
+        tx.send(Ok(())).unwrap();
+    }
+    let delta = alloc_count() - baseline;
+    assert_eq!(
+        delta, 0,
+        "static-pool oneshot claim/release allocated {delta} times \
+         after warm-up; expected zero",
+    );
+}
+
+#[tokio::test]
+async fn client_interface_read_after_construction_does_not_allocate() {
+    let pipe = Arc::new(MockPipe::default());
+    let factory = MockFactory {
+        pipe: Arc::clone(&pipe),
+        local_port: Arc::new(Mutex::new(0)),
+    };
+    let interface_handle: Arc<std::sync::RwLock<Ipv4Addr>> =
+        Arc::new(std::sync::RwLock::new(Ipv4Addr::LOCALHOST));
+    let e2e_handle: Arc<Mutex<E2ERegistry>> = Arc::new(Mutex::new(E2ERegistry::new()));
+
+    let (client, _updates, run_fut) = Client::<
+        RawPayload,
+        Arc<Mutex<E2ERegistry>>,
+        Arc<std::sync::RwLock<Ipv4Addr>>,
+        WitnessChannels,
+    >::new_with_deps(
+        ClientDeps {
+            factory,
+            spawner: TokioBackedSpawner,
+            timer: MockTimer,
+            e2e_registry: e2e_handle,
+            interface: interface_handle,
+        },
+        false,
+    );
+    let run_handle = tokio::spawn(run_fut);
+
+    // After construction (and after a yield to give the spawn loop a
+    // chance to do its one-time setup allocs), measure pure-handle
+    // operations under the serialization lock.
+    tokio::task::yield_now().await;
+    let _guard = MEASURE_LOCK.lock().unwrap();
+    let baseline = alloc_count();
+    for _ in 0..16 {
+        assert_eq!(client.interface(), Ipv4Addr::LOCALHOST);
+    }
+    let delta = alloc_count() - baseline;
+    assert_eq!(
+        delta, 0,
+        "Client::interface() x16 allocated {delta} times; expected zero",
+    );
+
+    run_handle.abort();
+    drop(client);
+}